diff --git a/.github/CODEOWNERS b/.github/CODEOWNERS index 5033ca6483..fc1636b743 100755 --- a/.github/CODEOWNERS +++ b/.github/CODEOWNERS @@ -5,6 +5,7 @@ /AgentQnA/ abolfazl.shahbazi@intel.com kaokao.lv@intel.com minmin.hou@intel.com xinyu.ye@intel.com /AudioQnA/ sihan.chen@intel.com wenjiao.yue@intel.com /AvatarChatbot/ chun.tao@intel.com kaokao.lv@intel.com xinyu.ye@intel.com +/BrowserUseAgent/ letong.han@intel.com yi.a.yao@intel.com /ChatQnA/ liang1.lv@intel.com letong.han@intel.com /CodeGen/ liang1.lv@intel.com qing.yao@intel.com /CodeTrans/ sihan.chen@intel.com letong.han@intel.com diff --git a/.github/code_spell_ignore.txt b/.github/code_spell_ignore.txt index c72099bfd8..49716a1268 100644 --- a/.github/code_spell_ignore.txt +++ b/.github/code_spell_ignore.txt @@ -1,4 +1,5 @@ ModelIn modelin pressEnter -PromptIn \ No newline at end of file +PromptIn +OT \ No newline at end of file diff --git a/.github/env/_build_image.sh b/.github/env/_build_image.sh deleted file mode 100644 index 61b0d902ed..0000000000 --- a/.github/env/_build_image.sh +++ /dev/null @@ -1,6 +0,0 @@ -#!/bin/bash -# Copyright (C) 2025 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -export VLLM_VER=v0.10.0 -export VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0 diff --git a/.github/workflows/_build_image.yml b/.github/workflows/_build_image.yml index a91c522847..09c698a427 100644 --- a/.github/workflows/_build_image.yml +++ b/.github/workflows/_build_image.yml @@ -78,7 +78,7 @@ jobs: fi - name: Checkout out GenAIExamples - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: ref: ${{ env.CHECKOUT_REF }} fetch-depth: 0 @@ -87,13 +87,6 @@ jobs: run: | cd ${{ github.workspace }}/${{ inputs.example }}/docker_image_build docker_compose_path=${{ github.workspace }}/${{ inputs.example }}/docker_image_build/build.yaml - source ${{ github.workspace }}/.github/env/_build_image.sh - if [[ $(grep -c "vllm:" ${docker_compose_path}) != 0 ]]; then - git clone -b ${VLLM_VER} --single-branch https://github.com/vllm-project/vllm.git - fi - if [[ $(grep -c "vllm-gaudi:" ${docker_compose_path}) != 0 ]]; then - git clone -b ${VLLM_FORK_VER} --single-branch https://github.com/HabanaAI/vllm-fork.git - fi git clone --depth 1 --branch ${{ inputs.opea_branch }} https://github.com/opea-project/GenAIComps.git cd GenAIComps && git rev-parse HEAD && cd ../ diff --git a/.github/workflows/_get-image-list.yml b/.github/workflows/_get-image-list.yml index 0061070762..7f8e785cc7 100644 --- a/.github/workflows/_get-image-list.yml +++ b/.github/workflows/_get-image-list.yml @@ -31,10 +31,10 @@ jobs: run_matrix: ${{ steps.get-matrix.outputs.run_matrix }} steps: - name: Checkout out Repo - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 - name: Checkout GenAIComps Repository - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: repository: opea-project/GenAIComps path: GenAIComps @@ -45,7 +45,7 @@ jobs: image_list=[] run_matrix="{\"include\":[" if [[ ! 
-z "${{ inputs.examples }}" ]]; then - pip install yq + pip install yq==3.4.3 examples=($(echo ${{ inputs.examples }} | tr ',' ' ')) for example in ${examples[@]} do diff --git a/.github/workflows/_get-test-matrix.yml b/.github/workflows/_get-test-matrix.yml index 6608884eae..f710564d2d 100644 --- a/.github/workflows/_get-test-matrix.yml +++ b/.github/workflows/_get-test-matrix.yml @@ -47,7 +47,7 @@ jobs: echo "checkout ref ${{ env.CHECKOUT_REF }}" - name: Checkout out Repo - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: ref: ${{ env.CHECKOUT_REF }} fetch-depth: 0 diff --git a/.github/workflows/_helm-e2e.yml b/.github/workflows/_helm-e2e.yml index 3bc03826c5..f05f046cdc 100644 --- a/.github/workflows/_helm-e2e.yml +++ b/.github/workflows/_helm-e2e.yml @@ -55,7 +55,7 @@ jobs: echo "checkout ref ${CHECKOUT_REF}" - name: Checkout Repo - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: ref: ${{ steps.get-checkout-ref.outputs.CHECKOUT_REF }} fetch-depth: 0 @@ -128,7 +128,7 @@ jobs: echo "checkout ref ${CHECKOUT_REF}" - name: Checkout Repo - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: ref: ${{ steps.get-checkout-ref.outputs.CHECKOUT_REF }} fetch-depth: 0 diff --git a/.github/workflows/_run-docker-compose.yml b/.github/workflows/_run-docker-compose.yml index 33efac6c0e..b8fb7ff6e4 100644 --- a/.github/workflows/_run-docker-compose.yml +++ b/.github/workflows/_run-docker-compose.yml @@ -61,7 +61,7 @@ jobs: echo "checkout ref ${CHECKOUT_REF}" - name: Checkout out Repo - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: ref: ${{ steps.get-checkout-ref.outputs.CHECKOUT_REF }} fetch-depth: 0 @@ -69,17 +69,19 @@ jobs: - name: Get test matrix shell: bash id: test-case-matrix + env: + HARDWARE: ${{ inputs.hardware }} run: | example_l=$(echo ${{ inputs.example }} | tr '[:upper:]' '[:lower:]') cd ${{ github.workspace }}/${{ inputs.example }}/tests run_test_cases="" - if [[ "${{ inputs.hardware }}" == "gaudi"* ]]; then + if [[ "$HARDWARE" == "gaudi"* ]]; then hardware="gaudi" - elif [[ "${{ inputs.hardware }}" == "xeon"* ]]; then + elif [[ "$HARDWARE" == "xeon"* ]]; then hardware="xeon" else - hardware="${{ inputs.hardware }}" + hardware="$HARDWARE" fi default_test_case=$(find . -type f -name "test_compose_on_$hardware.sh" | cut -d/ -f2) if [ "$default_test_case" ]; then run_test_cases="$default_test_case"; fi @@ -110,6 +112,13 @@ jobs: run_test_cases=$other_test_cases fi + if [[ "$hardware" == "xeon"* ]]; then + if [ -f "${{ github.workspace }}/${{ inputs.example }}/tests/test_ui_on_xeon.sh" ]; then + run_test_cases="$run_test_cases test_ui_on_xeon.sh"; + elif [ -f "${{ github.workspace }}/${{ inputs.example }}/tests/test_ui_on_gaudi.sh" ]; then + run_test_cases="$run_test_cases test_ui_on_gaudi.sh"; + fi + fi test_cases=$(echo $run_test_cases | tr ' ' '\n' | sort -u | jq -R '.' 
| jq -sc '.') echo "test_cases=$test_cases" echo "test_cases=$test_cases" >> $GITHUB_OUTPUT @@ -141,7 +150,7 @@ jobs: docker images - name: Checkout out Repo - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: ref: ${{ needs.get-test-case.outputs.CHECKOUT_REF }} fetch-depth: 0 @@ -234,7 +243,7 @@ jobs: - name: Publish pipeline artifact if: ${{ !cancelled() }} - uses: actions/upload-artifact@v4 + uses: actions/upload-artifact@c7d193f32edcb7bfad88892161225aeda64e9392 with: name: ${{ inputs.hardware }}_${{ inputs.example }}_${{ matrix.test_case }} path: ${{ github.workspace }}/${{ inputs.example }}/tests/*.log diff --git a/.github/workflows/_run-one-click.yml b/.github/workflows/_run-one-click.yml index a44822e2d2..78527d5938 100644 --- a/.github/workflows/_run-one-click.yml +++ b/.github/workflows/_run-one-click.yml @@ -27,6 +27,10 @@ on: description: 'Test examples with docker compose or k8s charts' required: true type: string + os: + description: OS to run the test on + required: true + type: string hardware: description: Hardware to run the test on required: true @@ -56,7 +60,7 @@ jobs: - name: Checkout out Repo if: ${{ inputs.deploy_method == 'docker' }} - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: fetch-depth: 0 @@ -90,7 +94,7 @@ jobs: - name: Checkout out Repo if: ${{ inputs.deploy_method == 'k8s' }} - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: fetch-depth: 0 @@ -103,7 +107,8 @@ jobs: INPUT_DATA=$( jq -r --arg type "${{ inputs.deploy_method }}" --arg id "${{ inputs.example }}" \ '.[$type][$id].inputs.clear[]' ${{ github.workspace }}/.github/workflows/one-click-inputs-nobuild.json | \ - sed "s/\$hardware/${{ inputs.hardware }}/g" + sed "s|\$hardware|${{ inputs.hardware }}|g; \ + s|\$os|${{ inputs.os }}|g" ) echo "Generated input:" echo "$INPUT_DATA" @@ -122,20 +127,11 @@ jobs: id: get-default-params if: ${{ inputs.deploy_method == 'k8s' }} run: | - cd ${{ github.workspace }} - example=$(echo "${{ inputs.example }}" | cut -d'-' -f1) - PARAMS_JSON=$(python3 .github/workflows/scripts/get-params.py $example) - echo "LLM_model=$(echo "$PARAMS_JSON" | jq -r '.llm_model')" >> $GITHUB_ENV - if [ "$example" = "ChatQnA" ]; then - echo "LLM_model=$(echo "$PARAMS_JSON" | jq -r '.llm_model')" >> $GITHUB_ENV - echo "Embedding_model=$(echo "$PARAMS_JSON" | jq -r '.embed_model')" >> $GITHUB_ENV - echo "Reranking_model=$(echo "$PARAMS_JSON" | jq -r '.rerank_model')" >> $GITHUB_ENV - echo "Mount_dir=$(echo "$PARAMS_JSON" | jq -r '.mount_dir')" >> $GITHUB_ENV - elif [ "$example" = "VisualQnA" ]; then - echo "LVM_model=$(echo "$PARAMS_JSON" | jq -r '.lvm_model')" >> $GITHUB_ENV - elif [ "$example" = "AgentQnA" ]; then - echo "LLM_model=$(echo "$PARAMS_JSON" | jq -r '.gaudi.llm_model')" >> $GITHUB_ENV - fi + echo "LLM_model=" >> $GITHUB_ENV + echo "Embedding_model=" >> $GITHUB_ENV + echo "Reranking_model=" >> $GITHUB_ENV + echo "Mount_dir=" >> $GITHUB_ENV + echo "LVM_model=" >> $GITHUB_ENV - name: deploy and test shell: bash @@ -157,7 +153,7 @@ jobs: LVM_model: ${{ env.LVM_model }} run: | cd ${{ github.workspace }}/one_click_deploy - python3 -m pip install -r requirements.txt + python3 -m pip install --require-hashes -r requirements.txt if [ "${{ inputs.deploy_method }}" = "k8s" ]; then export OPEA_K8S_VLLM_SKIP_WARMUP=TRUE @@ -168,6 +164,7 @@ jobs: jq -r --arg type "${{ inputs.deploy_method }}" --arg id "${{ inputs.example }}" \ 
'.[$type][$id].inputs.deploy[]' ${{ github.workspace }}/.github/workflows/one-click-inputs-nobuild.json | \ sed "s|\$hardware|${{ inputs.hardware }}|g; \ + s|\$os|${{ inputs.os }}|g; \ s|\$HF_TOKEN|$HF_TOKEN|g; \ s|\$LLM_model|$LLM_model|g; \ s|\$Embedding_model|$Embedding_model|g; \ @@ -196,7 +193,8 @@ jobs: INPUT_DATA=$( jq -r --arg type "${{ inputs.deploy_method }}" --arg id "${{ inputs.example }}" \ '.[$type][$id].inputs.clear[]' ${{ github.workspace }}/.github/workflows/one-click-inputs-nobuild.json | \ - sed "s/\$hardware/${{ inputs.hardware }}/g" + sed "s|\$hardware|${{ inputs.hardware }}|g; \ + s|\$os|${{ inputs.os }}|g" ) echo "Generated input:" echo "$INPUT_DATA" @@ -207,7 +205,7 @@ jobs: - name: Publish pipeline artifact if: ${{ !cancelled() }} - uses: actions/upload-artifact@v4 + uses: actions/upload-artifact@c7d193f32edcb7bfad88892161225aeda64e9392 with: name: ${{ inputs.deploy_method }} path: ${{ github.workspace }}/${{ inputs.deploy_method }}-tests/test-results.log diff --git a/.github/workflows/_trivy-scan.yml b/.github/workflows/_trivy-scan.yml index 0ad85891ea..c90d74350b 100644 --- a/.github/workflows/_trivy-scan.yml +++ b/.github/workflows/_trivy-scan.yml @@ -43,20 +43,13 @@ jobs: sudo rm -rf ${{github.workspace}}/* || true docker system prune -f - name: Checkout out Repo - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 - name: Install Dependencies run: | sudo apt-get update sudo apt-get install -y jq - name: Clone Required Repo run: | - source ${{ github.workspace }}/.github/env/_build_image.sh - if [[ "${{ inputs.image }}" == "vllm" ]]; then - git clone -b ${VLLM_VER} --single-branch https://github.com/vllm-project/vllm.git - fi - if [[ "${{ inputs.image }}" == "vllm-gaudi" ]]; then - git clone -b ${VLLM_FORK_VER} --single-branch https://github.com/HabanaAI/vllm-fork.git - fi git clone --depth 1 https://github.com/opea-project/GenAIComps.git cd GenAIComps && git rev-parse HEAD && cd ../ - name: Pull Image @@ -98,7 +91,7 @@ jobs: shell: bash - name: Security Scan Container - uses: aquasecurity/trivy-action@0.24.0 + uses: aquasecurity/trivy-action@6e7b7d1fd3e4fef0c5fa8cce1229c54b2c9bd0d8 if: ${{ inputs.trivy_scan }} with: image-ref: ${{ env.OPEA_IMAGE_REPO }}opea/${{ inputs.image }}:${{ inputs.tag }} diff --git a/.github/workflows/check-online-doc-build.yml b/.github/workflows/check-online-doc-build.yml index fecb227503..3a3db1c4c8 100644 --- a/.github/workflows/check-online-doc-build.yml +++ b/.github/workflows/check-online-doc-build.yml @@ -17,12 +17,12 @@ jobs: steps: - name: Checkout - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: path: GenAIExamples - name: Checkout docs - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: repository: opea-project/docs path: docs diff --git a/.github/workflows/daily-update-vllm-version.yml b/.github/workflows/daily-update-vllm-version.yml.disabled similarity index 98% rename from .github/workflows/daily-update-vllm-version.yml rename to .github/workflows/daily-update-vllm-version.yml.disabled index 0263c75239..ea579157e0 100644 --- a/.github/workflows/daily-update-vllm-version.yml +++ b/.github/workflows/daily-update-vllm-version.yml.disabled @@ -32,7 +32,7 @@ jobs: fail-fast: false steps: - name: Checkout repository - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: fetch-depth: 0 ref: ${{ github.ref }} diff --git 
a/.github/workflows/docker/code-scan.dockerfile b/.github/workflows/docker/code-scan.dockerfile index 73fad03a26..0a91d86320 100644 --- a/.github/workflows/docker/code-scan.dockerfile +++ b/.github/workflows/docker/code-scan.dockerfile @@ -1,8 +1,8 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 -ARG UBUNTU_VER=22.04 -FROM ubuntu:${UBUNTU_VER} as devel +# ARG UBUNTU_VER=22.04 +FROM ubuntu@sha256:4e0171b9275e12d375863f2b3ae9ce00a4c53ddda176bd55868df97ac6f21a6e as devel ENV LANG=C.UTF-8 diff --git a/.github/workflows/dockerhub-description.yml b/.github/workflows/dockerhub-description.yml index 296f464f47..a737eb5399 100644 --- a/.github/workflows/dockerhub-description.yml +++ b/.github/workflows/dockerhub-description.yml @@ -84,25 +84,25 @@ jobs: fail-fast: false steps: - name: Checkout GenAIExamples - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: repository: opea-project/GenAIExamples path: GenAIExamples - name: Checkout GenAIComps - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: repository: opea-project/GenAIComps path: GenAIComps - name: Checkout vllm-openvino - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: repository: vllm-project/vllm path: vllm - name: Checkout vllm-gaudi - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: repository: HabanaAI/vllm-fork ref: habana_main diff --git a/.github/workflows/manual-docker-scan.yml b/.github/workflows/manual-docker-scan.yml index 4aec879c02..b4c0e26988 100644 --- a/.github/workflows/manual-docker-scan.yml +++ b/.github/workflows/manual-docker-scan.yml @@ -59,7 +59,7 @@ jobs: runs-on: "docker-build-${{ inputs.node }}" if: always() steps: - - uses: actions/upload-artifact@v4.3.4 + - uses: actions/upload-artifact@0b2256b8c012f0828dc542b3febcab082c67f72b with: name: trivy-scan-${{ inputs.tag }}-${{ github.run_number }} path: /tmp/scan-${{ inputs.tag }}-${{ github.run_number }}/*-trivy-scan.txt diff --git a/.github/workflows/manual-freeze-tag.yml b/.github/workflows/manual-freeze-tag.yml index 88c1bb6c85..bda0d134c4 100644 --- a/.github/workflows/manual-freeze-tag.yml +++ b/.github/workflows/manual-freeze-tag.yml @@ -3,7 +3,7 @@ name: Freeze OPEA images release tag permissions: - contents: read + contents: write on: workflow_dispatch: inputs: @@ -19,7 +19,7 @@ jobs: steps: - name: Checkout repository - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: fetch-depth: 0 ref: ${{ github.ref }} diff --git a/.github/workflows/manual-one-click-workflow.yml b/.github/workflows/manual-one-click-workflow.yml index 0463da0f19..a1aec74c40 100644 --- a/.github/workflows/manual-one-click-workflow.yml +++ b/.github/workflows/manual-one-click-workflow.yml @@ -24,6 +24,14 @@ on: description: "Tag to apply to images" required: true type: string + os: + default: "debian" + description: "OS to run the test on debian or openeuler" + type: choice + required: true + options: + - debian + - openeuler deploy_methods: default: "docker,k8s" description: 'Test examples with docker compose or k8s charts(exclude AgentQnA k8s on Xeon)' @@ -41,6 +49,7 @@ jobs: examples: ${{ steps.get-matrix.outputs.examples }} nodes: ${{ steps.get-matrix.outputs.nodes }} deploy_methods: ${{ steps.get-matrix.outputs.deploy_methods }} + OSs: ${{ steps.get-matrix.outputs.OSs }} steps: - name: Create Matrix id: get-matrix @@ 
-54,9 +63,13 @@ jobs: deploy_methods=($(echo ${{ inputs.deploy_methods }} | tr ',' ' ')) deploy_methods_json=$(printf '%s\n' "${deploy_methods[@]}" | sort -u | jq -R '.' | jq -sc '.') echo "deploy_methods=$deploy_methods_json" >> $GITHUB_OUTPUT + OSs=($(echo ${{ inputs.os }} | tr ',' ' ')) + OSs_json=$(printf '%s\n' "${OSs[@]}" | sort -u | jq -R '.' | jq -sc '.') + echo "OSs=$OSs_json" >> $GITHUB_OUTPUT echo "examples=$examples_json" echo "nodes=$nodes_json" echo "deploy_methods=$deploy_methods_json" + echo "OSs=$OSs_json" run-examples: # permissions: @@ -81,12 +94,14 @@ jobs: example: ${{ fromJson(needs.get-test-matrix.outputs.examples) }} hardware: ${{ fromJson(needs.get-test-matrix.outputs.nodes) }} deploy_method: ${{ fromJson(needs.get-test-matrix.outputs.deploy_methods) }} + os: ${{ fromJson(needs.get-test-matrix.outputs.OSs) }} fail-fast: false uses: ./.github/workflows/_run-one-click.yml with: hardware: ${{ matrix.hardware }} example: ${{ matrix.example }} deploy_method: ${{ matrix.deploy_method }} + os: ${{ matrix.os }} tag: ${{ inputs.tag }} registry: "opea" secrets: inherit diff --git a/.github/workflows/mix-trellix.yml b/.github/workflows/mix-trellix.yml index 65f18e6dbc..bad18fa631 100644 --- a/.github/workflows/mix-trellix.yml +++ b/.github/workflows/mix-trellix.yml @@ -17,7 +17,7 @@ jobs: run: sudo rm -rf ${{github.workspace}}/* - name: Checkout out Repo - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 - name: Run Trellix Scanner env: @@ -26,6 +26,6 @@ jobs: - name: Publish pipeline artifact if: ${{ !cancelled() }} - uses: actions/upload-artifact@v4 + uses: actions/upload-artifact@c7d193f32edcb7bfad88892161225aeda64e9392 with: path: ${{ github.workspace }}/.github/workflows/scripts/codeScan/report.html diff --git a/.github/workflows/one-click-inputs-nobuild.json b/.github/workflows/one-click-inputs-nobuild.json index e1fef7ea43..610b20f563 100644 --- a/.github/workflows/one-click-inputs-nobuild.json +++ b/.github/workflows/one-click-inputs-nobuild.json @@ -7,6 +7,7 @@ "1", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -21,7 +22,7 @@ "y", "Y" ], - "clear": ["1", "1", "2", "docker", "$hardware", "Y"] + "clear": ["1", "1", "2", "docker", "$os", "$hardware", "Y"] } }, "ChatQnA-Qwen": { @@ -31,6 +32,7 @@ "1", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -45,7 +47,7 @@ "y", "Y" ], - "clear": ["1", "1", "2", "docker", "$hardware", "Y"] + "clear": ["1", "1", "2", "docker", "$os", "$hardware", "Y"] } }, "CodeTrans": { @@ -55,6 +57,7 @@ "1", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -66,7 +69,7 @@ "y", "Y" ], - "clear": ["2", "1", "2", "docker", "$hardware", "Y"] + "clear": ["2", "1", "2", "docker", "$os", "$hardware", "Y"] } }, "DocSum": { @@ -76,6 +79,7 @@ "1", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -87,7 +91,7 @@ "y", "Y" ], - "clear": ["3", "1", "2", "docker", "$hardware", "Y"] + "clear": ["3", "1", "2", "docker", "$os", "$hardware", "Y"] } }, "CodeGen": { @@ -97,6 +101,7 @@ "1", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -108,7 +113,7 @@ "y", "Y" ], - "clear": ["4", "1", "2", "docker", "$hardware", "Y"] + "clear": ["4", "1", "2", "docker", "$os", "$hardware", "Y"] } }, "AudioQnA": { @@ -118,6 +123,7 @@ "1", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -129,7 +135,7 @@ "y", "Y" ], - "clear": ["5", "1", "2", "docker", "$hardware", "Y"] + "clear": ["5", "1", "2", "docker", "$os", "$hardware", 
"Y"] } }, "VisualQnA": { @@ -139,6 +145,7 @@ "1", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -150,7 +157,7 @@ "y", "Y" ], - "clear": ["6", "1", "2", "docker", "$hardware", "Y"] + "clear": ["6", "1", "2", "docker", "$os", "$hardware", "Y"] } }, "FaqGen": { @@ -160,6 +167,7 @@ "1", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -171,7 +179,7 @@ "y", "Y" ], - "clear": ["7", "1", "2", "docker", "$hardware", "Y"] + "clear": ["7", "1", "2", "docker", "$os", "$hardware", "Y"] } }, "AgentQnA": { @@ -181,6 +189,7 @@ "1", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -193,7 +202,7 @@ "y", "Y" ], - "clear": ["8", "1", "2", "docker", "$hardware", "Y"] + "clear": ["8", "1", "2", "docker", "$os", "$hardware", "Y"] } } }, @@ -205,6 +214,7 @@ "1", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -219,7 +229,7 @@ "8080", "Y" ], - "clear": ["1", "1", "2", "k8s", "y", "Y"] + "clear": ["1", "1", "2", "k8s", "$os", "y", "Y"] } }, "ChatQnA-Qwen": { @@ -229,6 +239,7 @@ "1", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -243,7 +254,7 @@ "8080", "Y" ], - "clear": ["1", "1", "2", "k8s", "y", "Y"] + "clear": ["1", "1", "2", "k8s", "$os", "y", "Y"] } }, "CodeTrans": { @@ -253,6 +264,7 @@ "1", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -265,7 +277,7 @@ "8080", "Y" ], - "clear": ["2", "1", "2", "k8s", "y", "Y"] + "clear": ["2", "1", "2", "k8s", "$os", "y", "Y"] } }, "DocSum": { @@ -275,6 +287,7 @@ "1", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -287,7 +300,7 @@ "8080", "Y" ], - "clear": ["3", "1", "2", "k8s", "y", "Y"] + "clear": ["3", "1", "2", "k8s", "$os", "y", "Y"] } }, "CodeGen": { @@ -297,6 +310,7 @@ "1", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -309,7 +323,7 @@ "8080", "Y" ], - "clear": ["4", "1", "2", "k8s", "y", "Y"] + "clear": ["4", "1", "2", "k8s", "$os", "y", "Y"] } }, "AudioQnA": { @@ -319,6 +333,7 @@ "1", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -331,7 +346,7 @@ "8080", "Y" ], - "clear": ["5", "1", "2", "k8s", "y", "Y"] + "clear": ["5", "1", "2", "k8s", "$os", "y", "Y"] } }, "VisualQnA": { @@ -341,6 +356,7 @@ "1", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -353,7 +369,7 @@ "8080", "Y" ], - "clear": ["6", "1", "2", "k8s", "y", "Y"] + "clear": ["6", "1", "2", "k8s", "$os", "y", "Y"] } }, "FaqGen": { @@ -363,6 +379,7 @@ "1", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -375,7 +392,7 @@ "8080", "Y" ], - "clear": ["7", "1", "2", "k8s", "y", "Y"] + "clear": ["7", "1", "2", "k8s", "$os", "y", "Y"] } }, "AgentQnA": { @@ -385,6 +402,7 @@ "1", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -398,7 +416,7 @@ "8080", "Y" ], - "clear": ["8", "1", "2", "k8s", "y", "Y"] + "clear": ["8", "1", "2", "k8s", "$os", "y", "Y"] } } } diff --git a/.github/workflows/one-click-inputs.json b/.github/workflows/one-click-inputs.json index dd2c516a2d..f42b163996 100644 --- a/.github/workflows/one-click-inputs.json +++ b/.github/workflows/one-click-inputs.json @@ -6,6 +6,7 @@ "1", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -22,7 +23,7 @@ "y", "Y" ], - "clear": ["1", "2", "docker", "$hardware", "Y"] + "clear": ["1", "2", "docker", "$os", "$hardware", "Y"] } }, "CodeTrans": { @@ -31,6 +32,7 @@ "2", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -44,7 +46,7 @@ "y", "Y" ], - "clear": ["2", "2", "docker", "$hardware", "Y"] + "clear": ["2", "2", 
"docker", "$os", "$hardware", "Y"] } }, "DocSum": { @@ -53,6 +55,7 @@ "3", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -66,7 +69,7 @@ "y", "Y" ], - "clear": ["3", "2", "docker", "$hardware", "Y"] + "clear": ["3", "2", "docker", "$os", "$hardware", "Y"] } }, "CodeGen": { @@ -75,6 +78,7 @@ "4", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -88,7 +92,7 @@ "y", "Y" ], - "clear": ["4", "2", "docker", "$hardware", "Y"] + "clear": ["4", "2", "docker", "$os", "$hardware", "Y"] } }, "AudioQnA": { @@ -97,6 +101,7 @@ "5", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -110,7 +115,7 @@ "y", "Y" ], - "clear": ["5", "2", "docker", "$hardware", "Y"] + "clear": ["5", "2", "docker", "$os", "$hardware", "Y"] } }, "VisualQnA": { @@ -119,6 +124,7 @@ "6", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -132,7 +138,7 @@ "y", "Y" ], - "clear": ["6", "2", "docker", "$hardware", "Y"] + "clear": ["6", "2", "docker", "$os", "$hardware", "Y"] } }, "FaqGen": { @@ -141,6 +147,7 @@ "7", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -154,7 +161,7 @@ "y", "Y" ], - "clear": ["7", "2", "docker", "$hardware", "Y"] + "clear": ["7", "2", "docker", "$os", "$hardware", "Y"] } }, "AgentQnA": { @@ -163,6 +170,7 @@ "8", "1", "docker", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -177,7 +185,7 @@ "y", "Y" ], - "clear": ["8", "2", "docker", "$hardware", "Y"] + "clear": ["8", "2", "docker", "$os", "$hardware", "Y"] } } }, @@ -188,6 +196,7 @@ "1", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -204,7 +213,7 @@ "8080", "Y" ], - "clear": ["1", "2", "k8s", "y", "Y"] + "clear": ["1", "2", "k8s", "$os", "y", "Y"] } }, "CodeTrans": { @@ -213,6 +222,7 @@ "2", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -227,7 +237,7 @@ "8080", "Y" ], - "clear": ["2", "2", "k8s", "y", "Y"] + "clear": ["2", "2", "k8s", "$os", "y", "Y"] } }, "DocSum": { @@ -236,6 +246,7 @@ "3", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -250,7 +261,7 @@ "8080", "Y" ], - "clear": ["3", "2", "k8s", "y", "Y"] + "clear": ["3", "2", "k8s", "$os", "y", "Y"] } }, "CodeGen": { @@ -259,6 +270,7 @@ "4", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -273,7 +285,7 @@ "8080", "Y" ], - "clear": ["4", "2", "k8s", "y", "Y"] + "clear": ["4", "2", "k8s", "$os", "y", "Y"] } }, "AudioQnA": { @@ -282,6 +294,7 @@ "5", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -296,7 +309,7 @@ "8080", "Y" ], - "clear": ["5", "2", "k8s", "y", "Y"] + "clear": ["5", "2", "k8s", "$os", "y", "Y"] } }, "VisualQnA": { @@ -305,6 +318,7 @@ "6", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -319,7 +333,7 @@ "8080", "Y" ], - "clear": ["6", "2", "k8s", "y", "Y"] + "clear": ["6", "2", "k8s", "$os", "y", "Y"] } }, "FaqGen": { @@ -328,6 +342,7 @@ "7", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -342,7 +357,7 @@ "8080", "Y" ], - "clear": ["7", "2", "k8s", "y", "Y"] + "clear": ["7", "2", "k8s", "$os", "y", "Y"] } }, "AgentQnA": { @@ -351,6 +366,7 @@ "8", "1", "k8s", + "$os", "$hardware", "$HF_TOKEN", "$http_proxy", @@ -366,7 +382,7 @@ "8080", "Y" ], - "clear": ["8", "2", "k8s", "y", "Y"] + "clear": ["8", "2", "k8s", "$os", "y", "Y"] } } } diff --git a/.github/workflows/pr-chart-e2e.yml b/.github/workflows/pr-chart-e2e.yml index 3990e5fce9..256151fb09 100644 --- a/.github/workflows/pr-chart-e2e.yml +++ b/.github/workflows/pr-chart-e2e.yml @@ -28,7 +28,7 @@ jobs: run_matrix: ${{ 
steps.get-test-matrix.outputs.run_matrix }} steps: - name: Checkout Repo - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: ref: "refs/pull/${{ github.event.number }}/merge" fetch-depth: 0 diff --git a/.github/workflows/pr-check-duplicated-image.yml b/.github/workflows/pr-check-duplicated-image.yml index 2922b8f4fe..8c39c64fd8 100644 --- a/.github/workflows/pr-check-duplicated-image.yml +++ b/.github/workflows/pr-check-duplicated-image.yml @@ -27,11 +27,11 @@ jobs: run: sudo rm -rf ${{github.workspace}}/* - name: Checkout Repo - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 - name: Check all the docker image build files run: | - pip install PyYAML + pip install PyYAML==6.0.3 cd ${{github.workspace}} build_files="" for f in `find . -path "*/docker_image_build/build.yaml"`; do diff --git a/.github/workflows/pr-code-scan.yml b/.github/workflows/pr-code-scan.yml index f64184c519..839c196311 100644 --- a/.github/workflows/pr-code-scan.yml +++ b/.github/workflows/pr-code-scan.yml @@ -34,7 +34,7 @@ jobs: fail-fast: false steps: - name: Checkout out Repo - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 - name: Check Dangerous Command Injection uses: opea-project/validation/actions/check-cmd@main @@ -62,7 +62,7 @@ jobs: - name: Publish pipeline artifact if: ${{ !cancelled() }} - uses: actions/upload-artifact@v4 + uses: actions/upload-artifact@c7d193f32edcb7bfad88892161225aeda64e9392 with: name: ${{ matrix.job_name }} path: ${{ github.workspace }}/.github/workflows/scripts/codeScan/${{ matrix.job_name }}.* @@ -74,7 +74,7 @@ jobs: contents: read steps: - name: Repository checkout - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: fetch-depth: 0 @@ -98,7 +98,7 @@ jobs: - name: ShellCheck # if: ${{ env.changed_files != '' }} if: steps.get-changed-files.outputs.changed_files_exist == 'true' - uses: ludeeus/action-shellcheck@2.0.0 + uses: ludeeus/action-shellcheck@00cae500b08a931fb5698e11e79bfbd38e612a38 env: SHELLCHECK_OPTS: -e SC2164 -e SC2154 -e SC2034 -e SC2155 -e SC1090 -e SC2153 -e SC2046 with: diff --git a/.github/workflows/pr-dependency-review.yml b/.github/workflows/pr-dependency-review.yml index 0867382269..01527452a8 100644 --- a/.github/workflows/pr-dependency-review.yml +++ b/.github/workflows/pr-dependency-review.yml @@ -13,7 +13,7 @@ jobs: pull-requests: write steps: - name: "Checkout Repository" - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 - name: Dependency Review uses: actions/dependency-review-action@v4 with: diff --git a/.github/workflows/pr-dockerfile-path-and-build-yaml-scan.yml b/.github/workflows/pr-dockerfile-path-and-build-yaml-scan.yml index 1894776d3f..7ecbd9ef09 100644 --- a/.github/workflows/pr-dockerfile-path-and-build-yaml-scan.yml +++ b/.github/workflows/pr-dockerfile-path-and-build-yaml-scan.yml @@ -17,7 +17,7 @@ jobs: run: sudo rm -rf ${{github.workspace}}/* - name: Checkout Repo GenAIExamples - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 - name: Clone Repo GenAIComps run: | @@ -50,7 +50,7 @@ jobs: run: sudo rm -rf ${{github.workspace}}/* - name: Checkout Repo GenAIExamples - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: fetch-depth: 0 @@ -85,11 +85,11 @@ jobs: run: sudo rm -rf ${{github.workspace}}/* - name: Checkout Repo GenAIExamples - 
uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 - name: Check name agreement in build.yaml run: | - pip install ruamel.yaml + pip install ruamel.yaml==0.18.6 cd ${{github.workspace}} consistency="TRUE" build_yamls=$(find . -name 'build.yaml') diff --git a/.github/workflows/pr-image-size.yml b/.github/workflows/pr-image-size.yml index bbed2b0d88..ffd432c7bd 100644 --- a/.github/workflows/pr-image-size.yml +++ b/.github/workflows/pr-image-size.yml @@ -23,7 +23,7 @@ jobs: files: ${{ steps.changed-dockerfiles.outputs.files }} steps: - name: Checkout PR branch - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: fetch-depth: 0 @@ -46,16 +46,16 @@ jobs: matrix: dockerfile: ${{ fromJson(needs.get-check-list.outputs.files) }} fail-fast: false - # outputs: - # comments: ${{ steps.build-check.outputs.comment_message }} + outputs: + skip: ${{ steps.build-check.outputs.skip }} steps: - name: Checkout PR branch - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: fetch-depth: 0 - name: Set up Docker Buildx - uses: docker/setup-buildx-action@v3 + uses: docker/setup-buildx-action@d70bba72b1f3fd22344832f00baa16ece964efeb - name: Build and check image sizes id: build-check @@ -92,7 +92,11 @@ jobs: echo "Building base image for $dockerfile" git checkout ${{ github.event.pull_request.base.sha }} echo "::group::Build image_base" - docker build -f $file -t "$image_base" --no-cache . || true + if ! docker build -f "$file" -t "$image_base" --no-cache .; then + echo "skip=true" >> $GITHUB_ENV + echo "skip=true" >> $GITHUB_OUTPUT + exit 0 + fi echo "::endgroup::" size_base=$(docker image inspect "$image_base" | jq '.[0].Size / (1024 * 1024) | round') @@ -123,20 +127,23 @@ jobs: echo "summary_path=${{github.workspace}}/build-$image_name.md" >> $GITHUB_ENV - name: Download origin artifact log - uses: actions/download-artifact@v4 + if: env.skip != 'true' + uses: actions/download-artifact@v4.1.3 with: name: build-comments path: merged-files continue-on-error: true - name: Merge logs + if: env.skip != 'true' run: | mkdir -p merged-files ls merged-files/ cp ${{ env.summary_path }} merged-files/ - name: Save Summary as Artifact - uses: actions/upload-artifact@v4 + if: env.skip != 'true' + uses: actions/upload-artifact@c7d193f32edcb7bfad88892161225aeda64e9392 with: name: build-comments path: merged-files/ @@ -146,13 +153,13 @@ jobs: needs: build-and-check permissions: actions: read - if: always() + if: always() && needs.build-and-check.outputs.skip != 'true' runs-on: ubuntu-latest outputs: all_comments: ${{ steps.summary.outputs.all_comments }} steps: - name: Download Summary - uses: actions/download-artifact@v4 + uses: actions/download-artifact@v4.1.3 with: name: build-comments path: downloaded-files diff --git a/.github/workflows/pr-link-path-scan.yml b/.github/workflows/pr-link-path-scan.yml index 932646a52d..a14eaf3cd3 100644 --- a/.github/workflows/pr-link-path-scan.yml +++ b/.github/workflows/pr-link-path-scan.yml @@ -19,7 +19,7 @@ jobs: run: sudo rm -rf ${{github.workspace}}/* - name: Checkout Repo GenAIExamples - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: fetch-depth: 0 @@ -84,7 +84,7 @@ jobs: run: sudo rm -rf ${{github.workspace}}/* - name: Checkout Repo GenAIExamples - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: fetch-depth: 0 diff --git 
a/.github/workflows/pr-one-click.yml b/.github/workflows/pr-one-click.yml index eb90bb0e26..b403a21c35 100644 --- a/.github/workflows/pr-one-click.yml +++ b/.github/workflows/pr-one-click.yml @@ -26,12 +26,14 @@ jobs: strategy: matrix: deploy_method: ["docker", "k8s"] + os: ["debian", "openeuler"] fail-fast: false uses: ./.github/workflows/_run-one-click.yml with: registry: "opea" tag: "ci" example: ChatQnA - hardware: gaudi + os: ${{ matrix.os }} + hardware: xeon deploy_method: ${{ matrix.deploy_method }} secrets: inherit diff --git a/.github/workflows/push-images-path-detection.yml b/.github/workflows/push-images-path-detection.yml index 9edfad2678..7137cb225c 100644 --- a/.github/workflows/push-images-path-detection.yml +++ b/.github/workflows/push-images-path-detection.yml @@ -19,7 +19,7 @@ jobs: run: sudo rm -rf ${{github.workspace}}/* - name: Checkout repo GenAIExamples - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 - name: Check the validity of links run: | diff --git a/.github/workflows/push-infra-issue-creation.yml b/.github/workflows/push-infra-issue-creation.yml index 3f8a22baf8..0175ff0e86 100644 --- a/.github/workflows/push-infra-issue-creation.yml +++ b/.github/workflows/push-infra-issue-creation.yml @@ -18,7 +18,7 @@ jobs: runs-on: ubuntu-latest steps: - name: Checkout out Repo - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: fetch-depth: 0 @@ -42,7 +42,7 @@ jobs: echo "EOF" >> $GITHUB_ENV - name: Create Issue - uses: dacbd/create-issue-action@main + uses: dacbd/create-issue-action@fec641442c0897e734fad173cfe83ae21a2284a3 with: token: ${{ secrets.ACTION_TOKEN }} owner: opea-project diff --git a/.github/workflows/scorecard.yml b/.github/workflows/scorecard.yml index e6286dfa5d..b08b860059 100644 --- a/.github/workflows/scorecard.yml +++ b/.github/workflows/scorecard.yml @@ -76,6 +76,6 @@ jobs: # Upload the results to GitHub's code scanning dashboard (optional). # Commenting out will disable upload of results to your repo's Code Scanning dashboard - name: "Upload to code-scanning" - uses: github/codeql-action/upload-sarif@v3 + uses: github/codeql-action/upload-sarif@303c0aef88fc2fe5ff6d63d3b1596bfd83dfa1f9 with: sarif_file: results.sarif diff --git a/.github/workflows/scripts/docker_compose_clean_up.sh b/.github/workflows/scripts/docker_compose_clean_up.sh index 1e88bb2c95..b83a8f0ca7 100644 --- a/.github/workflows/scripts/docker_compose_clean_up.sh +++ b/.github/workflows/scripts/docker_compose_clean_up.sh @@ -19,12 +19,12 @@ case "$1" in containers=$(cat $yaml_file | grep container_name | cut -d':' -f2) for container_name in $containers; do cid=$(docker ps -aq --filter "name=$container_name") - if [[ ! -z "$cid" ]]; then docker stop $cid && docker rm $cid && sleep 1s; fi + if [[ -n "$cid" ]]; then docker stop "$cid" && docker rm "$cid" && sleep 1s; fi done ;; ports) echo "Release all ports used by the services in $yaml_file ..." - pip install jq yq + pip install jq==1.10.0 yq==3.4.3 ports=$(yq '.services[].ports[] | split(":")[0]' $yaml_file | grep -o '[0-9a-zA-Z_-]\+') echo "All ports list..." echo "$ports" @@ -32,11 +32,9 @@ case "$1" in if [[ $port =~ [a-zA-Z_-] ]]; then echo "Search port value $port from the test case..." port_fix=$(grep -E "export $port=" tests/$test_case | cut -d'=' -f2) - if [[ "$port_fix" == "" ]]; then - echo "Can't find the port value from the test case, use the default value in yaml..." 
- port_fix=$(yq '.services[].ports[]' $yaml_file | grep $port | cut -d':' -f2 | grep -o '[0-9a-zA-Z]\+') + if [[ "$port_fix" ]]; then + port=$port_fix fi - port=$port_fix fi if [[ $port =~ [0-9] ]]; then if [[ $port == 5000 ]]; then @@ -45,7 +43,7 @@ case "$1" in fi echo "Check port $port..." cid=$(docker ps --filter "publish=${port}" --format "{{.ID}}") - if [[ ! -z "$cid" ]]; then docker stop $cid && docker rm $cid && echo "release $port"; fi + if [[ -n "$cid" ]]; then docker stop "$cid" && docker rm "$cid" && echo "release $port"; fi fi done ;; diff --git a/.github/workflows/scripts/get-params.py b/.github/workflows/scripts/get-params.py deleted file mode 100644 index d597facaa9..0000000000 --- a/.github/workflows/scripts/get-params.py +++ /dev/null @@ -1,41 +0,0 @@ -#!/usr/bin/env python3 -# Copyright (C) 2025 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -import json -import os -import sys - -sys.path.append(os.path.join(os.path.dirname(__file__), "../../../one_click_deploy/core/")) -from config import EXAMPLE_CONFIGS - - -def get_example_defaults(example_name): - if example_name not in EXAMPLE_CONFIGS: - print(f"error: example '{example_name}' not found in EXAMPLE_CONFIGS") - sys.exit(1) - - example_config = EXAMPLE_CONFIGS[example_name] - params = example_config.get("interactive_params", {}) - - if isinstance(params, list): - return {param["name"]: param["default"] for param in params} - elif isinstance(params, dict): - return { - device: {param["name"]: param["default"] for param in device_params} - for device, device_params in params.items() - } - else: - return {"error": "Invalid params format in EXAMPLE_CONFIGS for example: " + example_name} - - -def main(): - example_name = sys.argv[1] - - defaults = get_example_defaults(example_name) - - print(json.dumps(defaults, indent=2, ensure_ascii=False)) - - -if __name__ == "__main__": - main() diff --git a/.github/workflows/scripts/k8s-utils.sh b/.github/workflows/scripts/k8s-utils.sh index 0676a80d38..aa2a4f6d05 100755 --- a/.github/workflows/scripts/k8s-utils.sh +++ b/.github/workflows/scripts/k8s-utils.sh @@ -2,7 +2,7 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 -set -e +# set -e function dump_pod_log() { pod_name=$1 diff --git a/.github/workflows/weekly-one-click-test.yml b/.github/workflows/weekly-one-click-test.yml index 39174073bf..d60d7971e4 100644 --- a/.github/workflows/weekly-one-click-test.yml +++ b/.github/workflows/weekly-one-click-test.yml @@ -26,7 +26,7 @@ jobs: deploy_methods: ${{ steps.get-matrix.outputs.deploy_methods }} steps: - name: Checkout - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: fetch-depth: 0 @@ -55,11 +55,16 @@ jobs: example: ${{ fromJson(needs.get-test-matrix.outputs.examples) }} node: ${{ fromJson(needs.get-test-matrix.outputs.nodes) }} deploy_method: ${{ fromJson(needs.get-test-matrix.outputs.deploy_methods) }} + exclude: + - example: AgentQnA + node: xeon + deploy_method: k8s fail-fast: false uses: ./.github/workflows/_run-one-click.yml with: hardware: ${{ matrix.node }} example: ${{ matrix.example }} deploy_method: ${{ matrix.deploy_method }} + os: "debian" registry: "opea" secrets: inherit diff --git a/.github/workflows/weekly-update-images.yml b/.github/workflows/weekly-update-images.yml index 9a8d1498a0..134476aeac 100644 --- a/.github/workflows/weekly-update-images.yml +++ b/.github/workflows/weekly-update-images.yml @@ -18,7 +18,7 @@ jobs: BRANCH_NAME: "update_images_tag" steps: - name: 
Checkout repository - uses: actions/checkout@v4 + uses: actions/checkout@1e31de5234b9f8995739874a8ce0492dc87873e2 with: fetch-depth: 0 ref: "main" diff --git a/AgentQnA/docker_compose/intel/hpu/gaudi/compose.yaml b/AgentQnA/docker_compose/intel/hpu/gaudi/compose.yaml index 5f197b49c2..8680b83443 100644 --- a/AgentQnA/docker_compose/intel/hpu/gaudi/compose.yaml +++ b/AgentQnA/docker_compose/intel/hpu/gaudi/compose.yaml @@ -128,7 +128,7 @@ services: OPENAI_API_BASE_URLS: ${SUPERVISOR_AGENT_ENDPOINT} ENABLE_OLLAMA_API: False vllm-service: - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} + image: opea/vllm-gaudi:1.4 container_name: vllm-gaudi-server ports: - "8086:8000" diff --git a/AgentQnA/docker_image_build/build.yaml b/AgentQnA/docker_image_build/build.yaml index 7db63b6fa8..cf757968de 100644 --- a/AgentQnA/docker_image_build/build.yaml +++ b/AgentQnA/docker_image_build/build.yaml @@ -17,12 +17,6 @@ services: dockerfile: ./docker/Dockerfile extends: agent image: ${REGISTRY:-opea}/agent-ui:${TAG:-latest} - vllm-gaudi: - build: - context: vllm-fork - dockerfile: Dockerfile.hpu - extends: agent - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} vllm-rocm: build: context: GenAIComps diff --git a/AgentQnA/kubernetes/helm/rocm-tgi-values.yaml b/AgentQnA/kubernetes/helm/rocm-tgi-values.yaml new file mode 100644 index 0000000000..9c2bc98eb8 --- /dev/null +++ b/AgentQnA/kubernetes/helm/rocm-tgi-values.yaml @@ -0,0 +1,57 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +# Accelerate inferencing in heaviest components to improve performance +# by overriding their subchart values +vllm: + enabled: false +tgi: + enabled: true + accelDevice: "rocm" + image: + repository: ghcr.io/huggingface/text-generation-inference + tag: "3.0.0-rocm" + LLM_MODEL_ID: meta-llama/Llama-3.3-70B-Instruct + MAX_INPUT_LENGTH: "2048" + MAX_TOTAL_TOKENS: "4096" + PYTORCH_TUNABLEOP_ENABLED: "0" + USE_FLASH_ATTENTION: "true" + FLASH_ATTENTION_RECOMPUTE: "false" + HIP_VISIBLE_DEVICES: "0,1" + MAX_BATCH_SIZE: "4" + extraCmdArgs: [ "--num-shard","2" ] + resources: + limits: + amd.com/gpu: "2" + requests: + cpu: 1 + memory: 16Gi + securityContext: + readOnlyRootFilesystem: false + runAsNonRoot: false + runAsUser: 0 + capabilities: + add: + - SYS_PTRACE + readinessProbe: + initialDelaySeconds: 60 + periodSeconds: 5 + timeoutSeconds: 1 + failureThreshold: 120 + startupProbe: + initialDelaySeconds: 60 + periodSeconds: 5 + timeoutSeconds: 1 + failureThreshold: 120 +supervisor: + llm_endpoint_url: http://{{ .Release.Name }}-tgi + llm_engine: tgi + model: "meta-llama/Llama-3.3-70B-Instruct" +ragagent: + llm_endpoint_url: http://{{ .Release.Name }}-tgi + llm_engine: tgi + model: "meta-llama/Llama-3.3-70B-Instruct" +sqlagent: + llm_endpoint_url: http://{{ .Release.Name }}-tgi + llm_engine: tgi + model: "meta-llama/Llama-3.3-70B-Instruct" diff --git a/AgentQnA/kubernetes/helm/rocm-values.yaml b/AgentQnA/kubernetes/helm/rocm-values.yaml new file mode 100644 index 0000000000..0d5393b70f --- /dev/null +++ b/AgentQnA/kubernetes/helm/rocm-values.yaml @@ -0,0 +1,52 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +# Accelerate inferencing in heaviest components to improve performance +# by overriding their subchart values + +tgi: + enabled: false +vllm: + enabled: true + accelDevice: "rocm" + image: + repository: opea/vllm-rocm + tag: latest + env: + LLM_MODEL_ID: meta-llama/Llama-3.3-70B-Instruct + HIP_VISIBLE_DEVICES: "0,1" + TENSOR_PARALLEL_SIZE: "2" + 
HF_HUB_DISABLE_PROGRESS_BARS: "1" + HF_HUB_ENABLE_HF_TRANSFER: "0" + VLLM_USE_TRITON_FLASH_ATTN: "0" + VLLM_WORKER_MULTIPROC_METHOD: "spawn" + PYTORCH_JIT: "0" + HF_HOME: "/data" + extraCmd: + command: [ "python3", "/workspace/api_server.py" ] + extraCmdArgs: [ "--swap-space", "16", + "--disable-log-requests", + "--dtype", "float16", + "--num-scheduler-steps", "1", + "--distributed-executor-backend", "mp" ] + resources: + limits: + amd.com/gpu: "2" + startupProbe: + failureThreshold: 180 + securityContext: + readOnlyRootFilesystem: false + runAsNonRoot: false + runAsUser: 0 +supervisor: + llm_endpoint_url: http://{{ .Release.Name }}-vllm + llm_engine: vllm + model: "meta-llama/Llama-3.3-70B-Instruct" +ragagent: + llm_endpoint_url: http://{{ .Release.Name }}-vllm + llm_engine: vllm + model: "meta-llama/Llama-3.3-70B-Instruct" +sqlagent: + llm_endpoint_url: http://{{ .Release.Name }}-vllm + llm_engine: vllm + model: "meta-llama/Llama-3.3-70B-Instruct" diff --git a/AgentQnA/tests/step1_build_images.sh b/AgentQnA/tests/step1_build_images.sh index 58b5c8d6e8..5a13c8a52b 100644 --- a/AgentQnA/tests/step1_build_images.sh +++ b/AgentQnA/tests/step1_build_images.sh @@ -40,12 +40,8 @@ function build_agent_docker_image_gaudi_vllm() { cd $WORKDIR/GenAIExamples/AgentQnA/docker_image_build/ get_genai_comps - git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork - VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0 - git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../ - echo "Build agent image with --no-cache..." - service_list="agent agent-ui vllm-gaudi" + service_list="agent agent-ui" docker compose -f build.yaml build ${service_list} --no-cache } @@ -83,6 +79,7 @@ function main() { "rocm_vllm") echo "==================== Build agent docker image for ROCm VLLM ====================" build_agent_docker_image_rocm_vllm + docker image ls | grep vllm ;; "gaudi_vllm") echo "==================== Build agent docker image for Gaudi ====================" @@ -97,8 +94,6 @@ function main() { exit 1 ;; esac - - docker image ls | grep vllm } main $1 diff --git a/ArbPostHearingAssistant/Dockerfile b/ArbPostHearingAssistant/Dockerfile new file mode 100644 index 0000000000..9e739b204d --- /dev/null +++ b/ArbPostHearingAssistant/Dockerfile @@ -0,0 +1,17 @@ +# Copyright (C) 2025 Zensar Technologies Private Ltd. +# SPDX-License-Identifier: Apache-2.0 + +ARG IMAGE_REPO=opea +ARG BASE_TAG=latest +FROM opea/comps-base:latest + +USER root +# FFmpeg needed for media processing +RUN apt-get update && \ + apt-get install -y --no-install-recommends ffmpeg && \ + apt-get clean && rm -rf /var/lib/apt/lists/* +USER user + +COPY ./arb_post_hearing_assistant.py $HOME/arb_post_hearing_assistant.py + +ENTRYPOINT ["python", "arb_post_hearing_assistant.py"] diff --git a/ArbPostHearingAssistant/README.md b/ArbPostHearingAssistant/README.md new file mode 100644 index 0000000000..536257b50c --- /dev/null +++ b/ArbPostHearingAssistant/README.md @@ -0,0 +1,32 @@ +# Arbitration Post-Hearing Assistant + +The Arbitration Post-Hearing Assistant is a GenAI-based module designed to process and summarize post-hearing transcripts or arbitration-related documents. It intelligently extracts key entities and insights to assist arbitrators, legal teams, and case managers in managing case follow-ups efficiently. + +## Table of contents + +1. [Architecture](#architecture) +2. 
[Deployment Options](#deployment-options) + +## Architecture + +The architecture of the ArbPostHearingAssistant Application is illustrated below: + +![Architecture](./assets/img/arbitration_architecture.png) + +The ArbPostHearingAssistant example is implemented using the component-level microservices defined in [GenAIComps](https://github.com/opea-project/GenAIComps). + +## Deployment Options + +The table below lists currently available deployment options. They outline in detail the implementation of this example on selected hardware. + +| Category | Deployment Option | Description | +| ---------------------- | ---------------------- | ------------------------------------------------------------------------------- | +| On-premise Deployments | Docker Compose (Xeon) | [ArbPostHearingAssistant deployment on Xeon](./docker_compose/intel/cpu/xeon) | +| | Docker Compose (Gaudi) | [ArbPostHearingAssistant deployment on Gaudi](./docker_compose/intel/hpu/gaudi) | + +## Validated Configurations + +| **Deploy Method** | **LLM Engine** | **LLM Model** | **Hardware** | +| ----------------- | -------------- | ---------------------------------- | ------------ | +| Docker Compose | vLLM, TGI | mistralai/Mistral-7B-Instruct-v0.2 | Intel Gaudi | +| Docker Compose | vLLM, TGI | mistralai/Mistral-7B-Instruct-v0.2 | Intel Xeon | diff --git a/ArbPostHearingAssistant/README_miscellaneous.md b/ArbPostHearingAssistant/README_miscellaneous.md new file mode 100644 index 0000000000..13d87b6913 --- /dev/null +++ b/ArbPostHearingAssistant/README_miscellaneous.md @@ -0,0 +1,45 @@ +# Table of Contents + +- [Table of Contents](#table-of-contents) + - [Build MegaService Docker Image](#build-megaservice-docker-image) + - [Build UI Docker Image](#build-ui-docker-image) + - [Generate a HuggingFace Access Token](#generate-a-huggingface-access-token) + - [Troubleshooting](#troubleshooting) + +## Build MegaService Docker Image + +To construct the Megaservice of ArbPostHearingAssistant, the [GenAIExamples](https://github.com/opea-project/GenAIExamples.git) repository is utilized. Build MegaService Docker image via command below: + +```bash +git clone https://github.com/opea-project/GenAIExamples.git +cd GenAIExamples/ArbPostHearingAssistant +docker build --no-cache -t opea/arb-post-hearing-assistant:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . +``` + +## Build UI Docker Image + +Build frontend Docker image via below command: + +```bash +cd GenAIExamples/ArbPostHearingAssistant/ui +docker build -t opea/arb-post-hearing-assistant-gradio-ui:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f ./docker/Dockerfile . +``` + +## Generate a HuggingFace Access Token + +Some HuggingFace resources, such as certain models, are only accessible if the developer has an access token. If you don't have a HuggingFace access token, you can create one by registering at [HuggingFace](https://huggingface.co/) and following [these steps](https://huggingface.co/docs/transformers.js/en/guides/private#step-1-generating-a-user-access-token). + +## Troubleshooting + +1. If you get errors like "Access Denied", [validate micro service](./README.md#validate-microservices) first. A simple example: + + ```bash + http_proxy="" + curl http://${host_ip}:8008/generate \ + -X POST \ + -d '{"inputs":" ### System: Please translate the following Golang codes into Python codes. 
### Original codes: '\'''\'''\''Golang \npackage main\n\nimport \"fmt\"\nfunc main() {\n fmt.Println(\"Hello, World!\");\n '\'''\'''\'' ### Translated codes:","parameters":{"max_tokens":17, "do_sample": true}}' \ + -H 'Content-Type: application/json' + ``` + +2. (Docker only) If all microservices work well, check the port ${host_ip}:7777, the port may be allocated by other users, you can modify the `compose.yaml`. +3. (Docker only) If you get errors like "The container name is in use", change container name in `compose.yaml`. diff --git a/ArbPostHearingAssistant/arb_post_hearing_assistant.py b/ArbPostHearingAssistant/arb_post_hearing_assistant.py new file mode 100644 index 0000000000..30ae2271d3 --- /dev/null +++ b/ArbPostHearingAssistant/arb_post_hearing_assistant.py @@ -0,0 +1,148 @@ +# Copyright (C) 2025 Zensar Technologies Private Ltd. +# SPDX-License-Identifier: Apache-2.0 + +import asyncio +import base64 +import json +import os +import subprocess +import uuid +from typing import List + +from comps import MegaServiceEndpoint, MicroService, ServiceOrchestrator, ServiceRoleType, ServiceType +from comps.cores.mega.utils import handle_message +from comps.cores.proto.api_protocol import ( + ArbPostHearingAssistantChatCompletionRequest, + ChatCompletionRequest, + ChatCompletionResponse, + ChatCompletionResponseChoice, + ChatMessage, + UsageInfo, +) +from fastapi import Request +from fastapi.responses import StreamingResponse + +MEGA_SERVICE_PORT = int(os.getenv("MEGA_SERVICE_PORT", 8888)) + +LLM_SERVICE_HOST_IP = os.getenv("LLM_SERVICE_HOST_IP", "0.0.0.0") +LLM_SERVICE_PORT = int(os.getenv("LLM_SERVICE_PORT", 9000)) + + +def align_inputs(self, inputs, cur_node, runtime_graph, llm_parameters_dict, **kwargs): + if self.services[cur_node].service_type == ServiceType.ARB_POST_HEARING_ASSISTANT: + for key_to_replace in ["text", "asr_result"]: + if key_to_replace in inputs: + inputs["messages"] = inputs[key_to_replace] + del inputs[key_to_replace] + + arbPostHearingAssistant_parameters = kwargs.get("arbPostHearingAssistant_parameters", None) + if arbPostHearingAssistant_parameters: + arbPostHearingAssistant_parameters = arbPostHearingAssistant_parameters.model_dump() + del arbPostHearingAssistant_parameters["messages"] + inputs.update(arbPostHearingAssistant_parameters) + if "id" in inputs: + del inputs["id"] + if "max_new_tokens" in inputs: + del inputs["max_new_tokens"] + if "input" in inputs: + del inputs["input"] + return inputs + + +def align_outputs(self, data, *args, **kwargs): + return data + + +class OpeaArbPostHearingAssistantService: + def __init__(self, host="0.0.0.0", port=8000): + self.host = host + self.port = port + ServiceOrchestrator.align_inputs = align_inputs + ServiceOrchestrator.align_outputs = align_outputs + self.megaservice = ServiceOrchestrator() + self.endpoint = "/v1/arb-post-hearing" + + def add_remote_service(self): + + arb_post_hearing_assistant = MicroService( + name="opea_service@arb_post_hearing_assistant", + host=LLM_SERVICE_HOST_IP, + port=LLM_SERVICE_PORT, + endpoint="/v1/arb-post-hearing", + use_remote_service=True, + service_type=ServiceType.ARB_POST_HEARING_ASSISTANT, + ) + self.megaservice.add(arb_post_hearing_assistant) + + async def handle_request(self, request: Request): + """Accept pure text.""" + if "application/json" in request.headers.get("content-type"): + data = await request.json() + chunk_size = data.get("chunk_size", -1) + chunk_overlap = data.get("chunk_overlap", -1) + chat_request = 
ArbPostHearingAssistantChatCompletionRequest.model_validate(data) + prompt = handle_message(chat_request.messages) + print(f"messages:{chat_request.messages}") + print(f"prompt: {prompt}") + initial_inputs_data = {data["type"]: prompt} + else: + raise ValueError(f"Unknown request type: {request.headers.get('content-type')}") + + arbPostHearingAssistant_parameters = ArbPostHearingAssistantChatCompletionRequest( + messages=chat_request.messages, + max_tokens=chat_request.max_tokens if chat_request.max_tokens else 1024, + top_k=chat_request.top_k if chat_request.top_k else 10, + top_p=chat_request.top_p if chat_request.top_p else 0.95, + temperature=chat_request.temperature if chat_request.temperature else 0.01, + frequency_penalty=chat_request.frequency_penalty if chat_request.frequency_penalty else 0.0, + presence_penalty=chat_request.presence_penalty if chat_request.presence_penalty else 0.0, + repetition_penalty=chat_request.repetition_penalty if chat_request.repetition_penalty else 1.03, + model=chat_request.model if chat_request.model else None, + language=chat_request.language if chat_request.language else "en", + chunk_overlap=chunk_overlap, + chunk_size=chunk_size, + ) + result_dict, runtime_graph = await self.megaservice.schedule( + initial_inputs=initial_inputs_data, arbPostHearingAssistant_parameters=arbPostHearingAssistant_parameters + ) + + for node, response in result_dict.items(): + # Here it suppose the last microservice in the megaservice is LLM. + if ( + isinstance(response, StreamingResponse) + and node == list(self.megaservice.services.keys())[-1] + and self.megaservice.services[node].service_type == ServiceType.ARB_POST_HEARING_ASSISTANT + ): + return response + + last_node = runtime_graph.all_leaves()[-1] + response = result_dict[last_node]["text"] + choices = [] + usage = UsageInfo() + choices.append( + ChatCompletionResponseChoice( + index=0, + message=ChatMessage(role="assistant", content=response), + finish_reason="stop", + ) + ) + return ChatCompletionResponse(model="arbPostHearingAssistant", choices=choices, usage=usage) + + def start(self): + self.service = MicroService( + self.__class__.__name__, + service_role=ServiceRoleType.MEGASERVICE, + host=self.host, + port=self.port, + endpoint=self.endpoint, + input_datatype=ArbPostHearingAssistantChatCompletionRequest, + output_datatype=ChatCompletionResponse, + ) + self.service.add_route(self.endpoint, self.handle_request, methods=["POST"]) + self.service.start() + + +if __name__ == "__main__": + arbPostHearingAssistant = OpeaArbPostHearingAssistantService(port=MEGA_SERVICE_PORT) + arbPostHearingAssistant.add_remote_service() + arbPostHearingAssistant.start() diff --git a/ArbPostHearingAssistant/assets/img/arbitration_architecture.png b/ArbPostHearingAssistant/assets/img/arbitration_architecture.png new file mode 100644 index 0000000000..1baa205e65 Binary files /dev/null and b/ArbPostHearingAssistant/assets/img/arbitration_architecture.png differ diff --git a/ArbPostHearingAssistant/assets/img/arbritation_post_hearing_ui_gradio_text.png b/ArbPostHearingAssistant/assets/img/arbritation_post_hearing_ui_gradio_text.png new file mode 100644 index 0000000000..ee6355a476 Binary files /dev/null and b/ArbPostHearingAssistant/assets/img/arbritation_post_hearing_ui_gradio_text.png differ diff --git a/ArbPostHearingAssistant/benchmark_arb_post_hearing_assistant.yaml b/ArbPostHearingAssistant/benchmark_arb_post_hearing_assistant.yaml new file mode 100644 index 0000000000..9e3eda52b1 --- /dev/null +++ 
b/ArbPostHearingAssistant/benchmark_arb_post_hearing_assistant.yaml @@ -0,0 +1,77 @@ +# Copyright (C) 2025 Zensar Technologies Private Ltd. +# SPDX-License-Identifier: Apache-2.0 + +deploy: + device: gaudi + version: 1.3.0 + modelUseHostPath: /mnt/models + HF_TOKEN: "" # mandatory + node: [1] + namespace: "" + node_name: [] + timeout: 1000 # timeout in seconds for services to be ready, default 30 minutes + interval: 5 # interval in seconds between service ready checks, default 5 seconds + + services: + backend: + resources: + enabled: False + cores_per_instance: "16" + memory_capacity: "8000Mi" + replicaCount: [1] + + llm: + engine: vllm # or tgi + model_id: "mistralai/Mistral-7B-Instruct-v0.2" # mandatory + replicaCount: [1] + resources: + enabled: False + cards_per_instance: 1 + model_params: + vllm: # VLLM specific parameters + batch_params: + enabled: True + max_num_seqs: "8" # Each value triggers an LLM service upgrade + token_params: + enabled: True + max_input_length: "" + max_total_tokens: "" + max_batch_total_tokens: "" + max_batch_prefill_tokens: "" + tgi: # TGI specific parameters + batch_params: + enabled: True + max_batch_size: [1] # Each value triggers an LLM service upgrade + token_params: + enabled: False + max_input_length: "1280" + max_total_tokens: "2048" + max_batch_total_tokens: "65536" + max_batch_prefill_tokens: "4096" + + arbPostHearingAssistant-ui: + replicaCount: [1] + + llm-uservice: + model_id: "mistralai/Mistral-7B-Instruct-v0.2" # mandatory + replicaCount: [1] + + nginx: + replicaCount: [1] + +benchmark: + # http request behavior related fields + user_queries: [16] + concurrency: [4] + load_shape_type: "constant" # "constant" or "poisson" + poisson_arrival_rate: 1.0 # only used when load_shape_type is "poisson" + warmup_iterations: 10 + seed: 1024 + collect_service_metric: True + + # workload, all of the test cases will run for benchmark + bench_target: ["arbPostHearingAssistantfixed"] # specify the bench_target for benchmark + dataset: "/home/sdp/pubmed_10.txt" # specify the absolute path to the dataset file + llm: + # specify the llm output token size + max_token_size: [1024] diff --git a/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/README.md b/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/README.md new file mode 100644 index 0000000000..dd4a1f7ee1 --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/README.md @@ -0,0 +1,186 @@ +# Deploy Arbitration Post-Hearing Assistant Application on AMD EPYC™ Processors with Docker Compose + +This document details the deployment procedure for a Arbitration Post-Hearing Assistant application using OPEA components on an AMD EPYC™ Processors. + +This example includes the following sections: + +- [Arbitration Post-Hearing Assistant Quick Start Deployment](#arb-post-hearing-assistant-quick-start-deployment): Demonstrates how to quickly deploy a Arbitration Post-Hearing Assistant application/pipeline on AMD EPYC platform. +- [Arbitration Post-Hearing Assistant Docker Compose Files](#arb-post-hearing-assistant-docker-compose-files): Describes some example deployments and their docker compose files. +- [Arbitration Post-Hearing Assistant Detailed Usage](#arb-post-hearing-assistant-detailed-usage): Provide more detailed usage. +- [Launch the UI](#launch-the-ui): Guideline for UI usage + +## arb-post-hearing-assistant Quick Start Deployment + +This section explains how to quickly deploy and manually test the Arbitration Post-Hearing Assistant service on an AMD EPYC platform. 
The process involves the following basic steps: + +1. [Access the Code](#access-the-code) +2. [Install Docker](#install-docker) +3. [Determine your host external IP address](#determine-your-host-external-ip-address) +4. [Generate a HuggingFace Access Token](#generate-a-huggingface-access-token) +5. [Set Up Environment](#set-up-environment) +6. [Deploy the Services Using Docker Compose](#deploy-the-services-using-docker-compose) +7. [Check the Deployment Status](#check-the-deployment-status) +8. [Test the Pipeline](#test-the-pipeline) +9. [Cleanup the Deployment](#cleanup-the-deployment) + +### Access the Code + +Clone the GenAIExample repository and access the Arbitration Post-Hearing Assistant AMD EPYC platform Docker Compose files and supporting scripts: + +```bash +git clone https://github.com/opea-project/GenAIExamples.git +cd GenAIExamples/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc +``` + +### Install Docker + +Ensure Docker is installed on your system. If Docker is not already installed, use the provided script to set it up: + + source ./install_docker.sh + +This script installs Docker and its dependencies. After running it, verify the installation by checking the Docker version: + + docker --version + +If Docker is already installed, this step can be skipped. + +### Determine your host external IP address + +Run the following command in your terminal to list network interfaces: + + ifconfig + +Look for the inet address associated with your active network interface (e.g., enp99s0). For example: + + enp99s0: flags=4163 mtu 1500 + inet 10.101.16.119 netmask 255.255.255.0 broadcast 10.101.16.255 + +In this example, the (`host_ip`) would be (`10.101.16.119`). + + # Replace with your host's external IP address + export host_ip="your_external_ip_address" + +### Generate a HuggingFace Access Token + +Some HuggingFace resources, such as some models, are only accessible if you have an access token. If you do not already have a HuggingFace access token, you can create one by first creating an account by following the steps provided at [HuggingFace](https://huggingface.co/) and then generating a [user access token](https://huggingface.co/docs/transformers.js/en/guides/private#step-1-generating-a-user-access-token). + +```bash +export HF_TOKEN="your_huggingface_token" +``` + +### Set Up Environment + +Set the environment variables + +```bash +source ./set_env.sh +``` + +NOTE: by default vLLM does "warmup" at start, to optimize its performance for the specified model and the underlying platform, which can take long time. For development (and e.g. autoscaling) it can be skipped with `export VLLM_SKIP_WARMUP=true`. + +### Deploy the Services Using Docker Compose + +To deploy the Arbitration Post-Hearing Assistant services, execute the `docker compose up` command with the appropriate arguments. For a default deployment, execute: + +```bash +docker compose up -d +``` + +**Note**: developers should build docker image from source when: + +- Developing off the git main branch (as the container's ports in the repo may be different from the published docker image). +- Unable to download the docker image. +- Use a specific version of Docker image. 
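+
+`docker compose up -d` returns before the model server has finished downloading the model and warming up, so the pipeline may not be usable immediately. As an optional convenience (not part of the shipped example), the sketch below polls the services from Python before you proceed to the status check and pipeline test later in this guide; it assumes the default ports exported by `set_env.sh` (8008 for the model server, 8888 for the megaservice).
+
+```python
+# wait_for_services.py - minimal readiness sketch; assumes the default set_env.sh ports.
+import os
+import socket
+import time
+import urllib.request
+
+HOST_IP = os.environ.get("host_ip", "localhost")
+LLM_HEALTH_URL = f"http://{HOST_IP}:8008/health"  # vLLM/TGI health endpoint
+BACKEND_PORT = 8888                               # megaservice port
+
+
+def wait_for_http(url, timeout_s=1800):
+    """Poll an HTTP health endpoint until it returns 200 or the timeout expires."""
+    deadline = time.time() + timeout_s
+    while time.time() < deadline:
+        try:
+            with urllib.request.urlopen(url, timeout=5) as resp:
+                if resp.status == 200:
+                    print(f"{url} is ready")
+                    return
+        except OSError:
+            pass
+        time.sleep(10)
+    raise TimeoutError(f"{url} did not become ready within {timeout_s}s")
+
+
+def wait_for_port(host, port, timeout_s=300):
+    """Wait until a TCP port accepts connections."""
+    deadline = time.time() + timeout_s
+    while time.time() < deadline:
+        try:
+            with socket.create_connection((host, port), timeout=5):
+                print(f"{host}:{port} is accepting connections")
+                return
+        except OSError:
+            time.sleep(5)
+    raise TimeoutError(f"{host}:{port} did not open within {timeout_s}s")
+
+
+if __name__ == "__main__":
+    wait_for_http(LLM_HEALTH_URL)         # model server has loaded the model
+    wait_for_port(HOST_IP, BACKEND_PORT)  # megaservice is listening
+```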
+ +Please refer to the table below to build different microservices from source: + +| Microservice | Deployment Guide | +| ------------------------------ | ----------------------------------------------------------------------------------------------------------------------------------------------------------- | +| vLLM | [vLLM build guide](https://github.com/opea-project/GenAIComps/tree/main/comps/third_parties/vllm#build-docker) | +| llm-arb-post-hearing-assistant | [LLM-ArbPostHearingAssistant build guide](https://github.com/opea-project/GenAIComps/tree/main/comps/arb_post_hearing_assistant/src/#12-build-docker-image) | +| MegaService | [MegaService build guide](../../../../README_miscellaneous.md#build-megaservice-docker-image) | +| UI | [Basic UI build guide](../../../../README_miscellaneous.md#build-ui-docker-image) | + +### Check the Deployment Status + +After running docker compose, to check if all the containers launched via docker compose have started: + +```bash +docker ps -a +``` + +For the default deployment, the following 4 containers should be running: + +```bash +CONTAINER ID IMAGE COMMAND CREATED STATUS PORTS NAMES +24bd78300413 opea/arb-post-hearing-assistant-gradio-ui:latest "python arb_post_hea…" 2 hours ago Up 2 hours 0.0.0.0:5173->5173/tcp, [::]:5173->5173/tcp arb-post-hearing-assistant-xeon-ui-server +59e60c954e26 opea/arb-post-hearing-assistant:latest "python arb_post_hea…" 2 hours ago Up 2 hours 0.0.0.0:8888->8888/tcp, [::]:8888->8888/tcp arb-post-hearing-assistant-xeon-backend-server +32afc12de996 opea/llm-arb-post-hearing-assistant:latest "python comps/arb_po…" 2 hours ago Up 2 hours 0.0.0.0:9000->9000/tcp, [::]:9000->9000/tcp arb-post-hearing-assistant-xeon-llm-server +c8e539360aff ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu "text-generation-lau…" 2 hours ago Up 2 hours (healthy) 0.0.0.0:8008->80/tcp, [::]:8008->80/tcp arb-post-hearing-assistant-xeon-tgi-server +``` + +### Test the Pipeline + +Once the Arbitration Post-Hearing Assistant services are running, test the pipeline using the following command: + +```bash +curl -X POST http://${host_ip}:8888/v1/arb-post-hearing \ + -H "Content-Type: application/json" \ + -d '{"type": "text", [10:00 AM] Arbitrator Hon. Rebecca Lawson: Good morning. This hearing is now in session for Case No. ARB/2025/0917. Lets begin with appearances. [10:01 AM] Attorney Michael Grant for Mr. Jonathan Reed: Good morning Your Honor. I represent the claimant Mr. Jonathan Reed. [10:01 AM] Attorney Lisa Chen for Ms. Rachel Morgan: Good morning. I represent the respondent Ms. Rachel Morgan. [10:03 AM] Arbitrator Hon. Rebecca Lawson: Thank you. Lets proceed with Mr. Reeds opening statement. [10:04 AM] Attorney Michael Grant: Ms. Morgan failed to deliver services as per the agreement dated March 15 2023. We have submitted relevant documentation including email correspondence and payment records. The delay caused substantial financial harm to our client. [10:15 AM] Attorney Lisa Chen: We deny any breach of contract. The delays were due to regulatory issues outside our control. Furthermore Mr. Reed did not provide timely approvals which contributed to the delay. [10:30 AM] Arbitrator Hon. Rebecca Lawson: Lets turn to Clause Z of the agreement. Id like both parties to submit written briefs addressing the applicability of the force majeure clause and the timeline of approvals. [11:00 AM] Attorney Michael Grant: Understood. Well submit by the deadline. [11:01 AM] Attorney Lisa Chen: Agreed. [11:02 AM] Arbitrator Hon. 
Rebecca Lawson: The next hearing is scheduled for October 22 2025 at 1030 AM Eastern Time. Please ensure your witnesses are available for cross examination. [4:45 PM] Arbitrator Hon. Rebecca Lawson: This session is adjourned. Thank you everyone.","max_tokens":2000,"language":"en"}' +``` + +**Note** The value of _host_ip_ was set using the _set_env.sh_ script and can be found in the _.env_ file. + +### Cleanup the Deployment + +To stop the containers associated with the deployment, execute the following command: + +```bash +docker compose -f compose.yaml down +``` + +All the Arbitration Post-Hearing Assistant containers will be stopped and then removed on completion of the "down" command. + +## arb-post-hearing-assistant Docker Compose Files + +In the context of deploying a Arbitration Post-Hearing Assistant pipeline on an AMD EPYC platform, we can pick and choose different large language model serving frameworks. The table below outlines the various configurations that are available as part of the application. + +| File | Description | +| -------------------------------------- | ----------------------------------------------------------------------------------------- | +| [compose.yaml](./compose.yaml) | Default compose file using vllm as serving framework | +| [compose_tgi.yaml](./compose_tgi.yaml) | The LLM serving framework is TGI. All other configurations remain the same as the default | + +## arb-post-hearing-assistant Assistant Detailed Usage + +There are also some customized usage. + +### Query with text + +```bash +# form input. Use English mode (default). +curl http://${host_ip}:8888/v1/arb-post-hearing \ + -H "Content-Type: multipart/form-data" \ + -F "type=text" \ + -F "messages=[10:00 AM] Arbitrator Hon. Rebecca Lawson: Good morning. This hearing is now in session for Case No. ARB/2025/0917. Lets begin with appearances. [10:01 AM] Attorney Michael Grant for Mr. Jonathan Reed: Good morning Your Honor. I represent the claimant Mr. Jonathan Reed. [10:01 AM] Attorney Lisa Chen for Ms. Rachel Morgan: Good morning. I represent the respondent Ms. Rachel Morgan. [10:03 AM] Arbitrator Hon. Rebecca Lawson: Thank you. Lets proceed with Mr. Reeds opening statement. [10:04 AM] Attorney Michael Grant: Ms. Morgan failed to deliver services as per the agreement dated March 15 2023. We have submitted relevant documentation including email correspondence and payment records. The delay caused substantial financial harm to our client. [10:15 AM] Attorney Lisa Chen: We deny any breach of contract. The delays were due to regulatory issues outside our control. Furthermore Mr. Reed did not provide timely approvals which contributed to the delay. [10:30 AM] Arbitrator Hon. Rebecca Lawson: Lets turn to Clause Z of the agreement. Id like both parties to submit written briefs addressing the applicability of the force majeure clause and the timeline of approvals. [11:00 AM] Attorney Michael Grant: Understood. Well submit by the deadline. [11:01 AM] Attorney Lisa Chen: Agreed. [11:02 AM] Arbitrator Hon. Rebecca Lawson: The next hearing is scheduled for October 22 2025 at 1030 AM Eastern Time. Please ensure your witnesses are available for cross examination. [4:45 PM] Arbitrator Hon. Rebecca Lawson: This session is adjourned. Thank you everyone." \ + -F "max_tokens=2000" \ + -F "language=en" + +## Launch the UI + +### Gradio UI + +Open this URL `http://{host_ip}:5173` in your browser to access the Gradio based frontend. 
+![project-screenshot](../../../../assets/img/arbritation_post_hearing_ui_gradio_text.png) + +### Profile Microservices + +To further analyze MicroService Performance, users could follow the instructions to profile MicroServices. + +#### 1. vLLM backend Service + +Users could follow previous section to testing vLLM microservice or Arbitration Post-Hearing Assistant MegaService. By default, vLLM profiling is not enabled. Users could start and stop profiling by following commands. + +## Conclusion + +This guide should enable developer to deploy the default configuration or any of the other compose yaml files for different configurations. It also highlights the configurable parameters that can be set before deployment. +``` diff --git a/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/compose.yaml b/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/compose.yaml new file mode 100644 index 0000000000..2f3a622180 --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/compose.yaml @@ -0,0 +1,87 @@ +# Copyright (C) 2025 Zensar Technologies Private Ltd. +# SPDX-License-Identifier: Apache-2.0 + +services: + vllm-service: + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 + container_name: arb-post-hearing-assistant-epyc-vllm-service + ports: + - "8008:80" + volumes: + - "${MODEL_CACHE:-./data}:/root/.cache/huggingface/hub" + shm_size: 1g + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + HF_TOKEN: ${HF_TOKEN} + MODEL_CACHE: ${MODEL_CACHE} + LLM_MODEL_ID: ${LLM_MODEL_ID} + VLLM_CPU_KVCACHE_SPACE: 40 + VLLM_TORCH_PROFILER_DIR: "/mnt" + healthcheck: + test: ["CMD-SHELL", "curl -f http://localhost:80/health || exit 1"] + interval: 10s + timeout: 10s + retries: 100 + command: --model $LLM_MODEL_ID --host 0.0.0.0 --port 80 + + llm-arbPostHearingAssistant-vllm: + image: ${REGISTRY:-opea}/llm-arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-epyc-llm-server + depends_on: + vllm-service: + condition: service_healthy + ports: + - ${LLM_PORT:-9000}:9000 + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + LLM_ENDPOINT: ${LLM_ENDPOINT} + LLM_MODEL_ID: ${LLM_MODEL_ID} + HF_TOKEN: ${HF_TOKEN} + MODEL_CACHE: ${MODEL_CACHE} + MAX_INPUT_TOKENS: ${MAX_INPUT_TOKENS} + MAX_TOTAL_TOKENS: ${MAX_TOTAL_TOKENS} + OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME: ${OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME} + LOGFLAG: ${LOGFLAG:-False} + restart: unless-stopped + + arbPostHearingAssistant-epyc-backend-server: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-epyc-backend-server + depends_on: + - vllm-service + - llm-arbPostHearingAssistant-vllm + ports: + - "${BACKEND_SERVICE_PORT:-8888}:8888" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} + - LLM_SERVICE_HOST_IP=${LLM_SERVICE_HOST_IP} + ipc: host + restart: always + + arbPostHearingAssistant-gradio-ui: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant-gradio-ui:${TAG:-latest} + container_name: arb-post-hearing-assistant-epyc-ui-server + depends_on: + - arbPostHearingAssistant-epyc-backend-server + ports: + - "${FRONTEND_SERVICE_PORT:-5173}:5173" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - BACKEND_SERVICE_ENDPOINT=${BACKEND_SERVICE_ENDPOINT} + - 
DOC_BASE_URL=${BACKEND_SERVICE_ENDPOINT} + ipc: host + restart: always + +networks: + default: + driver: bridge diff --git a/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/compose_tgi.yaml b/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/compose_tgi.yaml new file mode 100644 index 0000000000..cb6b8c9f48 --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/compose_tgi.yaml @@ -0,0 +1,86 @@ +# Copyright (C) 2025 Zensar Technologies Private Ltd. +# SPDX-License-Identifier: Apache-2.0 + +services: + tgi-server: + image: ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu + container_name: arb-post-hearing-assistant-epyc-tgi-server + ports: + - ${LLM_ENDPOINT_PORT:-8008}:80 + volumes: + - "${MODEL_CACHE:-./data}:/data" + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + TGI_LLM_ENDPOINT: ${TGI_LLM_ENDPOINT} + HF_TOKEN: ${HF_TOKEN} + MODEL_CACHE: ${MODEL_CACHE} + host_ip: ${host_ip} + healthcheck: + test: ["CMD-SHELL", "curl -f http://localhost:80/health || exit 1"] + interval: 10s + timeout: 10s + retries: 100 + shm_size: 1g + command: --model-id ${LLM_MODEL_ID} --cuda-graphs 0 --max-input-length ${MAX_INPUT_TOKENS} --max-total-tokens ${MAX_TOTAL_TOKENS} + + llm-arbPostHearingAssistant-tgi: + image: ${REGISTRY:-opea}/llm-arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-epyc-llm-server + depends_on: + tgi-server: + condition: service_healthy + ports: + - ${LLM_PORT:-9000}:9000 + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + LLM_ENDPOINT: ${LLM_ENDPOINT} + LLM_MODEL_ID: ${LLM_MODEL_ID} + HF_TOKEN: ${HF_TOKEN} + MODEL_CACHE: ${MODEL_CACHE} + MAX_INPUT_TOKENS: ${MAX_INPUT_TOKENS} + MAX_TOTAL_TOKENS: ${MAX_TOTAL_TOKENS} + OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME: ${OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME} + LOGFLAG: ${LOGFLAG:-False} + restart: unless-stopped + + arbPostHearingAssistant-epyc-backend-server: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-epyc-backend-server + depends_on: + - tgi-server + - llm-arbPostHearingAssistant-tgi + ports: + - "${BACKEND_SERVICE_PORT:-8888}:8888" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} + - LLM_SERVICE_HOST_IP=${LLM_SERVICE_HOST_IP} + ipc: host + restart: always + + arbPostHearingAssistant-gradio-ui: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant-gradio-ui:${TAG:-latest} + container_name: arb-post-hearing-assistant-epyc-ui-server + depends_on: + - arbPostHearingAssistant-epyc-backend-server + ports: + - "${FRONTEND_SERVICE_PORT:-5173}:5173" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - BACKEND_SERVICE_ENDPOINT=${BACKEND_SERVICE_ENDPOINT} + - DOC_BASE_URL=${BACKEND_SERVICE_ENDPOINT} + ipc: host + restart: always + +networks: + default: + driver: bridge diff --git a/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/install_docker.sh b/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/install_docker.sh new file mode 100644 index 0000000000..7a3b3a0a10 --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/install_docker.sh @@ -0,0 +1,37 @@ +#!/usr/bin/env bash + +# Copyright (C) 2025 Zensar Technologies Private Ltd. 
+# SPDX-License-Identifier: Apache-2.0 + +# Update the package index +sudo apt-get -y update + +# Install prerequisites +sudo apt-get -y install ca-certificates curl + +# Create the directory for the Docker GPG key +sudo install -m 0755 -d /etc/apt/keyrings + +# Add Docker's official GPG key +sudo curl -fsSL https://download.docker.com/linux/ubuntu/gpg -o /etc/apt/keyrings/docker.asc + +# Set permissions for the GPG key +sudo chmod a+r /etc/apt/keyrings/docker.asc + +# Add Docker repository to the sources list +echo "deb [arch=$(dpkg --print-architecture) signed-by=/etc/apt/keyrings/docker.asc] https://download.docker.com/linux/ubuntu \ + $(. /etc/os-release && echo "$VERSION_CODENAME") stable" | sudo tee /etc/apt/sources.list.d/docker.list > /dev/null + +# Update the package index with Docker packages +sudo apt-get -y update + +# Install Docker packages +sudo apt-get -y install docker-ce docker-ce-cli containerd.io docker-buildx-plugin docker-compose-plugin + +# Add the current user to the Docker group +sudo usermod -aG docker $USER + +# Optional: Verify that Docker is installed correctly +docker --version + +echo "Docker installation is complete. Log out and back in for the group changes to take effect." diff --git a/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/set_env.sh b/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/set_env.sh new file mode 100644 index 0000000000..9a8a24af82 --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/amd/cpu/epyc/set_env.sh @@ -0,0 +1,37 @@ +#!/usr/bin/env bash + +# Copyright (C) 2025 Advanced Micro Devices, Inc. +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +host_ip=$(hostname -I | awk '{print $1}') +export host_ip # Example: host_ip="192.168.1.1" + +export no_proxy="${no_proxy},${host_ip}" # Example: no_proxy="localhost,127.0.0.1,192.168.1.1" +export http_proxy=$http_proxy +export https_proxy=$https_proxy +export HF_TOKEN=${HF_TOKEN} + +export LLM_ENDPOINT_PORT=8008 +export LLM_MODEL_ID="mistralai/Mistral-7B-Instruct-v0.2" +export MAX_INPUT_TOKENS=1024 +export MAX_TOTAL_TOKENS=2048 + +export LLM_PORT=9000 +export LLM_SERVICE_PORT=9000 +export LLM_ENDPOINT="http://${host_ip}:${LLM_ENDPOINT_PORT}" +export OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME="OpeaArbPostHearingAssistantTgi" # OpeaArbPostHearingAssistantVllm +export FRONTEND_SERVICE_PORT=5173 +export MEGA_SERVICE_HOST_IP=${host_ip} +export LLM_SERVICE_HOST_IP=${host_ip} + +export BACKEND_SERVICE_PORT=8888 +export BACKEND_SERVICE_ENDPOINT="http://${host_ip}:${BACKEND_SERVICE_PORT}/v1/arb-post-hearing" + +export LOGFLAG=True +export MODEL_CACHE=${model_cache:-"./data"} + +export NUM_CARDS=1 +export BLOCK_SIZE=128 +export MAX_NUM_SEQS=256 +export MAX_SEQ_LEN_TO_CAPTURE=2048 diff --git a/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/README.md b/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/README.md new file mode 100644 index 0000000000..6261e8d280 --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/README.md @@ -0,0 +1,217 @@ +# Example Arbitration Post-Hearing Assistant deployments on AMD GPU (ROCm) + +This document outlines the deployment process for a Arbitration Post-Hearing Assistant application utilizing OPEA components on an AMD GPU server. 
+ +This example includes the following sections: + +- [Arbitration Post-Hearing Assistant Quick Start Deployment](#arb-post-hearing-assistant-quick-start-deployment): Demonstrates how to quickly deploy a Arbitration Post-Hearing Assistant application/pipeline on AMD GPU platform. +- [Arbitration Post-Hearing Assistant Docker Compose Files](#arb-post-hearing-assistant-docker-compose-files): Describes some example deployments and their docker compose files. +- [Arbitration Post-Hearing Assistant Detailed Usage](#arb-post-hearing-assistant-detailed-usage): Provide more detailed usage. +- [Launch the UI](#launch-the-ui): Guideline for UI usage + +## arb-post-hearing-assistant Quick Start Deployment + +This section describes how to quickly deploy and test the Arbitration Post-Hearing Assistant service manually on an AMD GPU platform. The basic steps are: + +1. [Access the Code](#access-the-code) +2. [Generate a HuggingFace Access Token](#generate-a-huggingface-access-token) +3. [Configure the Deployment Environment](#configure-the-deployment-environment) +4. [Deploy the Services Using Docker Compose](#deploy-the-services-using-docker-compose) +5. [Check the Deployment Status](#check-the-deployment-status) +6. [Test the Pipeline](#test-the-pipeline) +7. [Cleanup the Deployment](#cleanup-the-deployment) + +### Access the Code + +Clone the GenAIExample repository and access the Arbitration Post-Hearing Assistant AMD GPU platform Docker Compose files and supporting scripts: + +```bash +git clone https://github.com/opea-project/GenAIExamples.git +cd GenAIExamples/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm +``` + +### Generate a HuggingFace Access Token + +Some HuggingFace resources, such as some models, are only accessible if you have an access token. If you do not already have a HuggingFace access token, you can create one by first creating an account by following the steps provided at [HuggingFace](https://huggingface.co/) and then generating a [user access token](https://huggingface.co/docs/transformers.js/en/guides/private#step-1-generating-a-user-access-token). + +### Configure the Deployment Environment + +To set up environment variables for deploying Arbitration Post-Hearing Assistant services, set up some parameters specific to the deployment environment and source the `set_env_*.sh` script in this directory: + +- if used vLLM - set_env_vllm.sh +- if used TGI - set_env.sh + +Set the values of the variables: + +- **HOST_IP, HOST_IP_EXTERNAL** - These variables are used to configure the name/address of the service in the operating system environment for the application services to interact with each other and with the outside world. + + If your server uses only an internal address and is not accessible from the Internet, then the values for these two variables will be the same and the value will be equal to the server's internal name/address. + + If your server uses only an external, Internet-accessible address, then the values for these two variables will be the same and the value will be equal to the server's external name/address. + + If your server is located on an internal network, has an internal address, but is accessible from the Internet via a proxy/firewall/load balancer, then the HOST_IP variable will have a value equal to the internal name/address of the server, and the EXTERNAL_HOST_IP variable will have a value equal to the external name/address of the proxy/firewall/load balancer behind which the server is located. 
+
+  We set these values in the corresponding `set_env*.sh` file (`set_env.sh` for TGI, `set_env_vllm.sh` for vLLM).
+
+- **Variables with names ending in `_PORT`** - These variables set the IP port numbers used to establish network connections to the application services.
+  The values shown in `set_env.sh` and `set_env_vllm.sh` are the values used for development and testing of the application, configured for the environment in which development was performed. They must comply with the network access rules of your environment's server and must not overlap with IP ports already in use by other applications.
+
+Set the variables in the operating system environment:
+
+```bash
+export HF_TOKEN="Your_HuggingFace_API_Token"
+source ./set_env_*.sh # replace the script name with the appropriate one
+```
+
+Consult the section on [Arbitration Post-Hearing Assistant Service configuration](#arb-post-hearing-assistant-configuration) for information on how service-specific configuration parameters affect deployments.
+
+### Deploy the Services Using Docker Compose
+
+To deploy the Arbitration Post-Hearing Assistant services, execute the `docker compose up` command with the appropriate arguments. For a default deployment with TGI, execute the command below, which uses the `compose.yaml` file.
+
+```bash
+cd docker_compose/amd/gpu/rocm
+# if using TGI
+docker compose -f compose.yaml up -d
+# if using vLLM
+# docker compose -f compose_vllm.yaml up -d
+```
+
+To enable GPU support for AMD GPUs, the following configuration is added to the Docker Compose file:
+
+- `compose_vllm.yaml` - for the vLLM-based application
+- `compose.yaml` - for the TGI-based application
+
+```yaml
+shm_size: 1g
+devices:
+  - /dev/kfd:/dev/kfd
+  - /dev/dri:/dev/dri
+cap_add:
+  - SYS_PTRACE
+group_add:
+  - video
+security_opt:
+  - seccomp:unconfined
+```
+
+This configuration forwards all available GPUs to the container. To use a specific GPU, specify its `cardN` and `renderN` device IDs. For example:
+
+```yaml
+shm_size: 1g
+devices:
+  - /dev/kfd:/dev/kfd
+  - /dev/dri/card0:/dev/dri/card0
+  - /dev/dri/render128:/dev/dri/render128
+cap_add:
+  - SYS_PTRACE
+group_add:
+  - video
+security_opt:
+  - seccomp:unconfined
+```
+
+**How to Identify GPU Device IDs:**
+Use AMD GPU driver utilities to determine the correct `cardN` and `renderN` IDs for your GPU (a small helper sketch follows the note below).
+
+> **Note**: developers should build the Docker image from source when:
+>
+> - Developing off the git main branch (as the container's ports in the repo may differ from the published Docker image).
+> - Unable to download the Docker image.
+> - Using a specific version of the Docker image.
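+
+As a convenience for the "How to Identify GPU Device IDs" step above, the short sketch below lists the DRM device nodes present on the host and prints ready-to-paste `devices:` entries. It only assumes the standard `/dev/dri` layout and is not part of the shipped example; cross-check which node belongs to which GPU with AMD utilities such as `rocm-smi` before editing the compose file.
+
+```python
+# list_dri_nodes.py - list /dev/dri card/render nodes for the compose `devices:` section.
+from pathlib import Path
+
+
+def list_dri_nodes(dri_dir="/dev/dri"):
+    path = Path(dri_dir)
+    if not path.exists():
+        print(f"{dri_dir} not found - are the AMD GPU drivers installed?")
+        return
+    cards = sorted(p.name for p in path.iterdir() if p.name.startswith("card"))
+    renders = sorted(p.name for p in path.iterdir() if p.name.startswith("render"))
+    print("card nodes:  ", ", ".join(cards) or "none")
+    print("render nodes:", ", ".join(renders) or "none")
+    print("Example compose device entries:")
+    for name in cards + renders:
+        print(f"  - /dev/dri/{name}:/dev/dri/{name}")
+
+
+if __name__ == "__main__":
+    list_dri_nodes()
+```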
+ +Please refer to the table below to build different microservices from source: + +| Microservice | Deployment Guide | +| ------------------------------ | ----------------------------------------------------------------------------------------------------------------------------------------------------------- | +| TGI | [TGI project](https://github.com/huggingface/text-generation-inference.git) | +| vLLM | [vLLM build guide](https://github.com/opea-project/GenAIComps/tree/main/comps/third_parties/vllm#build-docker) | +| llm-arb-post-hearing-assistant | [LLM-ArbPostHearingAssistant build guide](https://github.com/opea-project/GenAIComps/tree/main/comps/arb_post_hearing_assistant/src/#12-build-docker-image) | +| MegaService | [MegaService build guide](../../../../README_miscellaneous.md#build-megaservice-docker-image) | +| UI | [Basic UI build guide](../../../../README_miscellaneous.md#build-ui-docker-image) | + +### Check the Deployment Status + +After running docker compose, check if all the containers launched via docker compose have started: + +``` +docker ps -a +``` + +For the default deployment, the following 4 containers should have started: + +If used TGI: + +```bash +CONTAINER ID IMAGE COMMAND CREATED STATUS PORTS NAMES +24bd78300413 opea/arb-post-hearing-assistant-gradio-ui:latest "python arb_post_hea…" 2 hours ago Up 2 hours 0.0.0.0:5173->5173/tcp, [::]:5173->5173/tcp arb-post-hearing-assistant-xeon-ui-server +59e60c954e26 opea/arb-post-hearing-assistant:latest "python arb_post_hea…" 2 hours ago Up 2 hours 0.0.0.0:8888->8888/tcp, [::]:8888->8888/tcp arb-post-hearing-assistant-xeon-backend-server +32afc12de996 opea/llm-arb-post-hearing-assistant:latest "python comps/arb_po…" 2 hours ago Up 2 hours 0.0.0.0:9000->9000/tcp, [::]:9000->9000/tcp arb-post-hearing-assistant-xeon-llm-server +c8e539360aff ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu "text-generation-lau…" 2 hours ago Up 2 hours (healthy) 0.0.0.0:8008->80/tcp, [::]:8008->80/tcp arb-post-hearing-assistant-xeon-tgi-server +``` + +### Test the Pipeline + +Once the Arbitration Post-Hearing Assistant services are running, test the pipeline using the following command: + +```bash +curl -X POST http://${host_ip}:8888/v1/arb-post-hearing \ + -H "Content-Type: application/json" \ + -d '{"type": "text", [10:00 AM] Arbitrator Hon. Rebecca Lawson: Good morning. This hearing is now in session for Case No. ARB/2025/0917. Lets begin with appearances. [10:01 AM] Attorney Michael Grant for Mr. Jonathan Reed: Good morning Your Honor. I represent the claimant Mr. Jonathan Reed. [10:01 AM] Attorney Lisa Chen for Ms. Rachel Morgan: Good morning. I represent the respondent Ms. Rachel Morgan. [10:03 AM] Arbitrator Hon. Rebecca Lawson: Thank you. Lets proceed with Mr. Reeds opening statement. [10:04 AM] Attorney Michael Grant: Ms. Morgan failed to deliver services as per the agreement dated March 15 2023. We have submitted relevant documentation including email correspondence and payment records. The delay caused substantial financial harm to our client. [10:15 AM] Attorney Lisa Chen: We deny any breach of contract. The delays were due to regulatory issues outside our control. Furthermore Mr. Reed did not provide timely approvals which contributed to the delay. [10:30 AM] Arbitrator Hon. Rebecca Lawson: Lets turn to Clause Z of the agreement. Id like both parties to submit written briefs addressing the applicability of the force majeure clause and the timeline of approvals. [11:00 AM] Attorney Michael Grant: Understood. 
Well submit by the deadline. [11:01 AM] Attorney Lisa Chen: Agreed. [11:02 AM] Arbitrator Hon. Rebecca Lawson: The next hearing is scheduled for October 22 2025 at 1030 AM Eastern Time. Please ensure your witnesses are available for cross examination. [4:45 PM] Arbitrator Hon. Rebecca Lawson: This session is adjourned. Thank you everyone.","max_tokens":2000,"language":"en"}' +``` + +**Note** The value of _host_ip_ was set using the _set_env.sh_ script and can be found in the _.env_ file. + +### Cleanup the Deployment + +To stop the containers associated with the deployment, execute the following command: + +```bash +docker compose -f compose.yaml down +``` + +All the Arbitration Post-Hearing Assistant containers will be stopped and then removed on completion of the "down" command. + +## arb-post-hearing-assistant Docker Compose Files + +In the context of deploying a Arbitration Post-Hearing Assistant pipeline on an AMD GPU platform, we can pick and choose different large language model serving frameworks. The table below outlines the various configurations that are available as part of the application. + +| File | Description | +| ---------------------------------------- | ------------------------------------------------------------------------------------------ | +| [compose.yaml](./compose.yaml) | Default compose file using tgi as serving framework | +| [compose_vllm.yaml](./compose_vllm.yaml) | The LLM serving framework is vLLM. All other configurations remain the same as the default | + +## arb-post-hearing-assistant Assistant Detailed Usage + +There are also some customized usage. + +### Query with text + +```bash +# form input. Use English mode (default). +curl http://${host_ip}:8888/v1/arb-post-hearing \ + -H "Content-Type: multipart/form-data" \ + -F "type=text" \ + -F "messages=[10:00 AM] Arbitrator Hon. Rebecca Lawson: Good morning. This hearing is now in session for Case No. ARB/2025/0917. Lets begin with appearances. [10:01 AM] Attorney Michael Grant for Mr. Jonathan Reed: Good morning Your Honor. I represent the claimant Mr. Jonathan Reed. [10:01 AM] Attorney Lisa Chen for Ms. Rachel Morgan: Good morning. I represent the respondent Ms. Rachel Morgan. [10:03 AM] Arbitrator Hon. Rebecca Lawson: Thank you. Lets proceed with Mr. Reeds opening statement. [10:04 AM] Attorney Michael Grant: Ms. Morgan failed to deliver services as per the agreement dated March 15 2023. We have submitted relevant documentation including email correspondence and payment records. The delay caused substantial financial harm to our client. [10:15 AM] Attorney Lisa Chen: We deny any breach of contract. The delays were due to regulatory issues outside our control. Furthermore Mr. Reed did not provide timely approvals which contributed to the delay. [10:30 AM] Arbitrator Hon. Rebecca Lawson: Lets turn to Clause Z of the agreement. Id like both parties to submit written briefs addressing the applicability of the force majeure clause and the timeline of approvals. [11:00 AM] Attorney Michael Grant: Understood. Well submit by the deadline. [11:01 AM] Attorney Lisa Chen: Agreed. [11:02 AM] Arbitrator Hon. Rebecca Lawson: The next hearing is scheduled for October 22 2025 at 1030 AM Eastern Time. Please ensure your witnesses are available for cross examination. [4:45 PM] Arbitrator Hon. Rebecca Lawson: This session is adjourned. Thank you everyone." 
\ + -F "max_tokens=2000" \ + -F "language=en" + +## Launch the UI + +### Gradio UI + +Open this URL `http://{host_ip}:5173` in your browser to access the Gradio based frontend. +![project-screenshot](../../../../assets/img/arbritation_post_hearing_ui_gradio_text.png) + +### Profile Microservices + +To further analyze MicroService Performance, users could follow the instructions to profile MicroServices. + +#### 1. vLLM backend Service + +Users could follow previous section to testing vLLM microservice or Arbitration Post-Hearing Assistant MegaService. By default, vLLM profiling is not enabled. Users could start and stop profiling by following commands. + +## Conclusion + +This guide should enable developer to deploy the default configuration or any of the other compose yaml files for different configurations. It also highlights the configurable parameters that can be set before deployment. +``` diff --git a/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/compose.yaml b/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/compose.yaml new file mode 100644 index 0000000000..833cd25bc4 --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/compose.yaml @@ -0,0 +1,96 @@ +# Copyright (C) 2025 Zensar Technologies Private Ltd. +# SPDX-License-Identifier: Apache-2.0 + +services: + arbPostHearingAssistant-tgi-service: + image: ghcr.io/huggingface/text-generation-inference:2.4.1-rocm + container_name: arb-post-hearing-assistant-tgi-service + ports: + - "${ARB_POSTHEARING_ASSISTANT_TGI_SERVICE_PORT:-8008}:80" + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + TGI_LLM_ENDPOINT: "http://${HOST_IP}:${ARB_POSTHEARING_ASSISTANT_TGI_SERVICE_PORT}" + HF_TOKEN: ${ARB_POSTHEARING_ASSISTANT_HUGGINGFACEHUB_API_TOKEN} + host_ip: ${host_ip} + ARB_POSTHEARING_ASSISTANT_TGI_SERVICE_PORT: ${ARB_POSTHEARING_ASSISTANT_TGI_SERVICE_PORT} + volumes: + - "${MODEL_CACHE:-./data}:/data" + shm_size: 20g + devices: + - /dev/kfd:/dev/kfd + - /dev/dri/:/dev/dri/ + cap_add: + - SYS_PTRACE + group_add: + - video + security_opt: + - seccomp:unconfined + ipc: host + healthcheck: + test: ["CMD-SHELL", "curl -f http://${host_ip}:${ARB_POSTHEARING_ASSISTANT_TGI_SERVICE_PORT}/health || exit 1"] + interval: 10s + timeout: 10s + retries: 100 + command: --model-id ${ARB_POSTHEARING_ASSISTANT_LLM_MODEL_ID} --max-input-length ${ARB_POSTHEARING_ASSISTANT_MAX_INPUT_TOKENS} --max-total-tokens ${ARB_POSTHEARING_ASSISTANT_MAX_TOTAL_TOKENS} + + arbPostHearingAssistant-llm-server: + image: ${REGISTRY:-opea}/llm-arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-llm-server + depends_on: + arbPostHearingAssistant-tgi-service: + condition: service_healthy + ports: + - "${ARB_POSTHEARING_ASSISTANT_LLM_SERVER_PORT}:9000" + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + LLM_ENDPOINT: ${ARB_POSTHEARING_ASSISTANT_TGI_LLM_ENDPOINT} + HF_TOKEN: ${ARB_POSTHEARING_ASSISTANT_HUGGINGFACEHUB_API_TOKEN} + MAX_INPUT_TOKENS: ${ARB_POSTHEARING_ASSISTANT_MAX_INPUT_TOKENS} + MAX_TOTAL_TOKENS: ${ARB_POSTHEARING_ASSISTANT_MAX_TOTAL_TOKENS} + LLM_MODEL_ID: ${ARB_POSTHEARING_ASSISTANT_LLM_MODEL_ID} + OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME: "OpeaArbPostHearingAssistantTgi" + LOGFLAG: ${LOGFLAG:-False} + restart: unless-stopped + + arbPostHearingAssistant-backend-server: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-backend-server + 
depends_on: + - arbPostHearingAssistant-tgi-service + - arbPostHearingAssistant-llm-server + ports: + - "${ARB_POSTHEARING_ASSISTANT_BACKEND_SERVER_PORT}:8888" + environment: + no_proxy: ${no_proxy} + https_proxy: ${https_proxy} + http_proxy: ${http_proxy} + MEGA_SERVICE_HOST_IP: ${HOST_IP} + LLM_SERVICE_HOST_IP: ${HOST_IP} + LLM_SERVICE_PORT: ${ARB_POSTHEARING_ASSISTANT_LLM_SERVER_PORT} + ipc: host + restart: always + + arbPostHearingAssistant-gradio-ui: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant-gradio-ui:${TAG:-latest} + container_name: arb-post-hearing-assistant-ui-server + depends_on: + - arbPostHearingAssistant-backend-server + ports: + - "5173:5173" + environment: + no_proxy: ${no_proxy} + https_proxy: ${https_proxy} + http_proxy: ${http_proxy} + BACKEND_SERVICE_ENDPOINT: ${BACKEND_SERVICE_ENDPOINT} + DOC_BASE_URL: ${BACKEND_SERVICE_ENDPOINT} + ipc: host + restart: always + +networks: + default: + driver: bridge diff --git a/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/compose_vllm.yaml b/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/compose_vllm.yaml new file mode 100644 index 0000000000..4884644117 --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/compose_vllm.yaml @@ -0,0 +1,97 @@ +# Copyright (C) 2025 Zensar Technologies Private Ltd. +# SPDX-License-Identifier: Apache-2.0 + +services: + arbPostHearingAssistant-vllm-service: + image: ${REGISTRY:-opea}/vllm-rocm:${TAG:-latest} + container_name: arb-post-hearing-assistant-vllm-service + ports: + - "${ARB_POSTHEARING_ASSISTANT_VLLM_SERVICE_PORT:-8081}:8011" + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + HF_TOKEN: ${HF_TOKEN} + HF_HUB_DISABLE_PROGRESS_BARS: 1 + HF_HUB_ENABLE_HF_TRANSFER: 0 + VLLM_USE_TRITON_FLASH_ATTENTION: 0 + PYTORCH_JIT: 0 + healthcheck: + test: [ "CMD-SHELL", "curl -f http://${HOST_IP}:${ARB_POSTHEARING_ASSISTANT_VLLM_SERVICE_PORT:-8081}/health || exit 1" ] + interval: 10s + timeout: 10s + retries: 100 + volumes: + - "${MODEL_CACHE:-./data}:/data" + shm_size: 20G + devices: + - /dev/kfd:/dev/kfd + - /dev/dri/:/dev/dri/ + cap_add: + - SYS_PTRACE + group_add: + - video + security_opt: + - seccomp:unconfined + - apparmor=unconfined + command: "--model ${ARB_POSTHEARING_ASSISTANT_LLM_MODEL_ID} --swap-space 16 --disable-log-requests --dtype float16 --tensor-parallel-size 4 --host 0.0.0.0 --port 8011 --num-scheduler-steps 1 --distributed-executor-backend \"mp\"" + ipc: host + + arbPostHearingAssistant-llm-server: + image: ${REGISTRY:-opea}/llm-arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-llm-server + depends_on: + arbPostHearingAssistant-vllm-service: + condition: service_healthy + ports: + - "${ARB_POSTHEARING_ASSISTANT_LLM_SERVER_PORT}:9000" + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + LLM_ENDPOINT: ${ARB_POSTHEARING_ASSISTANT_LLM_ENDPOINT} + HF_TOKEN: ${ARB_POSTHEARING_ASSISTANT_HUGGINGFACEHUB_API_TOKEN} + MAX_INPUT_TOKENS: ${ARB_POSTHEARING_ASSISTANT_MAX_INPUT_TOKENS} + MAX_TOTAL_TOKENS: ${ARB_POSTHEARING_ASSISTANT_MAX_TOTAL_TOKENS} + LLM_MODEL_ID: ${ARB_POSTHEARING_ASSISTANT_LLM_MODEL_ID} + OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME: "OpeaArbPostHearingAssistantVllm" + LOGFLAG: ${LOGFLAG:-False} + restart: unless-stopped + + arbPostHearingAssistant-backend-server: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-backend-server + depends_on: + - 
arbPostHearingAssistant-vllm-service + - arbPostHearingAssistant-llm-server + ports: + - "${ARB_POSTHEARING_ASSISTANT_BACKEND_SERVER_PORT}:8888" + environment: + no_proxy: ${no_proxy} + https_proxy: ${https_proxy} + http_proxy: ${http_proxy} + MEGA_SERVICE_HOST_IP: ${HOST_IP} + LLM_SERVICE_HOST_IP: ${HOST_IP} + ipc: host + restart: always + + arbPostHearingAssistant-gradio-ui: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant-gradio-ui:${TAG:-latest} + container_name: arb-post-hearing-assistant-ui-server + depends_on: + - arbPostHearingAssistant-backend-server + ports: + - "${ARB_POSTHEARING_ASSISTANT_FRONTEND_PORT:-5173}:5173" + environment: + no_proxy: ${no_proxy} + https_proxy: ${https_proxy} + http_proxy: ${http_proxy} + BACKEND_SERVICE_ENDPOINT: ${BACKEND_SERVICE_ENDPOINT} + DOC_BASE_URL: ${BACKEND_SERVICE_ENDPOINT} + ipc: host + restart: always + +networks: + default: + driver: bridge diff --git a/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/set_env.sh b/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/set_env.sh new file mode 100644 index 0000000000..330cacca9f --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/set_env.sh @@ -0,0 +1,16 @@ +#!/usr/bin/env bash + +# Copyright (C) 2025 Zensar Technologies Private Ltd. +# SPDX-License-Identifier: Apache-2.0 + +export HOST_IP=${ip_address} +export ARB_POSTHEARING_ASSISTANT_MAX_INPUT_TOKENS="2048" +export ARB_POSTHEARING_ASSISTANT_MAX_TOTAL_TOKENS="4096" +export ARB_POSTHEARING_ASSISTANT_LLM_MODEL_ID="mistralai/Mistral-7B-Instruct-v0.2" +export ARB_POSTHEARING_ASSISTANT_TGI_SERVICE_PORT="8008" +export ARB_POSTHEARING_ASSISTANT_TGI_LLM_ENDPOINT="http://${HOST_IP}:${ARB_POSTHEARING_ASSISTANT_TGI_SERVICE_PORT}" +export HF_TOKEN=${HF_TOKEN} +export ARB_POSTHEARING_ASSISTANT_LLM_SERVER_PORT="9000" +export ARB_POSTHEARING_ASSISTANT_BACKEND_SERVER_PORT="18072" +export ARB_POSTHEARING_ASSISTANT_FRONTEND_PORT="18073" +export BACKEND_SERVICE_ENDPOINT="http://${HOST_IP}:${ARB_POSTHEARING_ASSISTANT_BACKEND_SERVER_PORT}/v1/arb-post-hearing" diff --git a/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/set_env_vllm.sh b/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/set_env_vllm.sh new file mode 100644 index 0000000000..7ea62528f4 --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/amd/gpu/rocm/set_env_vllm.sh @@ -0,0 +1,16 @@ +#!/usr/bin/env bash + +# Copyright (C) 2025 Zensar Technologies Private Ltd. 
+# SPDX-License-Identifier: Apache-2.0 + +export HOST_IP=${ip_address} +export HF_TOKEN=${HF_TOKEN} +export ARB_POSTHEARING_ASSISTANT_MAX_INPUT_TOKENS=2048 +export ARB_POSTHEARING_ASSISTANT_MAX_TOTAL_TOKENS=4096 +export ARB_POSTHEARING_ASSISTANT_LLM_MODEL_ID="mistralai/Mistral-7B-Instruct-v0.2" +export ARB_POSTHEARING_ASSISTANT_VLLM_SERVICE_PORT="8008" +export ARB_POSTHEARING_ASSISTANT_LLM_ENDPOINT="http://${HOST_IP}:${ARB_POSTHEARING_ASSISTANT_VLLM_SERVICE_PORT}" +export ARB_POSTHEARING_ASSISTANT_LLM_SERVER_PORT="9000" +export ARB_POSTHEARING_ASSISTANT_BACKEND_SERVER_PORT="18072" +export ARB_POSTHEARING_ASSISTANT_FRONTEND_PORT="18073" +export BACKEND_SERVICE_ENDPOINT="http://${HOST_IP}:${ARB_POSTHEARING_ASSISTANT_BACKEND_SERVER_PORT}/v1/arb-post-hearing" diff --git a/ArbPostHearingAssistant/docker_compose/intel/cpu/xeon/README.md b/ArbPostHearingAssistant/docker_compose/intel/cpu/xeon/README.md new file mode 100644 index 0000000000..c82ba63ced --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/intel/cpu/xeon/README.md @@ -0,0 +1,176 @@ +# Example Arbitration Post-Hearing Assistant deployments on Intel Xeon Processor + +This document outlines the deployment process for a Arbitration Post-Hearing Assistant application utilizing OPEA components on an Intel Xeon server. + +This example includes the following sections: + +- [Arbitration Post-Hearing Assistant Quick Start Deployment](#arb-post-hearing-assistant-quick-start-deployment): Demonstrates how to quickly deploy a Arbitration Post-Hearing Assistant application/pipeline on Intel Xeon platform. +- [Arbitration Post-Hearing Assistant Docker Compose Files](#arb-post-hearing-assistant-docker-compose-files): Describes some example deployments and their docker compose files. +- [Arbitration Post-Hearing Assistant Detailed Usage](#arb-post-hearing-assistant-detailed-usage): Provide more detailed usage. +- [Launch the UI](#launch-the-ui): Guideline for UI usage + +## arb-post-hearing-assistant Quick Start Deployment + +This section describes how to quickly deploy and test the Arbitration Post-Hearing Assistant service manually on an Intel Xeon platform. 
The basic steps are: + +- [Example Arbitration Post-Hearing Assistant deployments on Intel Xeon Processor](#example-arbitration-post-hearing-assistant-deployments-on-intel-xeon-processor) + - [arb-post-hearing-assistant Quick Start Deployment](#arb-post-hearing-assistant-quick-start-deployment) + - [Access the Code and Set Up Environment](#access-the-code-and-set-up-environment) + - [Generate a HuggingFace Access Token](#generate-a-huggingface-access-token) + - [Deploy the Services Using Docker Compose](#deploy-the-services-using-docker-compose) + - [Check the Deployment Status](#check-the-deployment-status) + - [Test the Pipeline](#test-the-pipeline) + - [Cleanup the Deployment](#cleanup-the-deployment) + - [arb-post-hearing-assistant Docker Compose Files](#arb-post-hearing-assistant-docker-compose-files) + - [Running LLM models with remote endpoints](#running-llm-models-with-remote-endpoints) + - [arb-post-hearing-assistant Detailed Usage](#arb-post-hearing-assistant-detailed-usage) + - [Query with text](#query-with-text) + +### Access the Code and Set Up Environment + +Clone the GenAIExample repository and access the Arbitration Post-Hearing Assistant Intel Xeon platform Docker Compose files and supporting scripts: + +```bash +git clone https://github.com/opea-project/GenAIExamples.git +cd GenAIExamples/ArbPostHearingAssistant/docker_compose +source intel/set_env.sh +``` + +> NOTE: by default vLLM does "warmup" at start, to optimize its performance for the specified model and the underlying platform, which can take long time. For development (and e.g. autoscaling) it can be skipped with `export VLLM_SKIP_WARMUP=true`. + +> NOTE: If any port on your local machine is occupied (like `9000/8008/8888`, etc.), modify it in `set_env.sh`, then run `source set_env.sh` again. + +### Generate a HuggingFace Access Token + +Some HuggingFace resources, such as some models, are only accessible if you have an access token. If you do not already have a HuggingFace access token, you can create one by first creating an account by following the steps provided at [HuggingFace](https://huggingface.co/) and then generating a [user access token](https://huggingface.co/docs/transformers.js/en/guides/private#step-1-generating-a-user-access-token). + +### Deploy the Services Using Docker Compose + +To deploy the Arbitration Post-Hearing Assistant services, execute the `docker compose up` command with the appropriate arguments. For a default deployment, execute: + +```bash +cd intel/cpu/xeon/ +docker compose up -d +``` + +**Note**: developers should build docker image from source when: + +- Developing off the git main branch (as the container's ports in the repo may be different from the published docker image). +- Unable to download the docker image. +- Use a specific version of Docker image. 
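+
+Besides the curl command shown in the "Test the Pipeline" section below, the megaservice endpoint can also be exercised from Python. The sketch below is not part of the shipped example; it assumes the default `BACKEND_SERVICE_PORT` (8888) from `set_env.sh` and uses only the request fields documented in this guide (`type`, `messages`, `max_tokens`, `language`).
+
+```python
+# query_arb_post_hearing.py - minimal client sketch for the megaservice endpoint.
+import json
+import os
+import urllib.request
+
+HOST_IP = os.environ.get("host_ip", "localhost")
+URL = f"http://{HOST_IP}:8888/v1/arb-post-hearing"
+
+payload = {
+    "type": "text",
+    "messages": "[10:00 AM] Arbitrator Hon. Rebecca Lawson: Good morning. "
+    "This hearing is now in session for Case No. ARB/2025/0917. ...",
+    "max_tokens": 2000,
+    "language": "en",
+}
+
+req = urllib.request.Request(
+    URL,
+    data=json.dumps(payload).encode("utf-8"),
+    headers={"Content-Type": "application/json"},
+    method="POST",
+)
+with urllib.request.urlopen(req, timeout=600) as resp:
+    body = json.loads(resp.read().decode("utf-8"))
+    # The backend returns an OpenAI-style ChatCompletionResponse; print the summary text.
+    print(body["choices"][0]["message"]["content"])
+```
+
+Replace the truncated `messages` string with the full hearing transcript you want summarized.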
+ +Please refer to the table below to build different microservices from source: + +| Microservice | Deployment Guide | +| ------------------------------ | ----------------------------------------------------------------------------------------------------------------------------------------------------------- | +| vLLM | [vLLM build guide](https://github.com/opea-project/GenAIComps/tree/main/comps/third_parties/vllm#build-docker) | +| llm-arb-post-hearing-assistant | [LLM-ArbPostHearingAssistant build guide](https://github.com/opea-project/GenAIComps/tree/main/comps/arb_post_hearing_assistant/src/#12-build-docker-image) | +| MegaService | [MegaService build guide](../../../../README_miscellaneous.md#build-megaservice-docker-image) | +| UI | [Basic UI build guide](../../../../README_miscellaneous.md#build-ui-docker-image) | + +### Check the Deployment Status + +After running docker compose, to check if all the containers launched via docker compose have started: + +```bash +docker ps -a +``` + +For the default deployment, the following 4 containers should be running: + +```bash +CONTAINER ID IMAGE COMMAND CREATED STATUS PORTS NAMES +24bd78300413 opea/arb-post-hearing-assistant-gradio-ui:latest "python arb_post_hea…" 2 hours ago Up 2 hours 0.0.0.0:5173->5173/tcp, [::]:5173->5173/tcp arb-post-hearing-assistant-xeon-ui-server +59e60c954e26 opea/arb-post-hearing-assistant:latest "python arb_post_hea…" 2 hours ago Up 2 hours 0.0.0.0:8888->8888/tcp, [::]:8888->8888/tcp arb-post-hearing-assistant-xeon-backend-server +32afc12de996 opea/llm-arb-post-hearing-assistant:latest "python comps/arb_po…" 2 hours ago Up 2 hours 0.0.0.0:9000->9000/tcp, [::]:9000->9000/tcp arb-post-hearing-assistant-xeon-llm-server +c8e539360aff ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu "text-generation-lau…" 2 hours ago Up 2 hours (healthy) 0.0.0.0:8008->80/tcp, [::]:8008->80/tcp arb-post-hearing-assistant-xeon-tgi-server +``` + +### Test the Pipeline + +Once the Arbitration Post-Hearing Assistant services are running, test the pipeline using the following command: + +```bash +curl -X POST http://${host_ip}:8888/v1/arb-post-hearing \ + -H "Content-Type: application/json" \ + -d '{"type": "text", [10:00 AM] Arbitrator Hon. Rebecca Lawson: Good morning. This hearing is now in session for Case No. ARB/2025/0917. Lets begin with appearances. [10:01 AM] Attorney Michael Grant for Mr. Jonathan Reed: Good morning Your Honor. I represent the claimant Mr. Jonathan Reed. [10:01 AM] Attorney Lisa Chen for Ms. Rachel Morgan: Good morning. I represent the respondent Ms. Rachel Morgan. [10:03 AM] Arbitrator Hon. Rebecca Lawson: Thank you. Lets proceed with Mr. Reeds opening statement. [10:04 AM] Attorney Michael Grant: Ms. Morgan failed to deliver services as per the agreement dated March 15 2023. We have submitted relevant documentation including email correspondence and payment records. The delay caused substantial financial harm to our client. [10:15 AM] Attorney Lisa Chen: We deny any breach of contract. The delays were due to regulatory issues outside our control. Furthermore Mr. Reed did not provide timely approvals which contributed to the delay. [10:30 AM] Arbitrator Hon. Rebecca Lawson: Lets turn to Clause Z of the agreement. Id like both parties to submit written briefs addressing the applicability of the force majeure clause and the timeline of approvals. [11:00 AM] Attorney Michael Grant: Understood. Well submit by the deadline. [11:01 AM] Attorney Lisa Chen: Agreed. [11:02 AM] Arbitrator Hon. 
Rebecca Lawson: The next hearing is scheduled for October 22 2025 at 1030 AM Eastern Time. Please ensure your witnesses are available for cross examination. [4:45 PM] Arbitrator Hon. Rebecca Lawson: This session is adjourned. Thank you everyone.","max_tokens":2000,"language":"en"}' +``` + +**Note** The value of _host_ip_ was set using the _set_env.sh_ script and can be found in the _.env_ file. + +### Cleanup the Deployment + +To stop the containers associated with the deployment, execute the following command: + +```bash +docker compose -f compose.yaml down +``` + +All the Arbitration Post-Hearing Assistant containers will be stopped and then removed on completion of the "down" command. + +## arb-post-hearing-assistant Docker Compose Files + +In the context of deploying a arb-post-hearing-assistant pipeline on an Intel® Xeon® platform, we can pick and choose different large language model serving frameworks. The table below outlines the various configurations that are available as part of the application. + +| File | Description | +| -------------------------------------------- | -------------------------------------------------------------------------------------- | +| [compose.yaml](./compose.yaml) | Default compose file using vllm as serving framework | +| [compose_tgi.yaml](./compose_tgi.yaml) | The LLM serving framework is TGI. All other configurations remain the same as default | +| [compose_remote.yaml](./compose_remote.yaml) | Uses remote inference endpoints for LLMs. All other configurations are same as default | + +### Running LLM models with remote endpoints + +When models are deployed on a remote server, a base URL and an API key are required to access them. To set up a remote server and acquire the base URL and API key, refer to [Intel® AI for Enterprise Inference](https://www.intel.com/content/www/us/en/developer/topic-technology/artificial-intelligence/enterprise-inference.html) offerings. + +Set the following environment variables. + +- `REMOTE_ENDPOINT` is the HTTPS endpoint of the remote server with the model of choice (i.e. https://api.example.com). **Note:** If the API for the models does not use LiteLLM, the second part of the model card needs to be appended to the URL. For example, set `REMOTE_ENDPOINT` to https://api.example.com/Llama-3.3-70B-Instruct if the model card is `meta-llama/Llama-3.3-70B-Instruct`. +- `API_KEY` is the access token or key to access the model(s) on the server. +- `LLM_MODEL_ID` is the model card which may need to be overwritten depending on what it is set to `set_env.sh`. + +```bash +export REMOTE_ENDPOINT= +export API_KEY= +export LLM_MODEL_ID= +``` + +After setting these environment variables, run `docker compose` with `compose_remote.yaml`: + +```bash +docker compose -f compose_remote.yaml up -d +``` + +## arb-post-hearing-assistant Detailed Usage + +There are also some customized usage. + +### Query with text + +```bash +# form input. Use English mode (default). +curl http://${host_ip}:8888/v1/arb-post-hearing \ + -H "Content-Type: application/json" \ + -F "type=text" \ + -F "messages=[10:00 AM] Arbitrator Hon. Rebecca Lawson: Good morning. This hearing is now in session for Case No. ARB/2025/0917. Lets begin with appearances. [10:01 AM] Attorney Michael Grant for Mr. Jonathan Reed: Good morning Your Honor. I represent the claimant Mr. Jonathan Reed. [10:01 AM] Attorney Lisa Chen for Ms. Rachel Morgan: Good morning. I represent the respondent Ms. Rachel Morgan. [10:03 AM] Arbitrator Hon. Rebecca Lawson: Thank you. Lets proceed with Mr. 
Reeds opening statement. [10:04 AM] Attorney Michael Grant: Ms. Morgan failed to deliver services as per the agreement dated March 15 2023. We have submitted relevant documentation including email correspondence and payment records. The delay caused substantial financial harm to our client. [10:15 AM] Attorney Lisa Chen: We deny any breach of contract. The delays were due to regulatory issues outside our control. Furthermore Mr. Reed did not provide timely approvals which contributed to the delay. [10:30 AM] Arbitrator Hon. Rebecca Lawson: Lets turn to Clause Z of the agreement. Id like both parties to submit written briefs addressing the applicability of the force majeure clause and the timeline of approvals. [11:00 AM] Attorney Michael Grant: Understood. Well submit by the deadline. [11:01 AM] Attorney Lisa Chen: Agreed. [11:02 AM] Arbitrator Hon. Rebecca Lawson: The next hearing is scheduled for October 22 2025 at 1030 AM Eastern Time. Please ensure your witnesses are available for cross examination. [4:45 PM] Arbitrator Hon. Rebecca Lawson: This session is adjourned. Thank you everyone." \
+  -F "max_tokens=2000" \
+  -F "language=en"
+```
+
+## Launch the UI
+
+### Gradio UI
+
+Open this URL `http://{host_ip}:5173` in your browser to access the Gradio-based frontend.
+![project-screenshot](../../../../assets/img/arbritation_post_hearing_ui_gradio_text.png)
+
+### Profile Microservices
+
+To further analyze microservice performance, users can profile the individual microservices as described below.
+
+#### 1. vLLM backend Service
+
+Users can follow the previous sections to exercise the vLLM microservice or the Arbitration Post-Hearing Assistant MegaService. By default, vLLM profiling is not enabled. Because the compose files set `VLLM_TORCH_PROFILER_DIR` for the vLLM service, profiling can be started and stopped through vLLM's `/start_profile` and `/stop_profile` endpoints; refer to the vLLM documentation for details.
+
+## Conclusion
+
+This guide should enable developers to deploy the default configuration or any of the other compose YAML files for different configurations. It also highlights the configurable parameters that can be set before deployment.
diff --git a/ArbPostHearingAssistant/docker_compose/intel/cpu/xeon/compose.yaml b/ArbPostHearingAssistant/docker_compose/intel/cpu/xeon/compose.yaml
new file mode 100644
index 0000000000..954a78adc2
--- /dev/null
+++ b/ArbPostHearingAssistant/docker_compose/intel/cpu/xeon/compose.yaml
@@ -0,0 +1,86 @@
+# Copyright (C) 2025 Zensar Technologies Private Ltd.
+# SPDX-License-Identifier: Apache-2.0 + +services: + vllm-service: + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 + container_name: arb-post-hearing-assistant-xeon-vllm-service + ports: + - ${LLM_ENDPOINT_PORT:-8008}:80 + volumes: + - "${MODEL_CACHE:-./data}:/root/.cache/huggingface/hub" + shm_size: 1g + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + HF_TOKEN: ${HF_TOKEN} + LLM_MODEL_ID: ${LLM_MODEL_ID} + VLLM_TORCH_PROFILER_DIR: "/mnt" + VLLM_CPU_KVCACHE_SPACE: 40 + healthcheck: + test: ["CMD-SHELL", "curl -f http://localhost:80/health || exit 1"] + interval: 10s + timeout: 10s + retries: 100 + command: --model $LLM_MODEL_ID --host 0.0.0.0 --port 80 + + llm-arbPostHearingAssistant-vllm: + image: ${REGISTRY:-opea}/llm-arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-xeon-llm-server + depends_on: + vllm-service: + condition: service_healthy + ports: + - ${LLM_PORT:-9000}:9000 + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + LLM_ENDPOINT: ${LLM_ENDPOINT} + LLM_MODEL_ID: ${LLM_MODEL_ID} + HF_TOKEN: ${HF_TOKEN} + MAX_INPUT_TOKENS: ${MAX_INPUT_TOKENS} + MAX_TOTAL_TOKENS: ${MAX_TOTAL_TOKENS} + OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME: ${OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME} + LOGFLAG: ${LOGFLAG:-False} + restart: unless-stopped + + arbPostHearingAssistant-xeon-backend-server: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-xeon-backend-server + depends_on: + - vllm-service + - llm-arbPostHearingAssistant-vllm + ports: + - "${BACKEND_SERVICE_PORT:-8888}:8888" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} + - LLM_SERVICE_HOST_IP=${LLM_SERVICE_HOST_IP} + - LLM_SERVICE_PORT=${LLM_PORT} + ipc: host + restart: always + + arbPostHearingAssistant-gradio-ui: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant-gradio-ui:${TAG:-latest} + container_name: arb-post-hearing-assistant-xeon-ui-server + depends_on: + - arbPostHearingAssistant-xeon-backend-server + ports: + - "${FRONTEND_SERVICE_PORT:-5173}:5173" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - BACKEND_SERVICE_ENDPOINT=${BACKEND_SERVICE_ENDPOINT} + - DOC_BASE_URL=${BACKEND_SERVICE_ENDPOINT} + ipc: host + restart: always + +networks: + default: + driver: bridge diff --git a/ArbPostHearingAssistant/docker_compose/intel/cpu/xeon/compose_remote.yaml b/ArbPostHearingAssistant/docker_compose/intel/cpu/xeon/compose_remote.yaml new file mode 100644 index 0000000000..a9726b2df4 --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/intel/cpu/xeon/compose_remote.yaml @@ -0,0 +1,61 @@ +# Copyright (C) 2025 Zensar Technologies Private Ltd. 
+# SPDX-License-Identifier: Apache-2.0 + +services: + llm-arbPostHearingAssistant-vllm: + image: ${REGISTRY:-opea}/llm-arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-xeon-llm-server + ports: + - ${LLM_PORT:-9000}:9000 + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + LLM_ENDPOINT: ${REMOTE_ENDPOINT} + LLM_MODEL_ID: ${LLM_MODEL_ID} + OPENAI_API_KEY: ${API_KEY} + HUGGINGFACEHUB_API_TOKEN: ${HF_TOKEN} + HF_TOKEN: ${HF_TOKEN} + MAX_INPUT_TOKENS: ${MAX_INPUT_TOKENS} + MAX_TOTAL_TOKENS: ${MAX_TOTAL_TOKENS} + OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME: ${OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME} + + LOGFLAG: ${LOGFLAG:-False} + restart: unless-stopped + + arbPostHearingAssistant-xeon-backend-server: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-xeon-backend-server + depends_on: + - llm-arbPostHearingAssistant-vllm + ports: + - "${BACKEND_SERVICE_PORT:-8888}:8888" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} + - LLM_SERVICE_HOST_IP=${LLM_SERVICE_HOST_IP} + ipc: host + restart: always + + arbPostHearingAssistant-gradio-ui: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant-gradio-ui:${TAG:-latest} + container_name: arb-post-hearing-assistant-xeon-ui-server + depends_on: + - arbPostHearingAssistant-xeon-backend-server + ports: + - "${FRONTEND_SERVICE_PORT:-5173}:5173" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - BACKEND_SERVICE_ENDPOINT=${BACKEND_SERVICE_ENDPOINT} + - DOC_BASE_URL=${BACKEND_SERVICE_ENDPOINT} + ipc: host + restart: always + +networks: + default: + driver: bridge diff --git a/ArbPostHearingAssistant/docker_compose/intel/cpu/xeon/compose_tgi.yaml b/ArbPostHearingAssistant/docker_compose/intel/cpu/xeon/compose_tgi.yaml new file mode 100644 index 0000000000..fe0d31388f --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/intel/cpu/xeon/compose_tgi.yaml @@ -0,0 +1,85 @@ +# Copyright (C) 2025 Zensar Technologies Private Ltd. 
+# SPDX-License-Identifier: Apache-2.0 + +services: + tgi-server: + image: ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu + container_name: arb-post-hearing-assistant-xeon-tgi-server + ports: + - ${LLM_ENDPOINT_PORT:-8008}:80 + volumes: + - "${MODEL_CACHE:-./data}:/data" + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + TGI_LLM_ENDPOINT: ${TGI_LLM_ENDPOINT} + HF_TOKEN: ${HF_TOKEN} + host_ip: ${host_ip} + healthcheck: + test: ["CMD-SHELL", "curl -f http://localhost:80/health || exit 1"] + interval: 10s + timeout: 10s + retries: 100 + shm_size: 1g + command: --model-id ${LLM_MODEL_ID} --cuda-graphs 0 --max-input-length ${MAX_INPUT_TOKENS} --max-total-tokens ${MAX_TOTAL_TOKENS} + + llm-arbPostHearingAssistant-tgi: + image: ${REGISTRY:-opea}/llm-arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-xeon-llm-server + depends_on: + tgi-server: + condition: service_healthy + ports: + - ${LLM_PORT:-9000}:9000 + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + LLM_ENDPOINT: ${LLM_ENDPOINT} + LLM_MODEL_ID: ${LLM_MODEL_ID} + HF_TOKEN: ${HF_TOKEN} + MAX_INPUT_TOKENS: ${MAX_INPUT_TOKENS} + MAX_TOTAL_TOKENS: ${MAX_TOTAL_TOKENS} + OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME: ${OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME} + LOGFLAG: ${LOGFLAG:-False} + restart: unless-stopped + + arbPostHearingAssistant-xeon-backend-server: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-xeon-backend-server + depends_on: + - tgi-server + - llm-arbPostHearingAssistant-tgi + ports: + - "${BACKEND_SERVICE_PORT:-8888}:8888" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} + - LLM_SERVICE_HOST_IP=${LLM_SERVICE_HOST_IP} + - LLM_SERVICE_PORT=${LLM_PORT} + ipc: host + restart: always + + arbPostHearingAssistant-gradio-ui: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant-gradio-ui:${TAG:-latest} + container_name: arb-post-hearing-assistant-xeon-ui-server + depends_on: + - arbPostHearingAssistant-xeon-backend-server + ports: + - "${FRONTEND_SERVICE_PORT:-5173}:5173" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - BACKEND_SERVICE_ENDPOINT=${BACKEND_SERVICE_ENDPOINT} + - DOC_BASE_URL=${BACKEND_SERVICE_ENDPOINT} + ipc: host + restart: always + +networks: + default: + driver: bridge diff --git a/ArbPostHearingAssistant/docker_compose/intel/hpu/gaudi/README.md b/ArbPostHearingAssistant/docker_compose/intel/hpu/gaudi/README.md new file mode 100644 index 0000000000..23eac48e93 --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/intel/hpu/gaudi/README.md @@ -0,0 +1,150 @@ +# Example Arbitration Post-Hearing Assistant deployments on Intel® Gaudi® Platform + +This document outlines the deployment process for a Arbitration Post-Hearing Assistant application utilizing OPEA components on Intel® Gaudi® AI Accelerators. + +This example includes the following sections: + +- [Arbitration Post-Hearing Assistant Quick Start Deployment](#arb-post-hearing-assistant-quick-start-deployment): Demonstrates how to quickly deploy a Arbitration Post-Hearing Assistant application/pipeline on Intel® Gaudi® platform. 
+- [Arbitration Post-Hearing Assistant Docker Compose Files](#arbitration-post-hearing-assistant-docker-compose-files): Describes some example deployments and their docker compose files.
+- [Arbitration Post-Hearing Assistant Detailed Usage](#arbitration-post-hearing-assistant-detailed-usage): Provides more detailed usage examples.
+- [Launch the UI](#launch-the-ui): Guidelines for UI usage.
+
+**Note** This example requires access to a properly installed Intel® Gaudi® platform with a functional Docker service configured to use the habanalabs-container-runtime. Please consult the [Intel® Gaudi® software Installation Guide](https://docs.habana.ai/en/v1.20.0/Installation_Guide/Driver_Installation.html) for more information.
+
+## arb-post-hearing-assistant Quick Start Deployment
+
+This section describes how to quickly deploy and test the arb-post-hearing-assistant service manually on an Intel® Gaudi® platform. The basic steps are:
+
+1. [Access the Code](#access-the-code-and-set-up-environment)
+2. [Generate a HuggingFace Access Token](#generate-a-huggingface-access-token)
+3. [Configure the Deployment Environment](#access-the-code-and-set-up-environment)
+4. [Deploy the Services Using Docker Compose](#deploy-the-services-using-docker-compose)
+5. [Check the Deployment Status](#check-the-deployment-status)
+6. [Test the Pipeline](#test-the-pipeline)
+7. [Cleanup the Deployment](#cleanup-the-deployment)
+
+### Access the Code and Set Up Environment
+
+Clone the GenAIExamples repository and access the Arbitration Post-Hearing Assistant Intel® Gaudi® platform Docker Compose files and supporting scripts:
+
+```bash
+git clone https://github.com/opea-project/GenAIExamples.git
+cd GenAIExamples/ArbPostHearingAssistant/docker_compose
+source intel/set_env.sh
+```
+
+> NOTE: By default vLLM does a "warmup" at start to optimize its performance for the specified model and the underlying platform, which can take a long time. For development (and e.g. autoscaling) it can be skipped with `export VLLM_SKIP_WARMUP=true`.
+
+> NOTE: If any port on your local machine is occupied (like `9000/8008/8888`, etc.), modify it in `set_env.sh`, then run `source set_env.sh` again.
+
+### Generate a HuggingFace Access Token
+
+Some HuggingFace resources, such as some models, are only accessible if you have an access token. If you do not already have a HuggingFace access token, you can create one by first creating an account by following the steps provided at [HuggingFace](https://huggingface.co/) and then generating a [user access token](https://huggingface.co/docs/transformers.js/en/guides/private#step-1-generating-a-user-access-token).
+
+### Deploy the Services Using Docker Compose
+
+To deploy the Arbitration Post-Hearing Assistant services, execute the `docker compose up` command with the appropriate arguments. For a default deployment, execute:
+
+```bash
+cd intel/hpu/gaudi/
+docker compose up -d
+```
+
+**Note**: developers should build the docker images from source when:
+
+- Developing off the git main branch (as the container's ports in the repo may be different from the published docker image).
+- Unable to download the docker image.
+- Using a specific version of the Docker image (see the build example after this list).
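+
+For reference, the three application images used above can also be built locally with the `build.yaml` bundled in this example. The sketch below mirrors the repository's test scripts and assumes the default `REGISTRY`/`TAG` values; adjust them as needed:
+
+```bash
+cd GenAIExamples/ArbPostHearingAssistant/docker_image_build
+# build.yaml builds the LLM microservice image from a local GenAIComps checkout
+git clone --depth 1 https://github.com/opea-project/GenAIComps.git
+# MegaService, Gradio UI and LLM microservice images
+service_list="arb-post-hearing-assistant arb-post-hearing-assistant-gradio-ui llm-arb-post-hearing-assistant"
+docker compose -f build.yaml build ${service_list} --no-cache
+```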
+
+Please refer to the table below to build the different microservices from source:
+
+| Microservice                   | Deployment Guide                                                                                                                                             |
+| ------------------------------ | ------------------------------------------------------------------------------------------------------------------------------------------------------------ |
+| vLLM                           | [vLLM build guide](https://github.com/opea-project/GenAIComps/tree/main/comps/third_parties/vllm#build-docker)                                              |
+| llm-arb-post-hearing-assistant | [LLM-ArbPostHearingAssistant build guide](https://github.com/opea-project/GenAIComps/tree/main/comps/arb_post_hearing_assistant/src/#12-build-docker-image) |
+| MegaService                    | [MegaService build guide](../../../../README_miscellaneous.md#build-megaservice-docker-image)                                                               |
+| UI                             | [Basic UI build guide](../../../../README_miscellaneous.md#build-ui-docker-image)                                                                           |
+
+### Check the Deployment Status
+
+After running docker compose, check if all the containers launched via docker compose have started:
+
+```bash
+docker ps -a
+```
+
+For the default deployment, 4 containers should be running. The sample output below was captured on the Xeon deployment; on Gaudi the container names contain `gaudi` instead of `xeon` and the model server is the `opea/vllm-gaudi` based `arb-post-hearing-assistant-gaudi-vllm-service`:
+
+```bash
+CONTAINER ID   IMAGE                                                            COMMAND                  CREATED       STATUS                 PORTS                                         NAMES
+24bd78300413   opea/arb-post-hearing-assistant-gradio-ui:latest                 "python arb_post_hea…"   2 hours ago   Up 2 hours             0.0.0.0:5173->5173/tcp, [::]:5173->5173/tcp   arb-post-hearing-assistant-xeon-ui-server
+59e60c954e26   opea/arb-post-hearing-assistant:latest                           "python arb_post_hea…"   2 hours ago   Up 2 hours             0.0.0.0:8888->8888/tcp, [::]:8888->8888/tcp   arb-post-hearing-assistant-xeon-backend-server
+32afc12de996   opea/llm-arb-post-hearing-assistant:latest                       "python comps/arb_po…"   2 hours ago   Up 2 hours             0.0.0.0:9000->9000/tcp, [::]:9000->9000/tcp   arb-post-hearing-assistant-xeon-llm-server
+c8e539360aff   ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu   "text-generation-lau…"   2 hours ago   Up 2 hours (healthy)   0.0.0.0:8008->80/tcp, [::]:8008->80/tcp       arb-post-hearing-assistant-xeon-tgi-server
+```
+
+### Test the Pipeline
+
+Once the Arbitration Post-Hearing Assistant services are running, test the pipeline using the following command:
+
+```bash
+curl -X POST http://${host_ip}:8888/v1/arb-post-hearing \
+  -H "Content-Type: application/json" \
+  -d '{"type": "text", "messages": "[10:00 AM] Arbitrator Hon. Rebecca Lawson: Good morning. This hearing is now in session for Case No. ARB/2025/0917. Lets begin with appearances. [10:01 AM] Attorney Michael Grant for Mr. Jonathan Reed: Good morning Your Honor. I represent the claimant Mr. Jonathan Reed. [10:01 AM] Attorney Lisa Chen for Ms. Rachel Morgan: Good morning. I represent the respondent Ms. Rachel Morgan. [10:03 AM] Arbitrator Hon. Rebecca Lawson: Thank you. Lets proceed with Mr. Reeds opening statement. [10:04 AM] Attorney Michael Grant: Ms. Morgan failed to deliver services as per the agreement dated March 15 2023. We have submitted relevant documentation including email correspondence and payment records. The delay caused substantial financial harm to our client. [10:15 AM] Attorney Lisa Chen: We deny any breach of contract. The delays were due to regulatory issues outside our control. Furthermore Mr. Reed did not provide timely approvals which contributed to the delay. [10:30 AM] Arbitrator Hon. Rebecca Lawson: Lets turn to Clause Z of the agreement. Id like both parties to submit written briefs addressing the applicability of the force majeure clause and the timeline of approvals. [11:00 AM] Attorney Michael Grant: Understood. Well submit by the deadline. [11:01 AM] Attorney Lisa Chen: Agreed. [11:02 AM] Arbitrator Hon. 
Rebecca Lawson: The next hearing is scheduled for October 22 2025 at 1030 AM Eastern Time. Please ensure your witnesses are available for cross examination. [4:45 PM] Arbitrator Hon. Rebecca Lawson: This session is adjourned. Thank you everyone.","max_tokens":2000,"language":"en"}'
+```
+
+**Note:** The value of _host_ip_ was set using the _set_env.sh_ script and can be found in the _.env_ file.
+
+### Cleanup the Deployment
+
+To stop the containers associated with the deployment, execute the following command:
+
+```bash
+docker compose -f compose.yaml down
+```
+
+All the Arbitration Post-Hearing Assistant containers will be stopped and then removed on completion of the "down" command.
+
+## Arbitration Post-Hearing Assistant Docker Compose Files
+
+In the context of deploying an Arbitration Post-Hearing Assistant pipeline on an Intel® Gaudi® platform, the allocation and utilization of Gaudi devices across different services are important considerations for optimizing performance and resource efficiency. Each of the example deployments, defined by the example Docker compose yaml files, demonstrates a unique approach to leveraging Gaudi hardware, reflecting different priorities and operational strategies.
+
+| File                                   | Description                                                                                |
+| -------------------------------------- | ------------------------------------------------------------------------------------------ |
+| [compose.yaml](./compose.yaml)         | Default compose file using vLLM as the serving framework                                     |
+| [compose_tgi.yaml](./compose_tgi.yaml) | The LLM serving framework is TGI. All other configurations remain the same as the default   |
+
+## Arbitration Post-Hearing Assistant Detailed Usage
+
+There are also some customized usage examples, shown below.
+
+### Query with text
+
+```bash
+# Form input. Use English mode (default). Let curl set the multipart Content-Type header automatically.
+curl http://${host_ip}:8888/v1/arb-post-hearing \
+  -F "type=text" \
+  -F "messages=[10:00 AM] Arbitrator Hon. Rebecca Lawson: Good morning. This hearing is now in session for Case No. ARB/2025/0917. Lets begin with appearances. [10:01 AM] Attorney Michael Grant for Mr. Jonathan Reed: Good morning Your Honor. I represent the claimant Mr. Jonathan Reed. [10:01 AM] Attorney Lisa Chen for Ms. Rachel Morgan: Good morning. I represent the respondent Ms. Rachel Morgan. [10:03 AM] Arbitrator Hon. Rebecca Lawson: Thank you. Lets proceed with Mr. Reeds opening statement. [10:04 AM] Attorney Michael Grant: Ms. Morgan failed to deliver services as per the agreement dated March 15 2023. We have submitted relevant documentation including email correspondence and payment records. The delay caused substantial financial harm to our client. [10:15 AM] Attorney Lisa Chen: We deny any breach of contract. The delays were due to regulatory issues outside our control. Furthermore Mr. Reed did not provide timely approvals which contributed to the delay. [10:30 AM] Arbitrator Hon. Rebecca Lawson: Lets turn to Clause Z of the agreement. Id like both parties to submit written briefs addressing the applicability of the force majeure clause and the timeline of approvals. [11:00 AM] Attorney Michael Grant: Understood. Well submit by the deadline. [11:01 AM] Attorney Lisa Chen: Agreed. [11:02 AM] Arbitrator Hon. Rebecca Lawson: The next hearing is scheduled for October 22 2025 at 1030 AM Eastern Time. Please ensure your witnesses are available for cross examination. [4:45 PM] Arbitrator Hon. Rebecca Lawson: This session is adjourned. Thank you everyone." 
\
+  -F "max_tokens=2000" \
+  -F "language=en"
+```
+
+## Launch the UI
+
+### Gradio UI
+
+Open this URL `http://{host_ip}:5173` in your browser to access the Gradio-based frontend.
+![project-screenshot](../../../../assets/img/arbritation_post_hearing_ui_gradio_text.png)
+
+### Profile Microservices
+
+To further analyze microservice performance, users can profile the individual microservices as described below.
+
+#### 1. vLLM backend Service
+
+Users can follow the previous sections to exercise the vLLM microservice or the Arbitration Post-Hearing Assistant MegaService. By default, vLLM profiling is not enabled. Because the compose files set `VLLM_TORCH_PROFILER_DIR` for the vLLM service, profiling can be started and stopped through vLLM's `/start_profile` and `/stop_profile` endpoints; refer to the vLLM documentation for details.
+
+## Conclusion
+
+This guide should enable developers to deploy the default configuration or any of the other compose YAML files for different configurations. It also highlights the configurable parameters that can be set before deployment.
diff --git a/ArbPostHearingAssistant/docker_compose/intel/hpu/gaudi/compose.yaml b/ArbPostHearingAssistant/docker_compose/intel/hpu/gaudi/compose.yaml
new file mode 100644
index 0000000000..de9a98cda1
--- /dev/null
+++ b/ArbPostHearingAssistant/docker_compose/intel/hpu/gaudi/compose.yaml
@@ -0,0 +1,97 @@
+# Copyright (C) 2025 Zensar Technologies Private Ltd.
+# SPDX-License-Identifier: Apache-2.0
+
+services:
+  vllm-service:
+    image: opea/vllm-gaudi:1.4
+    container_name: arb-post-hearing-assistant-gaudi-vllm-service
+    ports:
+      - ${LLM_ENDPOINT_PORT:-8008}:80
+    volumes:
+      - "${MODEL_CACHE:-./data}:/root/.cache/huggingface/hub"
+    environment:
+      no_proxy: ${no_proxy}
+      http_proxy: ${http_proxy}
+      https_proxy: ${https_proxy}
+      HF_TOKEN: ${HF_TOKEN}
+      HABANA_VISIBLE_DEVICES: all
+      OMPI_MCA_btl_vader_single_copy_mechanism: none
+      LLM_MODEL_ID: ${LLM_MODEL_ID}
+      NUM_CARDS: ${NUM_CARDS}
+      VLLM_SKIP_WARMUP: ${VLLM_SKIP_WARMUP:-false}
+      VLLM_TORCH_PROFILER_DIR: "/mnt"
+    healthcheck:
+      test: ["CMD-SHELL", "curl -f http://localhost:80/health || exit 1"]
+      interval: 10s
+      timeout: 10s
+      retries: 100
+    runtime: habana
+    cap_add:
+      - SYS_NICE
+    ipc: host
+    command: --model $LLM_MODEL_ID --tensor-parallel-size ${NUM_CARDS} --host 0.0.0.0 --port 80 --block-size ${BLOCK_SIZE} --max-num-seqs ${MAX_NUM_SEQS} --max-seq-len-to-capture ${MAX_SEQ_LEN_TO_CAPTURE}
+
+  llm-arbPostHearingAssistant-vllm:
+    image: ${REGISTRY:-opea}/llm-arb-post-hearing-assistant:${TAG:-latest}
+    container_name: arb-post-hearing-assistant-gaudi-llm-server
+    depends_on:
+      vllm-service:
+        condition: service_healthy
+    ports:
+      - ${LLM_PORT:-9000}:9000
+    ipc: host
+    environment:
+      no_proxy: ${no_proxy}
+      http_proxy: ${http_proxy}
+      https_proxy: ${https_proxy}
+      HF_TOKEN: ${HF_TOKEN}
+      MAX_INPUT_TOKENS: ${MAX_INPUT_TOKENS}
+      MAX_TOTAL_TOKENS: ${MAX_TOTAL_TOKENS}
+      LLM_ENDPOINT: ${LLM_ENDPOINT}
+      LLM_MODEL_ID: ${LLM_MODEL_ID}
+      OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME: ${OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME}
+      LOGFLAG: ${LOGFLAG:-False}
+    restart: unless-stopped
+
+  arbPostHearingAssistant-gaudi-backend-server:
+    image: ${REGISTRY:-opea}/arb-post-hearing-assistant:${TAG:-latest}
+    container_name: arb-post-hearing-assistant-gaudi-backend-server
+    depends_on:
+      - vllm-service
+      - llm-arbPostHearingAssistant-vllm
+    ports:
+      - "${BACKEND_SERVICE_PORT:-8888}:8888"
+    environment:
+      - no_proxy=${no_proxy}
+      - https_proxy=${https_proxy}
+      - http_proxy=${http_proxy}
+      - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP}
+      - LLM_SERVICE_HOST_IP=${LLM_SERVICE_HOST_IP}
+      - LLM_SERVICE_PORT=${LLM_PORT}
+      - ASR_SERVICE_HOST_IP=${ASR_SERVICE_HOST_IP}
+      - 
ASR_SERVICE_PORT=${ASR_SERVICE_PORT} + ipc: host + restart: always + + arbPostHearingAssistant-gradio-ui: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant-gradio-ui:${TAG:-latest} + container_name: arb-post-hearing-assistant-gaudi-ui-server + depends_on: + - arbPostHearingAssistant-gaudi-backend-server + ports: + - "${FRONTEND_SERVICE_PORT:-5173}:5173" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - BACKEND_SERVICE_ENDPOINT=${BACKEND_SERVICE_ENDPOINT} + - DOC_BASE_URL=${BACKEND_SERVICE_ENDPOINT} + ipc: host + restart: always + +networks: + default: + driver: bridge + +volumes: + data: diff --git a/ArbPostHearingAssistant/docker_compose/intel/hpu/gaudi/compose_tgi.yaml b/ArbPostHearingAssistant/docker_compose/intel/hpu/gaudi/compose_tgi.yaml new file mode 100644 index 0000000000..3664ff31ca --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/intel/hpu/gaudi/compose_tgi.yaml @@ -0,0 +1,98 @@ +# Copyright (C) 2025 Zensar Technologies Private Ltd. +# SPDX-License-Identifier: Apache-2.0 + +services: + tgi-gaudi-server: + image: ghcr.io/huggingface/tgi-gaudi:2.3.1 + container_name: arb-post-hearing-assistant-gaudi-tgi-server + ports: + - ${LLM_ENDPOINT_PORT:-8008}:80 + volumes: + - "${MODEL_CACHE}:/data" + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + HF_TOKEN: ${HF_TOKEN} + HF_HUB_DISABLE_PROGRESS_BARS: 1 + HF_HUB_ENABLE_HF_TRANSFER: 0 + HABANA_VISIBLE_DEVICES: all + OMPI_MCA_btl_vader_single_copy_mechanism: none + ENABLE_HPU_GRAPH: true + LIMIT_HPU_GRAPH: true + USE_FLASH_ATTENTION: true + FLASH_ATTENTION_RECOMPUTE: true + host_ip: ${host_ip} + LLM_ENDPOINT_PORT: ${LLM_ENDPOINT_PORT} + runtime: habana + cap_add: + - SYS_NICE + ipc: host + healthcheck: + test: ["CMD-SHELL", "curl -f http://localhost:80/health || exit 1"] + interval: 10s + timeout: 10s + retries: 100 + command: --model-id ${LLM_MODEL_ID} --max-input-length ${MAX_INPUT_TOKENS} --max-total-tokens ${MAX_TOTAL_TOKENS} + + llm-arbPostHearingAssistant-tgi: + image: ${REGISTRY:-opea}/llm-arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-gaudi-llm-server + depends_on: + tgi-gaudi-server: + condition: service_healthy + ports: + - ${LLM_PORT:-9000}:9000 + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + HF_TOKEN: ${HF_TOKEN} + MAX_INPUT_TOKENS: ${MAX_INPUT_TOKENS} + MAX_TOTAL_TOKENS: ${MAX_TOTAL_TOKENS} + LLM_ENDPOINT: ${LLM_ENDPOINT} + LLM_MODEL_ID: ${LLM_MODEL_ID} + OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME: ${OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME} + LOGFLAG: ${LOGFLAG:-False} + restart: unless-stopped + + arbPostHearingAssistant-gaudi-backend-server: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant:${TAG:-latest} + container_name: arb-post-hearing-assistant-gaudi-backend-server + depends_on: + - tgi-gaudi-server + - llm-arbPostHearingAssistant-tgi + ports: + - "${BACKEND_SERVICE_PORT:-8888}:8888" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} + - LLM_SERVICE_HOST_IP=${LLM_SERVICE_HOST_IP} + - LLM_SERVICE_PORT=${LLM_PORT} + - ASR_SERVICE_HOST_IP=${ASR_SERVICE_HOST_IP} + - ASR_SERVICE_PORT=${ASR_SERVICE_PORT} + ipc: host + restart: always + + arbPostHearingAssistant-gradio-ui: + image: ${REGISTRY:-opea}/arb-post-hearing-assistant-gradio-ui:${TAG:-latest} + container_name: 
arb-post-hearing-assistant-gaudi-ui-server + depends_on: + - arbPostHearingAssistant-gaudi-backend-server + ports: + - "${FRONTEND_SERVICE_PORT:-5173}:5173" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - BACKEND_SERVICE_ENDPOINT=${BACKEND_SERVICE_ENDPOINT} + - DOC_BASE_URL=${BACKEND_SERVICE_ENDPOINT} + ipc: host + restart: always + +networks: + default: + driver: bridge diff --git a/ArbPostHearingAssistant/docker_compose/intel/set_env.sh b/ArbPostHearingAssistant/docker_compose/intel/set_env.sh new file mode 100644 index 0000000000..f21595cb12 --- /dev/null +++ b/ArbPostHearingAssistant/docker_compose/intel/set_env.sh @@ -0,0 +1,40 @@ +#!/usr/bin/env bash + +# Copyright (C) 2025 Zensar Technologies Private Ltd. +# SPDX-License-Identifier: Apache-2.0 +SCRIPT_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +pushd "${SCRIPT_DIR}/../../.." > /dev/null +source .set_env.sh +popd > /dev/null + +export host_ip=$(hostname -I | awk '{print $1}') # Example: host_ip="192.168.1.1" +export no_proxy="${no_proxy},${host_ip}" # Example: no_proxy="localhost, 127.0.0.1, 192.168.1.1" +export http_proxy=$http_proxy +export https_proxy=$https_proxy +export HF_TOKEN=${HF_TOKEN} #Enter your HF Token here + +export LLM_ENDPOINT_PORT=8008 +export LLM_MODEL_ID="mistralai/Mistral-7B-Instruct-v0.2" + +export BLOCK_SIZE=128 +export MAX_NUM_SEQS=256 +export MAX_SEQ_LEN_TO_CAPTURE=2048 +export NUM_CARDS=1 +export MAX_INPUT_TOKENS=1024 +export MAX_TOTAL_TOKENS=2048 + +export LLM_PORT=9000 +export LLM_ENDPOINT="http://${host_ip}:${LLM_ENDPOINT_PORT}" +export OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME="OpeaArbPostHearingAssistantTgi" # OpeaArbPostHearingAssistantVllm +export FRONTEND_SERVICE_PORT=5173 + +export MEGA_SERVICE_HOST_IP=${host_ip} #Example: MEGA_SERVICE_HOST_IP="localhost" +export LLM_SERVICE_HOST_IP=${host_ip} #Example: LLM_SERVICE_HOST_IP="localhost" + +# uncomment below during development +# export VLLM_SKIP_WARMUP=true + +export BACKEND_SERVICE_PORT=8888 +export BACKEND_SERVICE_ENDPOINT="http://${host_ip}:${BACKEND_SERVICE_PORT}/v1/arb-post-hearing" + +export LOGFLAG=True diff --git a/ArbPostHearingAssistant/docker_image_build/build.yaml b/ArbPostHearingAssistant/docker_image_build/build.yaml new file mode 100644 index 0000000000..3ab58ba7ec --- /dev/null +++ b/ArbPostHearingAssistant/docker_image_build/build.yaml @@ -0,0 +1,30 @@ +# Copyright (C) 2025 Zensar Technologies Private Ltd. 
+# SPDX-License-Identifier: Apache-2.0 + +services: + arb-post-hearing-assistant: + build: + args: + IMAGE_REPO: ${REGISTRY} + BASE_TAG: ${TAG} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + no_proxy: ${no_proxy} + context: ../ + dockerfile: ./Dockerfile + image: ${REGISTRY:-opea}/arb-post-hearing-assistant:${TAG:-latest} + arb-post-hearing-assistant-gradio-ui: + build: + args: + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + context: ../ui + dockerfile: ./docker/Dockerfile.gradio + extends: arb-post-hearing-assistant + image: ${REGISTRY:-opea}/arb-post-hearing-assistant-gradio-ui:${TAG:-latest} + llm-arb-post-hearing-assistant: + build: + context: GenAIComps + dockerfile: comps/arb_post_hearing_assistant/src/Dockerfile + extends: arb-post-hearing-assistant + image: ${REGISTRY:-opea}/llm-arb-post-hearing-assistant:${TAG:-latest} diff --git a/ArbPostHearingAssistant/kubernetes/gmc/README.md b/ArbPostHearingAssistant/kubernetes/gmc/README.md new file mode 100644 index 0000000000..e69de29bb2 diff --git a/ArbPostHearingAssistant/kubernetes/helm/README.md b/ArbPostHearingAssistant/kubernetes/helm/README.md new file mode 100644 index 0000000000..e69de29bb2 diff --git a/ArbPostHearingAssistant/tests/README.md b/ArbPostHearingAssistant/tests/README.md new file mode 100644 index 0000000000..ba28b90048 --- /dev/null +++ b/ArbPostHearingAssistant/tests/README.md @@ -0,0 +1,15 @@ +# DocSum E2E test scripts + +## Set the required environment variable + +```bash +export HF_TOKEN="Your_Huggingface_API_Token" +``` + +## Run test + +On Intel Xeon with TGI: + +```bash +bash test_compose_tgi_on_xeon.sh +``` diff --git a/ArbPostHearingAssistant/tests/test_compose_tgi_on_xeon.sh b/ArbPostHearingAssistant/tests/test_compose_tgi_on_xeon.sh new file mode 100644 index 0000000000..e8ab41c43b --- /dev/null +++ b/ArbPostHearingAssistant/tests/test_compose_tgi_on_xeon.sh @@ -0,0 +1,161 @@ +#!/bin/bash +# Copyright (C) 2025 Zensar Technologies Private Ltd. +# SPDX-License-Identifier: Apache-2.0 + +set -xe + +IMAGE_REPO=${IMAGE_REPO:-"opea"} +IMAGE_TAG=${IMAGE_TAG:-"latest"} +export http_proxy=$http_proxy +export https_proxy=$https_proxy +export host_ip=$(hostname -I | awk '{print $1}') +WORKPATH=$(dirname "$PWD") +LOG_PATH="$WORKPATH/tests" +echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" +echo "TAG=IMAGE_TAG=${IMAGE_TAG}" +export REGISTRY=${IMAGE_REPO} +export TAG=${IMAGE_TAG} + +source $WORKPATH/docker_compose/intel/set_env.sh +export MODEL_CACHE=${model_cache:-"./data"} + +export MAX_INPUT_TOKENS=2048 +export MAX_TOTAL_TOKENS=4096 + +export OPEA_ARB_POSTHEARING_ASSISTANT_COMPONENT_NAME="OpeaArbPostHearingAssistantTgi" + +# Get the root folder of the current script +ROOT_FOLDER=$(dirname "$(readlink -f "$0")") + +function build_docker_images() { + opea_branch=${opea_branch:-"main"} + cd $WORKPATH/docker_image_build + git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git + pushd GenAIComps + echo "GenAIComps test commit is $(git rev-parse HEAD)" + docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . + popd && sleep 1s + + echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
+ service_list="arb-post-hearing-assistant arb-post-hearing-assistant-gradio-ui llm-arb-post-hearing-assistant" + docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log + + docker images && sleep 1s +} + +function start_services() { + cd $WORKPATH/docker_compose/intel/cpu/xeon/ + export no_proxy="localhost,127.0.0.1,$ip_address" + docker compose -f compose_tgi.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + sleep 1m +} + +function validate_service() { + local URL="$1" + local EXPECTED_RESULT="$2" + local SERVICE_NAME="$3" + local DOCKER_NAME="$4" + local VALIDATE_TYPE="$5" + local INPUT_DATA="$6" + + if [[ $VALIDATE_TYPE == *"json"* ]]; then + HTTP_RESPONSE=$(curl --silent --write-out "HTTPSTATUS:%{http_code}" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") + else + echo "Skipping request: VALIDATE_TYPE does not contain 'json'." + fi + HTTP_STATUS=$(echo $HTTP_RESPONSE | tr -d '\n' | sed -e 's/.*HTTPSTATUS://') + RESPONSE_BODY=$(echo $HTTP_RESPONSE | sed -e 's/HTTPSTATUS\:.*//g') + + docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log + + # check response status + if [ "$HTTP_STATUS" -ne "200" ]; then + echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS" + exit 1 + else + echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." + fi + # check response body + if [[ "$RESPONSE_BODY" != *"$EXPECTED_RESULT"* ]]; then + echo "EXPECTED_RESULT==> $EXPECTED_RESULT" + echo "RESPONSE_BODY==> $RESPONSE_BODY" + echo "[ $SERVICE_NAME ] Content does not match the expected result: $RESPONSE_BODY" + exit 1 + else + echo "[ $SERVICE_NAME ] Content is as expected." + fi + + sleep 1s +} + +function validate_microservices() { + # Check if the microservices are running correctly. + + # tgi for llm service + validate_service \ + "${host_ip}:${LLM_ENDPOINT_PORT}/generate" \ + "generated_text" \ + "tgi-server" \ + "arb-post-hearing-assistant-xeon-tgi-server" \ + "json" \ + '{"inputs":"What is Deep Learning?","parameters":{"max_new_tokens":17, "do_sample": true}}' + + # llm microservice + validate_service \ + "${host_ip}:${LLM_PORT}/v1/arb-post-hearing" \ + "case_number" \ + "llm-arbPostHearingAssistant-tgi" \ + "arb-post-hearing-assistant-xeon-llm-server" \ + "json" \ + '{"messages": "[10:00 AM] Arbitrator Hon. Rebecca Lawson: Good morning. This hearing is now in session for Case No. ARB/2025/0917. Lets begin with appearances. [10:01 AM] Attorney Michael Grant for Mr. Jonathan Reed: Good morning Your Honor. I represent the claimant Mr. Jonathan Reed. [10:01 AM] Attorney Lisa Chen for Ms. Rachel Morgan: Good morning. I represent the respondent Ms. Rachel Morgan. [10:03 AM] Arbitrator Hon. Rebecca Lawson: Thank you. Lets proceed with Mr. Reeds opening statement. [10:04 AM] Attorney Michael Grant: Ms. Morgan failed to deliver services as per the agreement dated March 15 2023. We have submitted relevant documentation including email correspondence and payment records. The delay caused substantial financial harm to our client. [10:15 AM] Attorney Lisa Chen: We deny any breach of contract. The delays were due to regulatory issues outside our control. Furthermore Mr. Reed did not provide timely approvals which contributed to the delay. [10:30 AM] Arbitrator Hon. Rebecca Lawson: Lets turn to Clause Z of the agreement. Id like both parties to submit written briefs addressing the applicability of the force majeure clause and the timeline of approvals. [11:00 AM] Attorney Michael Grant: Understood. 
Well submit by the deadline. [11:01 AM] Attorney Lisa Chen: Agreed. [11:02 AM] Arbitrator Hon. Rebecca Lawson: The next hearing is scheduled for October 22 2025 at 1030 AM Eastern Time. Please ensure your witnesses are available for cross examination. [4:45 PM] Arbitrator Hon. Rebecca Lawson: This session is adjourned. Thank you everyone.","type":"text","language":"en"}' + +} + +function validate_megaservice_text() { + echo ">>> Checking text data in json format" + validate_service \ + "${host_ip}:${BACKEND_SERVICE_PORT}/v1/arb-post-hearing" \ + "summary" \ + "arbPostHearingAssistant-xeon-backend-server" \ + "arb-post-hearing-assistant-xeon-backend-server" \ + "json" \ + '{"messages": "[10:00 AM] Arbitrator Hon. Rebecca Lawson: Good morning. This hearing is now in session for Case No. ARB/2025/0917. Lets begin with appearances. [10:01 AM] Attorney Michael Grant for Mr. Jonathan Reed: Good morning Your Honor. I represent the claimant Mr. Jonathan Reed. [10:01 AM] Attorney Lisa Chen for Ms. Rachel Morgan: Good morning. I represent the respondent Ms. Rachel Morgan. [10:03 AM] Arbitrator Hon. Rebecca Lawson: Thank you. Lets proceed with Mr. Reeds opening statement. [10:04 AM] Attorney Michael Grant: Ms. Morgan failed to deliver services as per the agreement dated March 15 2023. We have submitted relevant documentation including email correspondence and payment records. The delay caused substantial financial harm to our client. [10:15 AM] Attorney Lisa Chen: We deny any breach of contract. The delays were due to regulatory issues outside our control. Furthermore Mr. Reed did not provide timely approvals which contributed to the delay. [10:30 AM] Arbitrator Hon. Rebecca Lawson: Lets turn to Clause Z of the agreement. Id like both parties to submit written briefs addressing the applicability of the force majeure clause and the timeline of approvals. [11:00 AM] Attorney Michael Grant: Understood. Well submit by the deadline. [11:01 AM] Attorney Lisa Chen: Agreed. [11:02 AM] Arbitrator Hon. Rebecca Lawson: The next hearing is scheduled for October 22 2025 at 1030 AM Eastern Time. Please ensure your witnesses are available for cross examination. [4:45 PM] Arbitrator Hon. Rebecca Lawson: This session is adjourned. Thank you everyone.","type":"text","language":"en"}' + +} + +function stop_docker() { + cd $WORKPATH/docker_compose/intel/cpu/xeon/ + docker compose -f compose_tgi.yaml stop && docker compose rm -f +} + +function main() { + + echo "::group:: Stopping any running Docker containers..." + stop_docker + echo "::endgroup::" + + echo "::group::build_docker_images" + if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi + echo "::endgroup::" + + echo "::group::start_services" + start_services + echo "::endgroup::" + + echo "::group:: Validating microservices" + validate_microservices + echo "::endgroup::" + + echo "::group::validate_megaservice_text" + validate_megaservice_text + echo "::endgroup::" + + echo "::group::stop_docker" + stop_docker + echo "::endgroup::" + + docker system prune -f + +} + +main diff --git a/ArbPostHearingAssistant/ui/docker/Dockerfile.gradio b/ArbPostHearingAssistant/ui/docker/Dockerfile.gradio new file mode 100644 index 0000000000..7739d8f05b --- /dev/null +++ b/ArbPostHearingAssistant/ui/docker/Dockerfile.gradio @@ -0,0 +1,34 @@ +# Copyright (C) 2025 Zensar Technologies Private Ltd. 
+# SPDX-License-Identifier: Apache-2.0
+
+# Use the official Python 3.11 slim image as the base image
+FROM python:3.11-slim
+
+# Set the default language environment variable
+ENV LANG=C.UTF-8
+
+# Define a build argument for architecture (default is "cpu")
+ARG ARCH="cpu"
+
+# Update the package list and install necessary packages
+RUN apt-get update -y && apt-get install -y --no-install-recommends --fix-missing build-essential
+
+# Create a directory for the application
+RUN mkdir -p /home/user
+
+# Copy the application code and requirements file to the container
+COPY ./gradio/arb_post_hearing_assistant_ui_gradio.py /home/user/arb_post_hearing_assistant_ui_gradio.py
+COPY ./gradio/requirements.txt /home/user/requirements.txt
+
+# Install Python dependencies
+RUN pip install --no-cache-dir --upgrade pip setuptools && \
+    pip install --no-cache-dir -r /home/user/requirements.txt
+
+# Set the working directory
+WORKDIR /home/user/
+
+# Expose the port that the application will run on
+EXPOSE 5173
+
+# Define the command to run the application
+CMD ["python", "arb_post_hearing_assistant_ui_gradio.py"]
diff --git a/ArbPostHearingAssistant/ui/gradio/README.md b/ArbPostHearingAssistant/ui/gradio/README.md
new file mode 100644
index 0000000000..fb6aaaaf05
--- /dev/null
+++ b/ArbPostHearingAssistant/ui/gradio/README.md
@@ -0,0 +1,97 @@
+# Arbitration Post-Hearing Assistant
+
+The Arbitration Post-Hearing Assistant is a GenAI-based module designed to process and summarize post-hearing transcripts or arbitration-related documents. It intelligently extracts key entities and insights to assist arbitrators, legal teams, and case managers in managing case follow-ups efficiently.
+
+## Key Features
+
+Automated Information Extraction:
+Identifies and extracts essential details such as:
+
+- Case number
+- Parties involved (claimant/respondent)
+- Arbitrator(s)
+- Hearing date and time
+- Next hearing schedule and purpose
+- Hearing outcomes and reasons
+
+## Docker
+
+### Build UI Docker Image
+
+To build the frontend Docker image, navigate to the `GenAIExamples/ArbPostHearingAssistant/ui` directory and run the following command:
+
+```bash
+cd GenAIExamples/ArbPostHearingAssistant/ui
+docker build -t opea/arb-post-hearing-assistant-gradio-ui:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f docker/Dockerfile.gradio .
+```
+
+This command builds the Docker image with the tag `opea/arb-post-hearing-assistant-gradio-ui:latest`. It also passes the proxy settings as build arguments to ensure that the build process can access the internet if you are behind a corporate firewall.
+
+### Run UI Docker Image
+
+To run the frontend Docker image, navigate to the `GenAIExamples/ArbPostHearingAssistant/ui/docker` directory and execute the following commands:
+
+```bash
+cd GenAIExamples/ArbPostHearingAssistant/ui/docker
+
+ip_address=$(hostname -I | awk '{print $1}')
+docker run -d -p 5173:5173 --ipc=host \
+  -e http_proxy=$http_proxy \
+  -e https_proxy=$https_proxy \
+  -e no_proxy=$no_proxy \
+  -e BACKEND_SERVICE_ENDPOINT=http://${ip_address}:8888/v1/arb-post-hearing \
+  opea/arb-post-hearing-assistant-gradio-ui:latest
+```
+
+This command runs the Docker container in detached mode, mapping port 5173 of the host to port 5173 of the container. It also sets several environment variables, including the backend service endpoint (built from the `ip_address` captured above), which is required for the frontend to communicate with the backend service.
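+
+A quick way to confirm the UI container is serving (a simple check, assuming the default port mapping above; the Gradio app answers on its root path once it has finished starting):
+
+```bash
+# expect an HTTP 200 status code from the UI
+curl -s -o /dev/null -w "%{http_code}\n" http://localhost:5173/
+```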
+
+### Python
+
+To run the frontend application directly using Python, navigate to the `GenAIExamples/ArbPostHearingAssistant/ui/gradio` directory and run the following command:
+
+```bash
+cd GenAIExamples/ArbPostHearingAssistant/ui/gradio
+python arb_post_hearing_assistant_ui_gradio.py
+```
+
+This command starts the frontend application using Python.
+
+## 📸 Project Screenshots
+
+![project-screenshot](../../assets/img/arbritation_post_hearing_ui_gradio_text.png)
+
+## 🧐 Features
+
+Here are some of the project's features:
+
+- **Automated Case Extraction:** Extracts key arbitration details including case number, claimant/respondent, arbitrator, hearing dates, next hearing schedule, and outcome.
+- **Hearing Summarization:** Generates concise summaries of post-hearing proceedings.
+- **LLM-Powered Processing:** Integrates with vLLM or TGI backends for natural language understanding.
+- **Structured Output:** Returns all extracted information in JSON format for easy storage, display, or integration with case management systems.
+- **Easy Deployment:** Containerized microservice, lightweight and reusable across legal workflows.
+- **Typical Flow:**
+  1. Upload or stream post-hearing transcript.
+  2. LLM backend analyzes text and extracts entities.
+  3. Returns structured JSON with case details and summary.
+
+## Additional Information
+
+### Prerequisites
+
+Ensure you have Docker installed and running on your system. Also, make sure you have the necessary proxy settings configured if you are behind a corporate firewall.
+
+### Environment Variables
+
+- `http_proxy`: Proxy setting for HTTP connections.
+- `https_proxy`: Proxy setting for HTTPS connections.
+- `no_proxy`: Comma-separated list of hosts that should be excluded from proxying.
+- `BACKEND_SERVICE_ENDPOINT`: The endpoint of the backend service that the frontend will communicate with.
+
+### Troubleshooting
+
+- Docker Build Issues: If you encounter issues while building the Docker image, ensure that your proxy settings are correctly configured and that you have internet access.
+- Docker Run Issues: If the Docker container fails to start, check the environment variables and ensure that the backend service is running and accessible.
+
+This README file provides detailed instructions and explanations for building and running the Dockerized frontend application, as well as running it directly using Python. It also highlights the key features of the project and provides additional information for troubleshooting and configuring the environment.
diff --git a/ArbPostHearingAssistant/ui/gradio/arb_post_hearing_assistant_ui_gradio.py b/ArbPostHearingAssistant/ui/gradio/arb_post_hearing_assistant_ui_gradio.py
new file mode 100644
index 0000000000..92db2872e7
--- /dev/null
+++ b/ArbPostHearingAssistant/ui/gradio/arb_post_hearing_assistant_ui_gradio.py
@@ -0,0 +1,120 @@
+# Copyright (C) 2025 Zensar Technologies Private Ltd.
+# SPDX-License-Identifier: Apache-2.0 + +import json +import logging +import os +import re + +import gradio as gr +import requests +import uvicorn +from fastapi import FastAPI + +# Configure logging +logging.basicConfig(level=logging.INFO) +logger = logging.getLogger(__name__) + + +class ArbPostHearingAssistantUI: + def __init__(self): + """Initialize class with headers and backend endpoint.""" + self.HEADERS = {"Content-Type": "application/json"} + self.BACKEND_SERVICE_ENDPOINT = os.getenv( + "BACKEND_SERVICE_ENDPOINT", "http://localhost:8888/v1/arb-post-hearing" + ) + + def extract_json(self, text: str): + """Extract and clean embedded JSON from text.""" + try: + match = re.search(r"\{.*\}", text, re.DOTALL) + if match: + json_str = match.group(0) + return json.loads(json_str) + except Exception as e: + logger.error("Error extracting JSON: %s", e) + return None + + def summarize_arbitration_transcript(self, transcript): + """Generate a summary for the given document content.""" + logger.info(">>> BACKEND_SERVICE_ENDPOINT - %s", self.BACKEND_SERVICE_ENDPOINT) + + data = {"messages": transcript, "type": "text", "language": "en"} + + try: + response = requests.post( + url=self.BACKEND_SERVICE_ENDPOINT, + headers=self.HEADERS, + data=json.dumps(data), + proxies={ + "http": os.environ.get("http_proxy", ""), + "https": os.environ.get("https_proxy", ""), + }, + ) + + if response.status_code == 200: + result = response.json() + raw_text = result["choices"][0]["message"]["content"] + extracted_json = self.extract_json(raw_text) + + # Return pretty JSON if available + if extracted_json: + return json.dumps(extracted_json, indent=4) + + # Fallback if no JSON found + return json.dumps({"message": "something went wrong, please try again"}, indent=4) + + except requests.exceptions.RequestException as e: + logger.error("Request exception: %s", e) + return json.dumps({"message": "something went wrong, please try again"}, indent=4) + + return json.dumps({"message": "something went wrong, please try again"}, indent=4) + + def render(self): + """Render the Gradio UI.""" + logger.info(">>> Rendering Gradio UI") + + with gr.Blocks() as text_ui: + with gr.Row(): + with gr.Column(): + input_text = gr.TextArea( + label="Enter your arbitration transcript to process:", + placeholder="Please enter arbitration transcript before submitting", + lines=20, + ) + submit_btn = gr.Button("Generate") + with gr.Column(): + # ✅ Use Textbox to show formatted JSON properly + generated_text = gr.JSON(label="Generated arbitration Summary", height=462, max_height=500) + submit_btn.click(fn=self.summarize_arbitration_transcript, inputs=[input_text], outputs=[generated_text]) + + with gr.Blocks() as self.demo: + gr.Markdown( + "

⚖️ Arbitration Post Hearing Assistant

", + elem_classes=["centered-title"], + ) + with gr.Tabs(): + with gr.TabItem("Paste Arbitration Transcript"): + text_ui.render() + + return self.demo + + +# FastAPI + Gradio Integration +app = FastAPI() + +demo = ArbPostHearingAssistantUI().render() +demo.queue() +app = gr.mount_gradio_app(app, demo, path="/") + +if __name__ == "__main__": + import argparse + + parser = argparse.ArgumentParser() + parser.add_argument("--host", type=str, default="0.0.0.0") + parser.add_argument("--port", type=int, default=5173) + + args = parser.parse_args() + logger.info(">>> Starting server at %s:%d", args.host, args.port) + + uvicorn.run("arb_post_hearing_assistant_ui_gradio:app", host=args.host, port=args.port) diff --git a/ArbPostHearingAssistant/ui/gradio/requirements.txt b/ArbPostHearingAssistant/ui/gradio/requirements.txt new file mode 100644 index 0000000000..095dee2b06 --- /dev/null +++ b/ArbPostHearingAssistant/ui/gradio/requirements.txt @@ -0,0 +1,4 @@ +gradio>5.22.0,<=5.34.0 +numpy==1.26.4 +Pillow==10.3.0 + diff --git a/AudioQnA/Dockerfile.openEuler b/AudioQnA/Dockerfile.openEuler new file mode 100644 index 0000000000..3a6c5928a5 --- /dev/null +++ b/AudioQnA/Dockerfile.openEuler @@ -0,0 +1,10 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. +# SPDX-License-Identifier: Apache-2.0 + +ARG IMAGE_REPO=opea +ARG BASE_TAG=latest +FROM $IMAGE_REPO/comps-base:$BASE_TAG-openeuler + +COPY ./audioqna.py $HOME/audioqna.py + +ENTRYPOINT ["python", "audioqna.py"] \ No newline at end of file diff --git a/AudioQnA/docker_compose/amd/cpu/epyc/compose.yaml b/AudioQnA/docker_compose/amd/cpu/epyc/compose.yaml index 9d614bd738..588113d72b 100644 --- a/AudioQnA/docker_compose/amd/cpu/epyc/compose.yaml +++ b/AudioQnA/docker_compose/amd/cpu/epyc/compose.yaml @@ -26,7 +26,7 @@ services: https_proxy: ${https_proxy} restart: unless-stopped vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-service ports: - ${LLM_SERVER_PORT:-3006}:80 diff --git a/AudioQnA/docker_compose/intel/cpu/xeon/README.md b/AudioQnA/docker_compose/intel/cpu/xeon/README.md index 78be7c12da..bbb604c394 100644 --- a/AudioQnA/docker_compose/intel/cpu/xeon/README.md +++ b/AudioQnA/docker_compose/intel/cpu/xeon/README.md @@ -15,12 +15,19 @@ Note: The default LLM is `meta-llama/Meta-Llama-3-8B-Instruct`. Before deploying This section describes how to quickly deploy and test the AudioQnA service manually on an Intel® Xeon® processor. The basic steps are: -1. [Access the Code](#access-the-code) -2. [Configure the Deployment Environment](#configure-the-deployment-environment) -3. [Deploy the Services Using Docker Compose](#deploy-the-services-using-docker-compose) -4. [Check the Deployment Status](#check-the-deployment-status) -5. [Validate the Pipeline](#validate-the-pipeline) -6. 
[Cleanup the Deployment](#cleanup-the-deployment) +- [Deploying AudioQnA on Intel® Xeon® Processors](#deploying-audioqna-on-intel-xeon-processors) + - [Table of Contents](#table-of-contents) + - [AudioQnA Quick Start Deployment](#audioqna-quick-start-deployment) + - [Access the Code](#access-the-code) + - [Configure the Deployment Environment](#configure-the-deployment-environment) + - [Deploy the Services Using Docker Compose](#deploy-the-services-using-docker-compose) + - [Check the Deployment Status](#check-the-deployment-status) + - [Validate the Pipeline](#validate-the-pipeline) + - [Cleanup the Deployment](#cleanup-the-deployment) + - [AudioQnA Docker Compose Files](#audioqna-docker-compose-files) + - [Running LLM models with remote endpoints](#running-llm-models-with-remote-endpoints) + - [Validate MicroServices](#validate-microservices) + - [Conclusion](#conclusion) ### Access the Code @@ -59,7 +66,7 @@ To deploy the AudioQnA services, execute the `docker compose up` command with th ```bash cd docker_compose/intel/cpu/xeon -docker compose -f compose.yaml up -d +docker compose -f compose_tgi.yaml up -d ``` > **Note**: developers should build docker image from source when: @@ -80,6 +87,13 @@ Please refer to the table below to build different microservices from source: | MegaService | [MegaService build guide](../../../../README_miscellaneous.md#build-megaservice-docker-image) | | UI | [Basic UI build guide](../../../../README_miscellaneous.md#build-ui-docker-image) | +(Optional) Enabling monitoring using the command: + +```bash +cd docker_compose/intel/cpu/xeon +docker compose -f compose_tgi.yaml -f compose.monitoring.yaml up -d +``` + ### Check the Deployment Status After running docker compose, check if all the containers launched via docker compose have started: @@ -127,19 +141,26 @@ curl http://${host_ip}:3008/v1/audioqna \ To stop the containers associated with the deployment, execute the following command: ```bash -docker compose -f compose.yaml down +docker compose -f compose_tgi.yaml down +``` + +If monitoring is enabled, stop the containers using the following command: + +```bash +docker compose -f compose_tgi.yaml -f compose.monitoring.yaml down ``` ## AudioQnA Docker Compose Files In the context of deploying an AudioQnA pipeline on an Intel® Xeon® platform, we can pick and choose different large language model serving frameworks, or single English TTS/multi-language TTS component. The table below outlines the various configurations that are available as part of the application. These configurations can be used as templates and can be extended to different components available in [GenAIComps](https://github.com/opea-project/GenAIComps.git). -| File | Description | -| -------------------------------------------------- | ---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | -| [compose.yaml](./compose.yaml) | Default compose file using vllm as serving framework and redis as vector database | -| [compose_tgi.yaml](./compose_tgi.yaml) | The LLM serving framework is TGI. All other configurations remain the same as the default | -| [compose_multilang.yaml](./compose_multilang.yaml) | The TTS component is GPT-SoVITS. All other configurations remain the same as the default | -| [compose_remote.yaml](./compose_remote.yaml) | The LLM used is hosted on a remote server and an endpoint is used to access this model. 
Additional environment variables need to be set before running. See [instructions](#running-llm-models-with-remote-endpoints) below. | +| File | Description | +| ---------------------------------------------------- | ---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | +| [compose.yaml](./compose.yaml) | Default compose file using vllm as serving framework and redis as vector database | +| [compose_tgi.yaml](./compose_tgi.yaml) | The LLM serving framework is TGI. All other configurations remain the same as the default | +| [compose_multilang.yaml](./compose_multilang.yaml) | The TTS component is GPT-SoVITS. All other configurations remain the same as the default | +| [compose_remote.yaml](./compose_remote.yaml) | The LLM used is hosted on a remote server and an endpoint is used to access this model. Additional environment variables need to be set before running. See [instructions](#running-llm-models-with-remote-endpoints) below. | +| [compose.monitoring.yaml](./compose.monitoring.yaml) | Helper file for monitoring features. Can be used along with any compose files | ### Running LLM models with remote endpoints diff --git a/AudioQnA/docker_compose/intel/cpu/xeon/README_vllm.md b/AudioQnA/docker_compose/intel/cpu/xeon/README_vllm.md index 8b94343e32..76e8eb2ea4 100644 --- a/AudioQnA/docker_compose/intel/cpu/xeon/README_vllm.md +++ b/AudioQnA/docker_compose/intel/cpu/xeon/README_vllm.md @@ -23,7 +23,7 @@ git clone https://github.com/opea-project/GenAIExamples.git If you are using the main branch, then you do not need to make the transition, the main branch is used by default ```bash -cd ~/searchqna-test/GenAIExamples/SearchQnA/docker_image_build +cd GenAIExamples/AudioQnA/docker_image_build git clone https://github.com/opea-project/GenAIComps.git ``` @@ -31,7 +31,7 @@ If you are using a specific branch or tag, then we perform git checkout to the d ```bash ### Replace "v1.3" with the code version you need (branch or tag) -cd cd ~/searchqna-test/GenAIExamples/SearchQnA/docker_image_build && git checkout v1.3 +cd GenAIExamples/AudioQnA/docker_image_build && git checkout v1.3 git clone https://github.com/opea-project/GenAIComps.git ``` @@ -74,7 +74,7 @@ export HF_TOKEN='your_huggingfacehub_token' ### Setting variables in the file set_env_vllm.sh ```bash -cd cd cd ~/searchqna-test/GenAIExamples/SearchQnA/docker_compose/amd/gpu/rocm +cd ~/searchqna-test/GenAIExamples/SearchQnA/docker_compose/amd/gpu/rocm ### The example uses the Nano text editor. You can use any convenient text editor nano set_env_vllm.sh ``` @@ -106,8 +106,8 @@ export https_proxy="Your_HTTPs_Proxy" ### 3.1. Deploying applications using Docker Compose ```bash -cd cd ~/audioqna-test/GenAIExamples/AudioQnA/docker_compose/amd/gpu/rocm/ -docker compose -f compose_vllm up -d +cd GenAIExamples/AudioQnA/docker_compose/intel/cpu/xeon/ +docker compose up -d ``` After starting the containers, you need to view their status with the command: @@ -126,6 +126,12 @@ The following containers should be running: Containers should not restart. +(Optional) Enabling monitoring using the command: + +```bash +docker compose -f compose.yaml -f compose.monitoring.yaml up -d +``` + #### 3.1.1. Configuring GPU forwarding By default, in the Docker Compose file, compose_vllm.yaml is configured to forward all GPUs to the audioqna-vllm-service container. 
diff --git a/AudioQnA/docker_compose/intel/cpu/xeon/compose.monitoring.yaml b/AudioQnA/docker_compose/intel/cpu/xeon/compose.monitoring.yaml new file mode 100644 index 0000000000..187427d348 --- /dev/null +++ b/AudioQnA/docker_compose/intel/cpu/xeon/compose.monitoring.yaml @@ -0,0 +1,59 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +services: + prometheus: + image: prom/prometheus:v2.52.0 + container_name: opea_prometheus + user: root + volumes: + - ./prometheus.yaml:/etc/prometheus/prometheus.yaml + - ./prometheus_data:/prometheus + command: + - '--config.file=/etc/prometheus/prometheus.yaml' + ports: + - '9090:9090' + ipc: host + restart: unless-stopped + + grafana: + image: grafana/grafana:11.0.0 + container_name: grafana + volumes: + - ./grafana_data:/var/lib/grafana + - ./grafana/dashboards:/var/lib/grafana/dashboards + - ./grafana/provisioning:/etc/grafana/provisioning + user: root + environment: + GF_SECURITY_ADMIN_PASSWORD: admin + GF_RENDERING_CALLBACK_URL: http://grafana:3000/ + GF_LOG_FILTERS: rendering:debug + no_proxy: ${no_proxy} + host_ip: ${host_ip} + depends_on: + - prometheus + ports: + - '3000:3000' + ipc: host + restart: unless-stopped + + node-exporter: + image: prom/node-exporter + container_name: node-exporter + volumes: + - /proc:/host/proc:ro + - /sys:/host/sys:ro + - /:/rootfs:ro + command: + - '--path.procfs=/host/proc' + - '--path.sysfs=/host/sys' + - --collector.filesystem.ignored-mount-points + - "^/(sys|proc|dev|host|etc|rootfs/var/lib/docker/containers|rootfs/var/lib/docker/overlay2|rootfs/run/docker/netns|rootfs/var/lib/docker/aufs)($$|/)" + environment: + no_proxy: ${no_proxy} + ports: + - 9100:9100 + ipc: host + restart: always + deploy: + mode: global diff --git a/AudioQnA/docker_compose/intel/cpu/xeon/compose.yaml b/AudioQnA/docker_compose/intel/cpu/xeon/compose.yaml index a9020a4b89..b48593a233 100644 --- a/AudioQnA/docker_compose/intel/cpu/xeon/compose.yaml +++ b/AudioQnA/docker_compose/intel/cpu/xeon/compose.yaml @@ -25,7 +25,7 @@ services: https_proxy: ${https_proxy} restart: unless-stopped vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-service ports: - ${LLM_SERVER_PORT:-3006}:80 diff --git a/AudioQnA/docker_compose/intel/cpu/xeon/compose_multilang.yaml b/AudioQnA/docker_compose/intel/cpu/xeon/compose_multilang.yaml index 16b72813e2..21b3ecfc4d 100644 --- a/AudioQnA/docker_compose/intel/cpu/xeon/compose_multilang.yaml +++ b/AudioQnA/docker_compose/intel/cpu/xeon/compose_multilang.yaml @@ -29,7 +29,7 @@ services: # - ./pretrained_models/:/home/user/GPT-SoVITS/GPT_SoVITS/pretrained_models/ restart: unless-stopped vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-service ports: - ${LLM_SERVER_PORT:-3006}:80 diff --git a/AudioQnA/docker_compose/intel/cpu/xeon/compose_openeuler.yaml b/AudioQnA/docker_compose/intel/cpu/xeon/compose_openeuler.yaml new file mode 100644 index 0000000000..5ae931a78f --- /dev/null +++ b/AudioQnA/docker_compose/intel/cpu/xeon/compose_openeuler.yaml @@ -0,0 +1,91 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. 
+# SPDX-License-Identifier: Apache-2.0 + +services: + whisper-service: + image: ${REGISTRY:-opea}/whisper:${TAG:-latest}-openeuler + container_name: whisper-service + ports: + - ${WHISPER_SERVER_PORT:-7066}:7066 + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + restart: unless-stopped + speecht5-service: + image: ${REGISTRY:-opea}/speecht5:${TAG:-latest}-openeuler + container_name: speecht5-service + ports: + - ${SPEECHT5_SERVER_PORT:-7055}:7055 + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + restart: unless-stopped + vllm-service: + image: openeuler/vllm-cpu:0.10.1-oe2403lts + container_name: vllm-service + ports: + - ${LLM_SERVER_PORT:-3006}:80 + volumes: + - "${MODEL_CACHE:-./data}:/root/.cache/huggingface/hub" + shm_size: 128g + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + HF_TOKEN: ${HF_TOKEN} + LLM_MODEL_ID: ${LLM_MODEL_ID} + VLLM_TORCH_PROFILER_DIR: "/mnt" + LLM_SERVER_PORT: ${LLM_SERVER_PORT} + VLLM_CPU_OMP_THREADS_BIND: all + VLLM_CPU_KVCACHE_SPACE: 30 + healthcheck: + test: ["CMD-SHELL", "curl -f http://$host_ip:${LLM_SERVER_PORT}/health || exit 1"] + interval: 10s + timeout: 10s + retries: 100 + command: --model ${LLM_MODEL_ID} --host 0.0.0.0 --port 80 + audioqna-xeon-backend-server: + image: ${REGISTRY:-opea}/audioqna:${TAG:-latest}-openeuler + container_name: audioqna-xeon-backend-server + depends_on: + - whisper-service + - vllm-service + - speecht5-service + ports: + - "3008:8888" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} + - WHISPER_SERVER_HOST_IP=${WHISPER_SERVER_HOST_IP} + - WHISPER_SERVER_PORT=${WHISPER_SERVER_PORT} + - LLM_SERVER_HOST_IP=${LLM_SERVER_HOST_IP} + - LLM_SERVER_PORT=${LLM_SERVER_PORT} + - LLM_MODEL_ID=${LLM_MODEL_ID} + - SPEECHT5_SERVER_HOST_IP=${SPEECHT5_SERVER_HOST_IP} + - SPEECHT5_SERVER_PORT=${SPEECHT5_SERVER_PORT} + ipc: host + restart: always + audioqna-xeon-ui-server: + image: ${REGISTRY:-opea}/audioqna-ui:${TAG:-latest}-openeuler + container_name: audioqna-xeon-ui-server + depends_on: + - audioqna-xeon-backend-server + ports: + - "5173:5173" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - CHAT_URL=${BACKEND_SERVICE_ENDPOINT} + ipc: host + restart: always + +networks: + default: + driver: bridge diff --git a/AudioQnA/docker_compose/intel/cpu/xeon/grafana/dashboards/download_opea_dashboard.sh b/AudioQnA/docker_compose/intel/cpu/xeon/grafana/dashboards/download_opea_dashboard.sh new file mode 100644 index 0000000000..52cc7632d3 --- /dev/null +++ b/AudioQnA/docker_compose/intel/cpu/xeon/grafana/dashboards/download_opea_dashboard.sh @@ -0,0 +1,12 @@ +#!/bin/bash +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +if ls *.json 1> /dev/null 2>&1; then + rm *.json +fi + +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/vllm_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/tgi_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/audioqna_megaservice_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/node_grafana.json diff --git 
a/AudioQnA/docker_compose/intel/cpu/xeon/grafana/provisioning/dashboards/local.yaml b/AudioQnA/docker_compose/intel/cpu/xeon/grafana/provisioning/dashboards/local.yaml new file mode 100644 index 0000000000..13922a769b --- /dev/null +++ b/AudioQnA/docker_compose/intel/cpu/xeon/grafana/provisioning/dashboards/local.yaml @@ -0,0 +1,14 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +apiVersion: 1 + +providers: +- name: 'default' + orgId: 1 + folder: '' + type: file + disableDeletion: false + updateIntervalSeconds: 10 #how often Grafana will scan for changed dashboards + options: + path: /var/lib/grafana/dashboards diff --git a/AudioQnA/docker_compose/intel/cpu/xeon/grafana/provisioning/datasources/datasource.yaml b/AudioQnA/docker_compose/intel/cpu/xeon/grafana/provisioning/datasources/datasource.yaml new file mode 100644 index 0000000000..a206521d67 --- /dev/null +++ b/AudioQnA/docker_compose/intel/cpu/xeon/grafana/provisioning/datasources/datasource.yaml @@ -0,0 +1,54 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +# config file version +apiVersion: 1 + +# list of datasources that should be deleted from the database +deleteDatasources: + - name: Prometheus + orgId: 1 + +# list of datasources to insert/update depending +# what's available in the database +datasources: + # name of the datasource. Required +- name: Prometheus + # datasource type. Required + type: prometheus + # access mode. direct or proxy. Required + access: proxy + # org id. will default to orgId 1 if not specified + orgId: 1 + # url + url: http://$host_ip:9090 + # database password, if used + password: + # database user, if used + user: + # database name, if used + database: + # enable/disable basic auth + basicAuth: false + # basic auth username, if used + basicAuthUser: + # basic auth password, if used + basicAuthPassword: + # enable/disable with credentials headers + withCredentials: + # mark as default datasource. Max one per org + isDefault: true + # fields that will be converted to json and stored in json_data + jsonData: + httpMethod: GET + graphiteVersion: "1.1" + tlsAuth: false + tlsAuthWithCACert: false + # json object of data that will be encrypted. + secureJsonData: + tlsCACert: "..." + tlsClientCert: "..." + tlsClientKey: "..." + version: 1 + # allow users to edit datasources from the UI. 
+ editable: true diff --git a/AudioQnA/docker_compose/intel/cpu/xeon/prometheus.yaml b/AudioQnA/docker_compose/intel/cpu/xeon/prometheus.yaml new file mode 100644 index 0000000000..0f1e5ff81d --- /dev/null +++ b/AudioQnA/docker_compose/intel/cpu/xeon/prometheus.yaml @@ -0,0 +1,29 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +# [IP_ADDR]:{PORT_OUTSIDE_CONTAINER} -> {PORT_INSIDE_CONTAINER} / {PROTOCOL} +global: + scrape_interval: 5s + external_labels: + monitor: "my-monitor" +scrape_configs: + - job_name: "prometheus" + static_configs: + - targets: ["opea_prometheus:9090"] + - job_name: "vllm" + metrics_path: /metrics + static_configs: + - targets: ["vllm-service:80"] + - job_name: "tgi" + metrics_path: /metrics + static_configs: + - targets: ["tgi-service:80"] + - job_name: "audioqna-backend-server" + metrics_path: /metrics + static_configs: + - targets: ["audioqna-xeon-backend-server:8888"] + - job_name: "prometheus-node-exporter" + scrape_interval: 30s + scrape_timeout: 25s + metrics_path: /metrics + static_configs: + - targets: ["node-exporter:9100"] diff --git a/AudioQnA/docker_compose/intel/cpu/xeon/set_env.sh b/AudioQnA/docker_compose/intel/cpu/xeon/set_env.sh index 3fb001855d..0c0f0a410f 100644 --- a/AudioQnA/docker_compose/intel/cpu/xeon/set_env.sh +++ b/AudioQnA/docker_compose/intel/cpu/xeon/set_env.sh @@ -3,6 +3,8 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 +SCRIPT_DIR=$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" &> /dev/null && pwd) + # export host_ip= export host_ip=$(hostname -I | awk '{print $1}') export HF_TOKEN=${HF_TOKEN} @@ -21,3 +23,9 @@ export SPEECHT5_SERVER_PORT=7055 export LLM_SERVER_PORT=3006 export BACKEND_SERVICE_ENDPOINT=http://${host_ip}:3008/v1/audioqna + +pushd "${SCRIPT_DIR}/grafana/dashboards" > /dev/null +source download_opea_dashboard.sh +popd > /dev/null + +export no_proxy="${no_proxy},localhost,127.0.0.1,${host_ip},node-exporter,opea_prometheus,grafana" diff --git a/AudioQnA/docker_compose/intel/hpu/gaudi/README.md b/AudioQnA/docker_compose/intel/hpu/gaudi/README.md index ae2ede434e..031fc81f79 100644 --- a/AudioQnA/docker_compose/intel/hpu/gaudi/README.md +++ b/AudioQnA/docker_compose/intel/hpu/gaudi/README.md @@ -15,12 +15,18 @@ Note: The default LLM is `meta-llama/Meta-Llama-3-8B-Instruct`. Before deploying This section describes how to quickly deploy and test the AudioQnA service manually on an Intel® Gaudi® processor. The basic steps are: -1. [Access the Code](#access-the-code) -2. [Configure the Deployment Environment](#configure-the-deployment-environment) -3. [Deploy the Services Using Docker Compose](#deploy-the-services-using-docker-compose) -4. [Check the Deployment Status](#check-the-deployment-status) -5. [Validate the Pipeline](#validate-the-pipeline) -6. 
[Cleanup the Deployment](#cleanup-the-deployment) +- [Deploying AudioQnA on Intel® Gaudi® Processors](#deploying-audioqna-on-intel-gaudi-processors) + - [Table of Contents](#table-of-contents) + - [AudioQnA Quick Start Deployment](#audioqna-quick-start-deployment) + - [Access the Code](#access-the-code) + - [Configure the Deployment Environment](#configure-the-deployment-environment) + - [Deploy the Services Using Docker Compose](#deploy-the-services-using-docker-compose) + - [Check the Deployment Status](#check-the-deployment-status) + - [Validate the Pipeline](#validate-the-pipeline) + - [Cleanup the Deployment](#cleanup-the-deployment) + - [AudioQnA Docker Compose Files](#audioqna-docker-compose-files) + - [Validate MicroServices](#validate-microservices) + - [Conclusion](#conclusion) ### Access the Code @@ -79,6 +85,13 @@ Please refer to the table below to build different microservices from source: | MegaService | [MegaService build guide](../../../../README_miscellaneous.md#build-megaservice-docker-image) | | UI | [Basic UI build guide](../../../../README_miscellaneous.md#build-ui-docker-image) | +(Optional) Enabling monitoring using the command: + +```bash +cd docker_compose/intel/hpu/gaudi +docker compose -f compose.yaml -f compose.monitoring.yaml up -d +``` + ### Check the Deployment Status After running docker compose, check if all the containers launched via docker compose have started: @@ -128,6 +141,12 @@ To stop the containers associated with the deployment, execute the following com docker compose -f compose.yaml down ``` +If monitoring is enabled, stop the containers using the following command: + +```bash +docker compose -f compose.yaml -f compose.monitoring.yaml down +``` + ## AudioQnA Docker Compose Files In the context of deploying an AudioQnA pipeline on an Intel® Gaudi® platform, we can pick and choose different large language model serving frameworks. The table below outlines the various configurations that are available as part of the application. These configurations can be used as templates and can be extended to different components available in [GenAIComps](https://github.com/opea-project/GenAIComps.git). 
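+Whichever compose file is chosen, if monitoring is enabled a quick smoke test can confirm the stack is healthy. The check below is illustrative and assumes the default ports published by `compose.monitoring.yaml` (9090 for Prometheus, 3000 for Grafana):
+
+```bash
+# Prometheus should list its scrape jobs (vllm/tgi, the AudioQnA backend, node-exporter).
+curl -s http://${host_ip}:9090/api/v1/targets | grep -o '"job":"[^"]*"' | sort -u
+# Grafana should report a healthy database; dashboards are served at http://<host_ip>:3000 (admin/admin by default).
+curl -s http://${host_ip}:3000/api/health
+```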
diff --git a/AudioQnA/docker_compose/intel/hpu/gaudi/compose.monitoring.yaml b/AudioQnA/docker_compose/intel/hpu/gaudi/compose.monitoring.yaml new file mode 100644 index 0000000000..d64b97673e --- /dev/null +++ b/AudioQnA/docker_compose/intel/hpu/gaudi/compose.monitoring.yaml @@ -0,0 +1,74 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +services: + prometheus: + image: prom/prometheus:v2.52.0 + container_name: opea_prometheus + user: root + volumes: + - ./prometheus.yaml:/etc/prometheus/prometheus.yaml + - ./prometheus_data:/prometheus + command: + - '--config.file=/etc/prometheus/prometheus.yaml' + ports: + - '9090:9090' + ipc: host + restart: unless-stopped + + grafana: + image: grafana/grafana:11.0.0 + container_name: grafana + volumes: + - ./grafana_data:/var/lib/grafana + - ./grafana/dashboards:/var/lib/grafana/dashboards + - ./grafana/provisioning:/etc/grafana/provisioning + user: root + environment: + GF_SECURITY_ADMIN_PASSWORD: admin + GF_RENDERING_CALLBACK_URL: http://grafana:3000/ + GF_LOG_FILTERS: rendering:debug + no_proxy: ${no_proxy} + host_ip: ${host_ip} + depends_on: + - prometheus + ports: + - '3000:3000' + ipc: host + restart: unless-stopped + + node-exporter: + image: prom/node-exporter + container_name: node-exporter + volumes: + - /proc:/host/proc:ro + - /sys:/host/sys:ro + - /:/rootfs:ro + command: + - '--path.procfs=/host/proc' + - '--path.sysfs=/host/sys' + - --collector.filesystem.mount-points-exclude + - "^/(sys|proc|dev|host|etc|rootfs/var/lib/docker/containers|rootfs/var/lib/docker/overlay2|rootfs/run/docker/netns|rootfs/var/lib/docker/aufs)($$|/)" + environment: + no_proxy: ${no_proxy} + ports: + - 9100:9100 + ipc: host + restart: always + deploy: + mode: global + + gaudi-metrics-exporter: + image: vault.habana.ai/gaudi-metric-exporter/metric-exporter:latest + privileged: true + container_name: gaudi-metrics-exporter + volumes: + - /proc:/host/proc:ro + - /sys:/host/sys:ro + - /:/rootfs:ro + - /dev:/dev + deploy: + mode: global + ports: + - 41611:41611 + restart: unless-stopped diff --git a/AudioQnA/docker_compose/intel/hpu/gaudi/compose.yaml b/AudioQnA/docker_compose/intel/hpu/gaudi/compose.yaml index 3cfd68c9b1..b99050f722 100644 --- a/AudioQnA/docker_compose/intel/hpu/gaudi/compose.yaml +++ b/AudioQnA/docker_compose/intel/hpu/gaudi/compose.yaml @@ -35,7 +35,7 @@ services: - SYS_NICE restart: unless-stopped vllm-service: - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} + image: opea/vllm-gaudi:1.22.0 container_name: vllm-gaudi-service ports: - ${LLM_SERVER_PORT:-3006}:80 diff --git a/AudioQnA/docker_compose/intel/hpu/gaudi/grafana/dashboards/download_opea_dashboard.sh b/AudioQnA/docker_compose/intel/hpu/gaudi/grafana/dashboards/download_opea_dashboard.sh new file mode 100644 index 0000000000..0dcd3d9b04 --- /dev/null +++ b/AudioQnA/docker_compose/intel/hpu/gaudi/grafana/dashboards/download_opea_dashboard.sh @@ -0,0 +1,13 @@ +#!/bin/bash +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +if ls *.json 1> /dev/null 2>&1; then + rm *.json +fi + +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/vllm_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/tgi_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/gaudi_grafana_v2.json +wget 
https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/audioqna_megaservice_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/node_grafana.json diff --git a/AudioQnA/docker_compose/intel/hpu/gaudi/grafana/provisioning/dashboards/local.yaml b/AudioQnA/docker_compose/intel/hpu/gaudi/grafana/provisioning/dashboards/local.yaml new file mode 100644 index 0000000000..13922a769b --- /dev/null +++ b/AudioQnA/docker_compose/intel/hpu/gaudi/grafana/provisioning/dashboards/local.yaml @@ -0,0 +1,14 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +apiVersion: 1 + +providers: +- name: 'default' + orgId: 1 + folder: '' + type: file + disableDeletion: false + updateIntervalSeconds: 10 #how often Grafana will scan for changed dashboards + options: + path: /var/lib/grafana/dashboards diff --git a/AudioQnA/docker_compose/intel/hpu/gaudi/grafana/provisioning/datasources/datasource.yaml b/AudioQnA/docker_compose/intel/hpu/gaudi/grafana/provisioning/datasources/datasource.yaml new file mode 100644 index 0000000000..a206521d67 --- /dev/null +++ b/AudioQnA/docker_compose/intel/hpu/gaudi/grafana/provisioning/datasources/datasource.yaml @@ -0,0 +1,54 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +# config file version +apiVersion: 1 + +# list of datasources that should be deleted from the database +deleteDatasources: + - name: Prometheus + orgId: 1 + +# list of datasources to insert/update depending +# what's available in the database +datasources: + # name of the datasource. Required +- name: Prometheus + # datasource type. Required + type: prometheus + # access mode. direct or proxy. Required + access: proxy + # org id. will default to orgId 1 if not specified + orgId: 1 + # url + url: http://$host_ip:9090 + # database password, if used + password: + # database user, if used + user: + # database name, if used + database: + # enable/disable basic auth + basicAuth: false + # basic auth username, if used + basicAuthUser: + # basic auth password, if used + basicAuthPassword: + # enable/disable with credentials headers + withCredentials: + # mark as default datasource. Max one per org + isDefault: true + # fields that will be converted to json and stored in json_data + jsonData: + httpMethod: GET + graphiteVersion: "1.1" + tlsAuth: false + tlsAuthWithCACert: false + # json object of data that will be encrypted. + secureJsonData: + tlsCACert: "..." + tlsClientCert: "..." + tlsClientKey: "..." + version: 1 + # allow users to edit datasources from the UI. 
+ editable: true diff --git a/AudioQnA/docker_compose/intel/hpu/gaudi/prometheus.yaml b/AudioQnA/docker_compose/intel/hpu/gaudi/prometheus.yaml new file mode 100644 index 0000000000..cdd5170266 --- /dev/null +++ b/AudioQnA/docker_compose/intel/hpu/gaudi/prometheus.yaml @@ -0,0 +1,34 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +# [IP_ADDR]:{PORT_OUTSIDE_CONTAINER} -> {PORT_INSIDE_CONTAINER} / {PROTOCOL} +global: + scrape_interval: 5s + external_labels: + monitor: "my-monitor" +scrape_configs: + - job_name: "prometheus" + static_configs: + - targets: ["opea_prometheus:9090"] + - job_name: "vllm" + metrics_path: /metrics + static_configs: + - targets: ["vllm-gaudi-service:80"] + - job_name: "tgi" + metrics_path: /metrics + static_configs: + - targets: ["tgi-gaudi-service:80"] + - job_name: "audioqna-backend-server" + metrics_path: /metrics + static_configs: + - targets: ["audioqna-gaudi-backend-server:8888"] + - job_name: "prometheus-node-exporter" + scrape_interval: 30s + scrape_timeout: 25s + metrics_path: /metrics + static_configs: + - targets: ["node-exporter:9100"] + - job_name: "gaudi-metrics-exporter" + scrape_interval: 30s + metrics_path: /metrics + static_configs: + - targets: ["gaudi-metrics-exporter:41611"] diff --git a/AudioQnA/docker_compose/intel/hpu/gaudi/set_env.sh b/AudioQnA/docker_compose/intel/hpu/gaudi/set_env.sh index 4b19d19c08..4e18b81ac7 100644 --- a/AudioQnA/docker_compose/intel/hpu/gaudi/set_env.sh +++ b/AudioQnA/docker_compose/intel/hpu/gaudi/set_env.sh @@ -3,6 +3,8 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 +SCRIPT_DIR=$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" &> /dev/null && pwd) + # export host_ip= export host_ip=$(hostname -I | awk '{print $1}') export HF_TOKEN=${HF_TOKEN} @@ -26,3 +28,9 @@ export SPEECHT5_SERVER_PORT=7055 export LLM_SERVER_PORT=3006 export BACKEND_SERVICE_ENDPOINT=http://${host_ip}:3008/v1/audioqna + +pushd "${SCRIPT_DIR}/grafana/dashboards" > /dev/null +source download_opea_dashboard.sh +popd > /dev/null + +export no_proxy="${no_proxy},localhost,127.0.0.1,${host_ip},node-exporter,opea_prometheus,grafana" diff --git a/AudioQnA/docker_image_build/build.yaml b/AudioQnA/docker_image_build/build.yaml index e7688555c1..696a2bfdb6 100644 --- a/AudioQnA/docker_image_build/build.yaml +++ b/AudioQnA/docker_image_build/build.yaml @@ -13,12 +13,29 @@ services: context: ../ dockerfile: ./Dockerfile image: ${REGISTRY:-opea}/audioqna:${TAG:-latest} + audioqna-openeuler: + build: + args: + IMAGE_REPO: ${REGISTRY} + BASE_TAG: ${TAG} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + no_proxy: ${no_proxy} + context: ../ + dockerfile: ./Dockerfile.openEuler + image: ${REGISTRY:-opea}/audioqna:${TAG:-latest}-openeuler audioqna-ui: build: context: ../ui dockerfile: ./docker/Dockerfile extends: audioqna image: ${REGISTRY:-opea}/audioqna-ui:${TAG:-latest} + audioqna-ui-openeuler: + build: + context: ../ui + dockerfile: ./docker/Dockerfile.openEuler + extends: audioqna + image: ${REGISTRY:-opea}/audioqna-ui:${TAG:-latest}-openeuler audioqna-multilang: build: context: ../ @@ -37,6 +54,12 @@ services: dockerfile: comps/third_parties/whisper/src/Dockerfile extends: audioqna image: ${REGISTRY:-opea}/whisper:${TAG:-latest} + whisper-openeuler: + build: + context: GenAIComps + dockerfile: comps/third_parties/whisper/src/Dockerfile.openEuler + extends: audioqna + image: ${REGISTRY:-opea}/whisper:${TAG:-latest}-openeuler asr: build: context: GenAIComps @@ -61,6 +84,12 @@ services: 
dockerfile: comps/third_parties/speecht5/src/Dockerfile extends: audioqna image: ${REGISTRY:-opea}/speecht5:${TAG:-latest} + speecht5-openeuler: + build: + context: GenAIComps + dockerfile: comps/third_parties/speecht5/src/Dockerfile.openEuler + extends: audioqna + image: ${REGISTRY:-opea}/speecht5:${TAG:-latest}-openeuler tts: build: context: GenAIComps @@ -73,18 +102,6 @@ services: dockerfile: comps/third_parties/gpt-sovits/src/Dockerfile extends: audioqna image: ${REGISTRY:-opea}/gpt-sovits:${TAG:-latest} - vllm: - build: - context: vllm - dockerfile: docker/Dockerfile.cpu - extends: audioqna - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} - vllm-gaudi: - build: - context: vllm-fork - dockerfile: Dockerfile.hpu - extends: audioqna - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} vllm-rocm: build: context: GenAIComps diff --git a/AudioQnA/kubernetes/helm/cpu-openeuler-values.yaml b/AudioQnA/kubernetes/helm/cpu-openeuler-values.yaml new file mode 100644 index 0000000000..a9f0559098 --- /dev/null +++ b/AudioQnA/kubernetes/helm/cpu-openeuler-values.yaml @@ -0,0 +1,40 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. +# SPDX-License-Identifier: Apache-2.0 + +# This file is based on cpu-values.yaml and overrides image tags to 'latest-openeuler' +# for all enabled services to run on openEuler. +image: + tag: latest-openeuler + +tgi: + enabled: false + +# Overrides from cpu-values.yaml +vllm: + enabled: true + image: + repository: openeuler/vllm-cpu + tag: 0.10.1-oe2403lts + +speecht5: + enabled: true + image: + tag: latest-openeuler + +whisper: + enabled: true + image: + tag: latest-openeuler + +gpt-sovits: + enabled: false + +nginx: + image: + tag: latest-openeuler + service: + type: NodePort + +audioqna-ui: + image: + tag: latest-openeuler diff --git a/AudioQnA/tests/test_compose_multilang_on_xeon.sh b/AudioQnA/tests/test_compose_multilang_on_xeon.sh index 770838c1e2..22e569dc26 100644 --- a/AudioQnA/tests/test_compose_multilang_on_xeon.sh +++ b/AudioQnA/tests/test_compose_multilang_on_xeon.sh @@ -25,14 +25,8 @@ function build_docker_images() { docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git - cd ./vllm/ - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &> /dev/null && cd ../ - echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="audioqna-multilang audioqna-ui whisper gpt-sovits vllm" + service_list="audioqna-multilang audioqna-ui whisper gpt-sovits" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -41,6 +35,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/cpu/xeon/ export host_ip=${ip_address} + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env diff --git a/AudioQnA/tests/test_compose_on_epyc.sh b/AudioQnA/tests/test_compose_on_epyc.sh index 6fc56775a8..ac154e3632 100644 --- a/AudioQnA/tests/test_compose_on_epyc.sh +++ b/AudioQnA/tests/test_compose_on_epyc.sh @@ -27,20 +27,8 @@ function build_docker_images() { docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . 
popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git - cd ./vllm/ - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &>/dev/null - VLLM_REQ_FILE="requirements/cpu.txt" - if ! grep -q "^transformers" "$VLLM_REQ_FILE"; then - echo "Adding transformers<4.54.0 to $VLLM_REQ_FILE" - echo "transformers<4.54.0" >>"$VLLM_REQ_FILE" - fi - cd ../ - echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="audioqna audioqna-ui whisper speecht5 vllm" + service_list="audioqna audioqna-ui whisper speecht5" docker compose -f build.yaml build ${service_list} --no-cache >${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -49,6 +37,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/amd/cpu/epyc/ export host_ip=${ip_address} + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env diff --git a/AudioQnA/tests/test_compose_on_gaudi.sh b/AudioQnA/tests/test_compose_on_gaudi.sh index c24f5ff82e..b42d5cee72 100644 --- a/AudioQnA/tests/test_compose_on_gaudi.sh +++ b/AudioQnA/tests/test_compose_on_gaudi.sh @@ -25,14 +25,8 @@ function build_docker_images() { docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/HabanaAI/vllm-fork.git - cd vllm-fork/ - VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0 - echo "Check out vLLM tag ${VLLM_FORK_VER}" - git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../ - echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="audioqna audioqna-ui whisper-gaudi speecht5-gaudi vllm-gaudi" + service_list="audioqna audioqna-ui whisper-gaudi speecht5-gaudi" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -41,14 +35,15 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/hpu/gaudi export host_ip=${ip_address} + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env # Start Docker Containers - docker compose up -d > ${LOG_PATH}/start_services_with_compose.log + docker compose -f compose.yaml -f compose.monitoring.yaml up -d > ${LOG_PATH}/start_services_with_compose.log n=0 until [[ "$n" -ge 200 ]]; do - docker logs vllm-gaudi-service > $LOG_PATH/vllm_service_start.log 2>&1 + docker logs vllm-gaudi-service 2>&1| tee $LOG_PATH/vllm_service_start.log if grep -q complete $LOG_PATH/vllm_service_start.log; then break fi @@ -58,8 +53,8 @@ function start_services() { n=0 until [[ "$n" -ge 100 ]]; do - docker logs whisper-service > $LOG_PATH/whisper_service_start.log - if grep -q "Uvicorn server setup on port" $LOG_PATH/whisper_service_start.log; then + docker logs whisper-service 2>&1| tee $LOG_PATH/whisper_service_start.log + if grep -q "Uvicorn running on" $LOG_PATH/whisper_service_start.log; then break fi sleep 5s @@ -70,16 +65,15 @@ function start_services() { function validate_megaservice() { response=$(http_proxy="" curl http://${ip_address}:3008/v1/audioqna -XPOST -d '{"audio": "UklGRigAAABXQVZFZm10IBIAAAABAAEARKwAAIhYAQACABAAAABkYXRhAgAAAAEA", "max_tokens":64}' -H 'Content-Type: application/json') - # always print the log - docker logs whisper-service > $LOG_PATH/whisper-service.log - 
docker logs speecht5-service > $LOG_PATH/tts-service.log - docker logs vllm-gaudi-service > $LOG_PATH/vllm-gaudi-service.log - docker logs audioqna-gaudi-backend-server > $LOG_PATH/audioqna-gaudi-backend-server.log echo "$response" | sed 's/^"//;s/"$//' | base64 -d > speech.mp3 if [[ $(file speech.mp3) == *"RIFF"* ]]; then echo "Result correct." else + docker logs whisper-service > $LOG_PATH/whisper-service.log + docker logs speecht5-service > $LOG_PATH/tts-service.log + docker logs vllm-gaudi-service > $LOG_PATH/vllm-gaudi-service.log + docker logs audioqna-gaudi-backend-server > $LOG_PATH/audioqna-gaudi-backend-server.log echo "Result wrong." exit 1 fi @@ -87,7 +81,7 @@ function validate_megaservice() { function stop_docker() { cd $WORKPATH/docker_compose/intel/hpu/gaudi - docker compose -f compose.yaml stop && docker compose rm -f + docker compose -f compose.yaml -f compose.monitoring.yaml down } function main() { diff --git a/AudioQnA/tests/test_compose_on_rocm.sh b/AudioQnA/tests/test_compose_on_rocm.sh index 9456bf6bd1..8a235a6728 100644 --- a/AudioQnA/tests/test_compose_on_rocm.sh +++ b/AudioQnA/tests/test_compose_on_rocm.sh @@ -35,6 +35,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/amd/gpu/rocm/ + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # Start Docker Containers docker compose up -d > ${LOG_PATH}/start_services_with_compose.log diff --git a/AudioQnA/tests/test_compose_on_xeon.sh b/AudioQnA/tests/test_compose_on_xeon.sh index a83e4a598e..023a5999b7 100644 --- a/AudioQnA/tests/test_compose_on_xeon.sh +++ b/AudioQnA/tests/test_compose_on_xeon.sh @@ -25,14 +25,8 @@ function build_docker_images() { docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git - cd ./vllm/ - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &> /dev/null && cd ../ - echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="audioqna audioqna-ui whisper speecht5 vllm" + service_list="audioqna audioqna-ui whisper speecht5" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -41,11 +35,12 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/cpu/xeon/ export host_ip=${ip_address} + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env # Start Docker Containers - docker compose up -d > ${LOG_PATH}/start_services_with_compose.log + docker compose -f compose.yaml -f compose.monitoring.yaml up -d > ${LOG_PATH}/start_services_with_compose.log n=0 until [[ "$n" -ge 200 ]]; do docker logs vllm-service > $LOG_PATH/vllm_service_start.log 2>&1 @@ -79,7 +74,7 @@ function validate_megaservice() { function stop_docker() { cd $WORKPATH/docker_compose/intel/cpu/xeon/ - docker compose -f compose.yaml stop && docker compose rm -f + docker compose -f compose.yaml -f compose.monitoring.yaml down } function main() { diff --git a/AudioQnA/tests/test_compose_openeuler_on_xeon.sh b/AudioQnA/tests/test_compose_openeuler_on_xeon.sh new file mode 100644 index 0000000000..3b30adfe2d --- /dev/null +++ b/AudioQnA/tests/test_compose_openeuler_on_xeon.sh @@ -0,0 +1,104 @@ +#!/bin/bash +# Copyright (C) 2025 Huawei Technologies Co., Ltd. 
+# SPDX-License-Identifier: Apache-2.0 + +set -e +IMAGE_REPO=${IMAGE_REPO:-"opea"} +IMAGE_TAG=${IMAGE_TAG:-"latest"} +echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" +echo "TAG=IMAGE_TAG=${IMAGE_TAG}" +export REGISTRY=${IMAGE_REPO} +export TAG=${IMAGE_TAG} +export MODEL_CACHE=${model_cache:-"./data"} + +WORKPATH=$(dirname "$PWD") +LOG_PATH="$WORKPATH/tests" +ip_address=$(hostname -I | awk '{print $1}') + +function build_docker_images() { + opea_branch=${opea_branch:-"main"} + + cd $WORKPATH/docker_image_build + git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git + pushd GenAIComps + echo "GenAIComps test commit is $(git rev-parse HEAD)" + docker build --no-cache -t ${REGISTRY}/comps-base:${TAG}-openeuler --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile.openEuler . + popd && sleep 1s + + echo "Build all the images with --no-cache, check docker_image_build.log for details..." + service_list="audioqna-openeuler audioqna-ui-openeuler whisper-openeuler speecht5-openeuler" + docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log + + docker images && sleep 1s +} + +function start_services() { + cd $WORKPATH/docker_compose/intel/cpu/xeon/ + export host_ip=${ip_address} + export no_proxy="localhost,127.0.0.1,$ip_address" + source set_env.sh + # sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env + + # Start Docker Containers + docker compose -f compose_openeuler.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + n=0 + until [[ "$n" -ge 200 ]]; do + docker logs vllm-service > $LOG_PATH/vllm_service_start.log 2>&1 + if grep -q complete $LOG_PATH/vllm_service_start.log; then + break + fi + sleep 5s + n=$((n+1)) + done +} + + +function validate_megaservice() { + response=$(http_proxy="" curl http://${ip_address}:3008/v1/audioqna -XPOST -d '{"audio": "UklGRigAAABXQVZFZm10IBIAAAABAAEARKwAAIhYAQACABAAAABkYXRhAgAAAAEA", "max_tokens":64}' -H 'Content-Type: application/json') + # always print the log + docker logs whisper-service > $LOG_PATH/whisper-service.log + docker logs speecht5-service > $LOG_PATH/tts-service.log + docker logs vllm-service > $LOG_PATH/vllm-service.log + docker logs audioqna-xeon-backend-server > $LOG_PATH/audioqna-xeon-backend-server.log + echo "$response" | sed 's/^"//;s/"$//' | base64 -d > speech.mp3 + + if [[ $(file speech.mp3) == *"RIFF"* ]]; then + echo "Result correct." + else + echo "Result wrong." 
+ exit 1 + fi + +} + +function stop_docker() { + cd $WORKPATH/docker_compose/intel/cpu/xeon/ + docker compose -f compose_openeuler.yaml stop && docker compose rm -f +} + +function main() { + + echo "::group::stop_docker" + stop_docker + echo "::endgroup::" + + echo "::group::build_docker_images" + if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi + echo "::endgroup::" + + echo "::group::start_services" + start_services + echo "::endgroup::" + + echo "::group::validate_megaservice" + validate_megaservice + echo "::endgroup::" + + echo "::group::stop_docker" + stop_docker + docker system prune -f + echo "::endgroup::" + +} + +main diff --git a/AudioQnA/tests/test_compose_tgi_on_epyc.sh b/AudioQnA/tests/test_compose_tgi_on_epyc.sh index b442a155a8..e9c671839e 100644 --- a/AudioQnA/tests/test_compose_tgi_on_epyc.sh +++ b/AudioQnA/tests/test_compose_tgi_on_epyc.sh @@ -38,6 +38,7 @@ function build_docker_images() { function start_services() { echo $WORKPATH cd $WORKPATH/docker_compose/amd/cpu/epyc/ + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # Start Docker Containers docker compose -f compose_tgi.yaml up -d > ${LOG_PATH}/start_services_with_compose.log diff --git a/AudioQnA/tests/test_compose_tgi_on_gaudi.sh b/AudioQnA/tests/test_compose_tgi_on_gaudi.sh index dd68dfe770..13f170c865 100644 --- a/AudioQnA/tests/test_compose_tgi_on_gaudi.sh +++ b/AudioQnA/tests/test_compose_tgi_on_gaudi.sh @@ -35,9 +35,10 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/hpu/gaudi export host_ip=${ip_address} + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # Start Docker Containers - docker compose -f compose_tgi.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + docker compose -f compose_tgi.yaml -f compose.monitoring.yaml up -d > ${LOG_PATH}/start_services_with_compose.log n=0 until [[ "$n" -ge 200 ]]; do docker logs tgi-gaudi-service > $LOG_PATH/tgi_service_start.log @@ -51,7 +52,7 @@ function start_services() { n=0 until [[ "$n" -ge 100 ]]; do docker logs whisper-service > $LOG_PATH/whisper_service_start.log - if grep -q "Uvicorn server setup on port" $LOG_PATH/whisper_service_start.log; then + if grep -q "Uvicorn running on" $LOG_PATH/whisper_service_start.log; then break fi sleep 5s @@ -80,7 +81,7 @@ function validate_megaservice() { function stop_docker() { cd $WORKPATH/docker_compose/intel/hpu/gaudi - docker compose -f compose_tgi.yaml stop && docker compose rm -f + docker compose -f compose_tgi.yaml -f compose.monitoring.yaml down } function main() { diff --git a/AudioQnA/tests/test_compose_tgi_on_xeon.sh b/AudioQnA/tests/test_compose_tgi_on_xeon.sh index bc1f945062..d6e588f266 100644 --- a/AudioQnA/tests/test_compose_tgi_on_xeon.sh +++ b/AudioQnA/tests/test_compose_tgi_on_xeon.sh @@ -35,9 +35,10 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/cpu/xeon/ export host_ip=${ip_address} + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # Start Docker Containers - docker compose -f compose_tgi.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + docker compose -f compose_tgi.yaml -f compose.monitoring.yaml up -d > ${LOG_PATH}/start_services_with_compose.log n=0 until [[ "$n" -ge 200 ]]; do docker logs tgi-service > $LOG_PATH/tgi_service_start.log @@ -71,7 +72,7 @@ function validate_megaservice() { function stop_docker() { cd $WORKPATH/docker_compose/intel/cpu/xeon/ - docker compose -f compose_tgi.yaml stop && docker 
compose rm -f + docker compose -f compose_tgi.yaml -f compose.monitoring.yaml down } function main() { diff --git a/AudioQnA/tests/test_compose_vllm_on_rocm.sh b/AudioQnA/tests/test_compose_vllm_on_rocm.sh index 925b0ba9d8..0d15500107 100644 --- a/AudioQnA/tests/test_compose_vllm_on_rocm.sh +++ b/AudioQnA/tests/test_compose_vllm_on_rocm.sh @@ -33,6 +33,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/amd/gpu/rocm/ + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env_vllm.sh sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env diff --git a/AudioQnA/ui/docker/Dockerfile.openEuler b/AudioQnA/ui/docker/Dockerfile.openEuler new file mode 100644 index 0000000000..7392bb62fd --- /dev/null +++ b/AudioQnA/ui/docker/Dockerfile.openEuler @@ -0,0 +1,31 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. +# SPDX-License-Identifier: Apache-2.0 + +# Use node 20.11.1 as the base image +FROM openeuler/node:20.11.1-oe2403lts@sha256:25c790f93c2243b361919620c069812319f614fd697e32e433402ae706a19ffd + +# Update package manager and install Git +RUN yum update -y && \ + yum install -y \ + git && \ + yum clean all && \ + rm -rf /var/cache/yum + +# Copy the front-end code repository +COPY svelte /home/user/svelte + +# Set the working directory +WORKDIR /home/user/svelte + +# Install front-end dependencies +RUN npm install --package-lock-only +RUN npm ci + +# Build the front-end application +RUN npm run build + +# Expose the port of the front-end application +EXPOSE 5173 + +# Run the front-end application in preview mode +CMD ["npm", "run", "preview", "--", "--port", "5173", "--host", "0.0.0.0"] diff --git a/AudioQnA/ui/svelte/package.json b/AudioQnA/ui/svelte/package.json index c956cea6f6..928abd8b0a 100644 --- a/AudioQnA/ui/svelte/package.json +++ b/AudioQnA/ui/svelte/package.json @@ -18,7 +18,7 @@ "@fortawesome/free-solid-svg-icons": "6.2.0", "@playwright/test": "^1.45.2", "@sveltejs/adapter-auto": "^3.0.0", - "@sveltejs/kit": "2.0.0", + "@sveltejs/kit": "2.20.6", "@sveltejs/vite-plugin-svelte": "^3.0.0", "@tailwindcss/typography": "0.5.7", "@types/debug": "4.1.7", diff --git a/BrowserUseAgent/Dockerfile b/BrowserUseAgent/Dockerfile new file mode 100644 index 0000000000..ad7b3377db --- /dev/null +++ b/BrowserUseAgent/Dockerfile @@ -0,0 +1,21 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +ARG IMAGE_REPO=opea +ARG BASE_TAG=latest +FROM $IMAGE_REPO/comps-base:$BASE_TAG + +USER root + +COPY ./requirements.txt $HOME/requirements.txt +COPY ./browser_use_agent.py $HOME/browser_use_agent.py + +ARG uvpip='uv pip install --system --no-cache-dir' +RUN uv pip install --system --upgrade pip setuptools uv && \ + $uvpip pytest-playwright && \ + playwright install chromium --with-deps --no-shell && \ + $uvpip -r requirements.txt && \ + $uvpip posthog==5.4.0 + +USER user +ENTRYPOINT ["python", "browser_use_agent.py"] \ No newline at end of file diff --git a/BrowserUseAgent/README.md b/BrowserUseAgent/README.md new file mode 100644 index 0000000000..a15ca1e5d5 --- /dev/null +++ b/BrowserUseAgent/README.md @@ -0,0 +1,18 @@ +# Browser-use Agent Application + +Browser-use agent empowers anyone to automate repetitive web tasks. It controls your web browser to perform tasks like visiting websites and extracting data. The application is powered by [browser-use](https://github.com/browser-use/browser-use) and OPEA LLM serving microservice. 
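+Once deployed (see the deployment options below), the agent exposes a single REST endpoint. The request below is an illustrative sketch that assumes the default service port `8022` and the request fields defined in `browser_use_agent.py`; only `task_prompt` is required:
+
+```bash
+# Ask the agent to browse a site and extract information; the URL here is just an example.
+curl -X POST http://localhost:8022/v1/browser_use_agent \
+  -H "Content-Type: application/json" \
+  -d '{"task_prompt": "Open https://example.com and summarize the main heading.", "use_vision": true, "agent_max_steps": 10}'
+```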
+ +## Deployment Options + +The table below lists currently available deployment options. They outline in detail the implementation of this example on selected hardware. + +| Category | Deployment Option | Description | +| ---------------------- | ---------------------- | ----------------------------------------------------------------- | +| On-premise Deployments | Docker Compose (Gaudi) | [Deployment on Gaudi](./docker_compose/intel/hpu/gaudi/README.md) | + +## Validated Configurations + +| **Deploy Method** | **LLM Engine** | **LLM Model** | **Hardware** | +| ----------------- | -------------- | ---------------------------- | ------------ | +| Docker Compose | vLLM | Qwen/Qwen2.5-VL-32B-Instruct | Intel Gaudi | +| Docker Compose | vLLM | Qwen/Qwen2.5-VL-72B-Instruct | Intel Gaudi | diff --git a/BrowserUseAgent/browser_use_agent.py b/BrowserUseAgent/browser_use_agent.py new file mode 100644 index 0000000000..78b97d464b --- /dev/null +++ b/BrowserUseAgent/browser_use_agent.py @@ -0,0 +1,90 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + + +import os + +from browser_use import Agent, BrowserProfile +from comps import opea_microservices, register_microservice +from comps.cores.telemetry.opea_telemetry import opea_telemetry +from fastapi import Request +from langchain_openai import ChatOpenAI +from pydantic import BaseModel, SecretStr + +LLM = None +BROWSER_PROFILE = None +LLM_ENDPOINT = os.getenv("LLM_ENDPOINT", "http://0.0.0.0:8008") +LLM_MODEL = os.getenv("LLM_MODEL", "Qwen/Qwen2.5-VL-32B-Instruct") + + +def initiate_llm_and_browser(llm_endpoint: str, model: str, secret_key: str = "sk-xxxxxx"): + # Initialize global LLM and BrowserProfile if not already initialized + global LLM, BROWSER_PROFILE + if not LLM: + LLM = ChatOpenAI(base_url=f"{llm_endpoint}/v1", model=model, api_key=SecretStr(secret_key), temperature=0.1) + if not BROWSER_PROFILE: + BROWSER_PROFILE = BrowserProfile( + headless=True, + chromium_sandbox=False, + ) + return LLM, BROWSER_PROFILE + + +class BrowserUseRequest(BaseModel): + task_prompt: str + use_vision: bool = True + secret_key: str = "sk-xxxxxx" + llm_endpoint: str = LLM_ENDPOINT + llm_model: str = LLM_MODEL + agent_max_steps: int = 10 + + +class BrowserUseResponse(BaseModel): + is_success: bool = False + model: str + task_prompt: str + use_vision: bool + agent_researched_urls: list[str] = [] + agent_actions: list[str] = [] + agent_durations: float + agent_steps: int + final_result: str + + +@register_microservice( + name="opea_service@browser_use_agent", + endpoint="/v1/browser_use_agent", + host="0.0.0.0", + port=8022, +) +@opea_telemetry +async def run(request: Request): + data = await request.json() + chat_request = BrowserUseRequest.model_validate(data) + llm, browser_profile = initiate_llm_and_browser( + llm_endpoint=chat_request.llm_endpoint, model=chat_request.llm_model, secret_key=chat_request.secret_key + ) + agent = Agent( + task=chat_request.task_prompt, + llm=llm, + use_vision=chat_request.use_vision, + enable_memory=False, + browser_profile=browser_profile, + ) + history = await agent.run(max_steps=chat_request.agent_max_steps) + + return BrowserUseResponse( + is_success=history.is_successful() if history.is_successful() is not None else False, + model=chat_request.llm_model, + task_prompt=chat_request.task_prompt, + use_vision=chat_request.use_vision, + agent_researched_urls=history.urls(), + agent_actions=history.action_names(), + agent_durations=round(history.total_duration_seconds(), 3), + 
agent_steps=history.number_of_steps(), + final_result=history.final_result() if history.is_successful() else f"Task failed: {history.errors()}", + ) + + +if __name__ == "__main__": + opea_microservices["opea_service@browser_use_agent"].start() diff --git a/BrowserUseAgent/docker_compose/intel/hpu/gaudi/README.md b/BrowserUseAgent/docker_compose/intel/hpu/gaudi/README.md new file mode 100644 index 0000000000..7a82c0aebe --- /dev/null +++ b/BrowserUseAgent/docker_compose/intel/hpu/gaudi/README.md @@ -0,0 +1,94 @@ +# Example BrowserUseAgent deployments on an Intel® Gaudi® Platform + +This example covers the single-node on-premises deployment of the BrowserUseAgent example using OPEA components. This example begins with a Quick Start section and then documents how to modify deployments, leverage new models and configure the number of allocated devices. + +**Note** This example requires access to a properly installed Intel® Gaudi® platform with a functional Docker service configured to use the habanalabs-container-runtime. Please consult the [Intel® Gaudi® software Installation Guide](https://docs.habana.ai/en/v1.20.1/Installation_Guide/Driver_Installation.html) for more information. + +## Quick Start Deployment + +This section describes how to quickly deploy and test the BrowserUseAgent service manually on an Intel® Gaudi® platform. The basic steps are: + +1. [Access the Code](#access-the-code) +2. [Generate a HuggingFace Access Token](#generate-a-huggingface-access-token) +3. [Configure the Deployment Environment](#configure-the-deployment-environment) +4. [Deploy the Services Using Docker Compose](#deploy-the-services-using-docker-compose) +5. [Check the Deployment Status](#check-the-deployment-status) +6. [Test the Pipeline](#test-the-pipeline) +7. [Cleanup the Deployment](#cleanup-the-deployment) + +### Access the Code + +Clone the GenAIExample repository and access the BrowserUseAgent Intel® Gaudi® platform Docker Compose files and supporting scripts: + +```bash +git clone https://github.com/opea-project/GenAIExamples.git +cd GenAIExamples/BrowserUseAgent/docker_compose/intel/hpu/gaudi/ +``` + +Checkout a released version, such as v1.5: + +```bash +git checkout v1.5 +``` + +### Generate a HuggingFace Access Token + +Some HuggingFace resources, such as some models, are only accessible if you have an access token. If you do not already have a HuggingFace access token, you can create one by first creating an account by following the steps provided at [HuggingFace](https://huggingface.co/) and then generating a [user access token](https://huggingface.co/docs/transformers.js/en/guides/private#step-1-generating-a-user-access-token). + +### Configure the Deployment Environment + +To set up environment variables for deploying BrowserUseAgent services, source the _setup_env.sh_ script in this directory: + +```bash +source ./set_env.sh +``` + +The _set_env.sh_ script will prompt for required and optional environment variables used to configure the BrowserUseAgent services. If a value is not entered, the script will use a default value for the same. Users need to check if the values fit your deployment environment. + +### Deploy the Services Using Docker Compose + +To deploy the BrowserUseAgent services, execute the `docker compose up` command with the appropriate arguments. For a default deployment, execute: + +```bash +docker compose up -d +``` + +The BrowserUseAgent docker images should automatically be downloaded from the `OPEA registry` and deployed on the Intel® Gaudi® Platform. 
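+To deploy with the larger validated model or a different number of Gaudi cards, override the variables that `set_env.sh` falls back to before sourcing it, then re-run the deployment. The values below are illustrative:
+
+```bash
+# Optional overrides read by set_env.sh (defaults: Qwen/Qwen2.5-VL-32B-Instruct, NUM_CARDS=4, MAX_TOTAL_TOKENS=12288).
+export LLM_MODEL_ID="Qwen/Qwen2.5-VL-72B-Instruct"   # the other validated model
+export NUM_CARDS=8                                   # example value; match the cards available on your platform
+source ./set_env.sh
+docker compose up -d
+```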
+ +### Check the Deployment Status + +After running docker compose, check if all the containers launched via docker compose have started: + +```bash +docker ps -a +``` + +For the default deployment, the following 10 containers should have started: + +``` +CONTAINER ID IMAGE COMMAND CREATED STATUS PORTS NAMES +96cb590c749c opea/browser-use-agent:latest "python browser_use_…" 9 seconds ago Up 8 seconds 0.0.0.0:8022->8022/tcp, :::8022->8022/tcp browser-use-agent-server +8072e1c33a4b opea/vllm-gaudi:1.22.0 "python3 -m vllm.ent…" 9 seconds ago Up 8 seconds (health: starting) 0.0.0.0:8008->80/tcp, [::]:8008->80/tcp vllm-gaudi-server +``` + +### Test the Pipeline + +If you don't have existing websites to test, follow the [guide](./../../../../tests/webarena/README.md) to deploy one in your local environment. + +Once the BrowserUseAgent services are running, test the pipeline using the following command: + +```bash +curl -X POST http://${host_ip}:${BROWSER_USE_AGENT_PORT}/v1/browser_use_agent \ + -H "Content-Type: application/json" \ + -d '{"task_prompt": "Navigate to http://10.7.4.57:8083/admin and login with the credentials: username: admin, password: admin1234. Then, find out What are the top-2 best-selling product in 2022?"}' +``` + +- Note that Update the `task_prompt` to match the evaluation question relevant to your configured website. + +### Cleanup the Deployment + +To stop the containers associated with the deployment, execute the following command: + +```bash +docker compose -f compose.yaml down +``` diff --git a/BrowserUseAgent/docker_compose/intel/hpu/gaudi/compose.yaml b/BrowserUseAgent/docker_compose/intel/hpu/gaudi/compose.yaml new file mode 100644 index 0000000000..e7a2ffd867 --- /dev/null +++ b/BrowserUseAgent/docker_compose/intel/hpu/gaudi/compose.yaml @@ -0,0 +1,50 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +x-common-environment: + &common-env + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + +services: + vllm-gaudi-server: + image: opea/vllm-gaudi:1.22.0 + container_name: vllm-gaudi-server + ports: + - ${LLM_ENDPOINT_PORT:-8008}:80 + volumes: + - "${DATA_PATH:-./data}:/data" + environment: + <<: *common-env + HF_TOKEN: ${HF_TOKEN} + HF_HOME: /data + HABANA_VISIBLE_DEVICES: all + OMPI_MCA_btl_vader_single_copy_mechanism: none + LLM_MODEL_ID: ${LLM_MODEL_ID} + VLLM_TORCH_PROFILER_DIR: "/mnt" + VLLM_SKIP_WARMUP: true + PT_HPU_ENABLE_LAZY_COLLECTIVES: true + runtime: habana + cap_add: + - SYS_NICE + ipc: host + healthcheck: + test: ["CMD-SHELL", "curl -f http://localhost:80/health || exit 1"] + interval: 10s + timeout: 10s + retries: 150 + command: --model $LLM_MODEL_ID --tensor-parallel-size $NUM_CARDS --host 0.0.0.0 --port 80 --max-seq-len-to-capture $MAX_TOTAL_TOKENS + + browser-use-agent-server: + image: ${REGISTRY:-opea}/browser-use-agent:${TAG:-latest} + container_name: browser-use-agent-server + depends_on: + - vllm-gaudi-server + ports: + - ${BROWSER_USE_AGENT_PORT:-8022}:8022 + environment: + <<: *common-env + LLM_ENDPOINT: ${LLM_ENDPOINT-http://0.0.0.0:8008} + LLM_MODEL: ${LLM_MODEL_ID-Qwen/Qwen2-VL-72B-Instruct} + ipc: host diff --git a/BrowserUseAgent/docker_compose/intel/hpu/gaudi/set_env.sh b/BrowserUseAgent/docker_compose/intel/hpu/gaudi/set_env.sh new file mode 100644 index 0000000000..b11bbf903d --- /dev/null +++ b/BrowserUseAgent/docker_compose/intel/hpu/gaudi/set_env.sh @@ -0,0 +1,38 @@ +#!/usr/bin/env bash + +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + 
+# Navigate to the parent directory and source the environment +SCRIPT_DIR=$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" &> /dev/null && pwd) + +pushd "$SCRIPT_DIR/../../../../../" > /dev/null +source .set_env.sh +popd > /dev/null + +# Function to check if a variable is set +check_var() { + if [ "$#" -ne 1 ]; then + echo "Error: Usage: check_var " >&2 + return 2 + fi + + local var_name="$1" + if [ -n "${!var_name}" ]; then + # Variable value is non-empty + return 0 + else + # Variable is unset or set to an empty string + return 1 + fi +} + +check_var "HF_TOKEN" +export ip_address=$(hostname -I | awk '{print $1}') + +export LLM_ENDPOINT_PORT="${LLM_ENDPOINT_PORT:-8008}" +export LLM_ENDPOINT="http://${ip_address}:${LLM_ENDPOINT_PORT}" +export DATA_PATH="${DATA_PATH-"./data"}" +export LLM_MODEL_ID="${LLM_MODEL_ID-"Qwen/Qwen2.5-VL-32B-Instruct"}" +export MAX_TOTAL_TOKENS="${MAX_TOTAL_TOKENS-12288}" +export NUM_CARDS="${NUM_CARDS-4}" diff --git a/BrowserUseAgent/docker_image_build/build.yaml b/BrowserUseAgent/docker_image_build/build.yaml new file mode 100644 index 0000000000..b7a7268d58 --- /dev/null +++ b/BrowserUseAgent/docker_image_build/build.yaml @@ -0,0 +1,15 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +services: + browser-use-agent: + build: + args: + IMAGE_REPO: ${REGISTRY} + BASE_TAG: ${TAG} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + no_proxy: ${no_proxy} + context: ../ + dockerfile: ./Dockerfile + image: ${REGISTRY:-opea}/browser-use-agent:${TAG:-latest} diff --git a/BrowserUseAgent/requirements.txt b/BrowserUseAgent/requirements.txt new file mode 100644 index 0000000000..08afe30806 --- /dev/null +++ b/BrowserUseAgent/requirements.txt @@ -0,0 +1 @@ +browser-use==0.3.2 diff --git a/BrowserUseAgent/tests/README.md b/BrowserUseAgent/tests/README.md new file mode 100644 index 0000000000..e69de29bb2 diff --git a/BrowserUseAgent/tests/test_compose_on_gaudi.sh b/BrowserUseAgent/tests/test_compose_on_gaudi.sh new file mode 100644 index 0000000000..63f234345a --- /dev/null +++ b/BrowserUseAgent/tests/test_compose_on_gaudi.sh @@ -0,0 +1,149 @@ +#!/bin/bash +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +set -xe +IMAGE_REPO=${IMAGE_REPO:-"opea"} +IMAGE_TAG=${IMAGE_TAG:-"latest"} +echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" +echo "TAG=IMAGE_TAG=${IMAGE_TAG}" +export REGISTRY=${IMAGE_REPO} +export TAG=${IMAGE_TAG} +export MODEL_CACHE=${model_cache:-"./data"} +export HF_TOKEN=${HF_TOKEN} +export LLM_ENDPOINT_PORT=8008 +export LLM_ENDPOINT="http://0.0.0.0:${LLM_ENDPOINT_PORT}" +export BROWSER_USE_AGENT_PORT=8022 +export LLM_MODEL_ID="Qwen/Qwen2.5-VL-32B-Instruct" +export MAX_TOTAL_TOKENS=131072 +export NUM_CARDS=4 + +WORKPATH=$(dirname "$PWD") +LOG_PATH="$WORKPATH/tests" +ip_address=$(hostname -I | awk '{print $1}') + +function build_docker_images() { + opea_branch=${opea_branch:-"main"} + cd $WORKPATH/docker_image_build + git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git + pushd GenAIComps + echo "GenAIComps test commit is $(git rev-parse HEAD)" + docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . + popd && sleep 1s + + echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
+ docker compose -f build.yaml build --no-cache --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy > ${LOG_PATH}/docker_image_build.log + + docker images && sleep 1s +} + +function start_services() { + cd $WORKPATH/docker_compose/intel/hpu/gaudi + source set_env.sh + + # Start Docker Containers + docker compose -f compose.yaml up -d --quiet-pull > ${LOG_PATH}/start_services_with_compose.log + n=0 + until [[ "$n" -ge 200 ]]; do + echo "n=$n" + docker logs vllm-gaudi-server > vllm_service_start.log 2>&1 + if grep -q "Application startup complete" vllm_service_start.log; then + break + fi + sleep 5s + n=$((n+1)) + done +} + +function validate_service() { + local URL="$1" + local EXPECTED_RESULT="$2" + local SERVICE_NAME="$3" + local DOCKER_NAME="$4" + local INPUT_DATA="$5" + + local HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") + if [ "$HTTP_STATUS" -eq 200 ]; then + echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." + + local CONTENT=$(curl -s -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL" | tee ${LOG_PATH}/${SERVICE_NAME}.log) + + if echo "$CONTENT" | grep -q "$EXPECTED_RESULT"; then + echo "[ $SERVICE_NAME ] Content is as expected." + else + echo "[ $SERVICE_NAME ] Content does not match the expected result: $CONTENT" + docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log + exit 1 + fi + else + echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS" + docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log + exit 1 + fi + sleep 1s +} + +function validate_microservices() { + # vllm for llm service + validate_service \ + "${ip_address}:${LLM_ENDPOINT_PORT}/v1/chat/completions" \ + "content" \ + "vllm-llm" \ + "vllm-gaudi-server" \ + '{"model": "'${LLM_MODEL_ID}'", "messages": [{"role": "user", "content": "What is Deep Learning?"}], "max_tokens":17}' +} + +function validate_megaservice() { + # start web server for testing + cd $WORKPATH/tests/webarena + bash shopping_admin.sh start + + # Curl the Mega Service + validate_service \ + "${ip_address}:${BROWSER_USE_AGENT_PORT}/v1/browser_use_agent" \ + "\"is_success\":true" \ + "browser-use-agent" \ + "browser-use-agent-server" \ + '{"task_prompt": "Navigate to http://'${ip_address}':8084/admin and login with the credentials: username: admin, password: admin1234. 
Then, find out What are the top-3 best-selling product in 2022?"}' +} + +function stop_docker() { + cd $WORKPATH/docker_compose/intel/hpu/gaudi + docker compose -f compose.yaml down + + cd $WORKPATH/tests/webarena + bash shopping_admin.sh stop +} + +function main() { + + echo "::group::stop_docker" + stop_docker + echo "::endgroup::" + + echo "::group::build_docker_images" + if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi + echo "::endgroup::" + + echo "::group::start_services" + start_services + sleep 30 + echo "::endgroup::" + + echo "::group::validate_microservices" + validate_microservices + echo "::endgroup::" + + echo "::group::validate_megaservice" + validate_megaservice + echo "::endgroup::" + + echo "::group::stop_docker" + stop_docker + echo "::endgroup::" + + docker system prune -f + +} + +main diff --git a/BrowserUseAgent/tests/webarena/README.md b/BrowserUseAgent/tests/webarena/README.md new file mode 100644 index 0000000000..12be9ebade --- /dev/null +++ b/BrowserUseAgent/tests/webarena/README.md @@ -0,0 +1,23 @@ +# Setup Scripts for Webarena + +We will launch a shopping admin website, part of [WebArena](https://github.com/web-arena-x/webarena), to serve as a web server for agent evaluation. The deployment process will follow the instructions in the [webarena-setup](https://github.com/gasse/webarena-setup) repository. + +## Download Docker Image + +1. Download shopping_admin_final_0719.tar from the [official webarena repo](https://github.com/web-arena-x/webarena/tree/main/environment_docker). + +2. Place the archive file, shopping_admin_final_0719.tar, into the directory specified by the `ARCHIVES_LOCATION` parameter within `tests/webarena/set_env.sh` + +## Launch the Web Site + +Please ensure Docker services work in your environment, and perform the following command to launch the web site: + +```bash +bash shopping_admin.sh start +``` + +## Stop the Web Site + +```bash +bash shopping_admin.sh stop +``` diff --git a/BrowserUseAgent/tests/webarena/set_env.sh b/BrowserUseAgent/tests/webarena/set_env.sh new file mode 100644 index 0000000000..0acd826453 --- /dev/null +++ b/BrowserUseAgent/tests/webarena/set_env.sh @@ -0,0 +1,11 @@ +#!/bin/bash +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +WORKING_DIR="$(pwd)" +PUBLIC_HOSTNAME="$(hostname -I | awk '{print $1}')" +SHOPPING_ADMIN_USER="admin" +SHOPPING_ADMIN_PASSWORD="admin1234" +SHOPPING_ADMIN_PORT=8084 +SHOPPING_ADMIN_URL="http://${PUBLIC_HOSTNAME}:${SHOPPING_ADMIN_PORT}/admin" +ARCHIVES_LOCATION="/data2/hf_model" diff --git a/BrowserUseAgent/tests/webarena/shopping_admin.sh b/BrowserUseAgent/tests/webarena/shopping_admin.sh new file mode 100644 index 0000000000..e3a5a998be --- /dev/null +++ b/BrowserUseAgent/tests/webarena/shopping_admin.sh @@ -0,0 +1,83 @@ +#!/bin/bash +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +# Reference: https://github.com/gasse/webarena-setup + +# stop if any error occur +set -e + +BASE_DIR=`dirname "${BASH_SOURCE[0]}"` +source ${BASE_DIR}/set_env.sh + +assert() { + if ! "$@"; then + echo "Assertion failed: $*" >&2 + exit 1 + fi +} + +load_docker_image() { + local IMAGE_NAME="$1" + local INPUT_FILE="$2" + + if ! docker images --format "{{.Repository}}:{{.Tag}}" | grep -q "^${IMAGE_NAME}:"; then + echo "Loading Docker image ${IMAGE_NAME} from ${INPUT_FILE}" + docker load --input "${INPUT_FILE}" + else + echo "Docker image ${IMAGE_NAME} is already loaded." 
+ fi +} + +start() { + # Verify that the docker image archive file exists + assert [ -f ${ARCHIVES_LOCATION}/shopping_admin_final_0719.tar ] + + # Load image + load_docker_image "shopping_admin_final_0719" ${ARCHIVES_LOCATION}/shopping_admin_final_0719.tar + + # Create and run the container + docker create --name shopping_admin_server -p ${SHOPPING_ADMIN_PORT}:80 shopping_admin_final_0719 + + # Start the container + docker start shopping_admin_server + echo -n -e "Waiting 60 seconds for all services to start..." + sleep 60 + echo -n -e " done\n" + + echo -n -e "Configuring Magento settings inside the container..." + docker exec shopping_admin_server php /var/www/magento2/bin/magento config:set admin/security/password_is_forced 0 + docker exec shopping_admin_server php /var/www/magento2/bin/magento config:set admin/security/password_lifetime 0 + docker exec shopping_admin_server /var/www/magento2/bin/magento setup:store-config:set --base-url="http://${PUBLIC_HOSTNAME}:${SHOPPING_ADMIN_PORT}" + docker exec shopping_admin_server mysql -u magentouser -pMyPassword magentodb -e "UPDATE core_config_data SET value='http://$PUBLIC_HOSTNAME:$SHOPPING_ADMIN_PORT/' WHERE path = 'web/secure/base_url';" + docker exec shopping_admin_server /var/www/magento2/bin/magento cache:flush + echo -n -e " done\n" +} + +stop() { + docker stop shopping_admin_server || true + docker rm shopping_admin_server || true +} + +case "$1" in + start) + echo "Starting shopping_admin server..." + start + echo "shopping_admin server started." + ;; + stop) + echo "Stopping shopping_admin server..." + stop + echo "shopping_admin server stopped." + ;; + restart) + echo "Restarting shopping_admin server..." + stop + sleep 2 + start + echo "shopping_admin server restarted." + ;; + *) + echo "Usage: $0 {start|stop|restart}" + exit 1 + ;; +esac diff --git a/ChatQnA/chatqna.py b/ChatQnA/chatqna.py index 2e462b0f6e..ac67f4a16c 100644 --- a/ChatQnA/chatqna.py +++ b/ChatQnA/chatqna.py @@ -3,10 +3,11 @@ import argparse import json +import logging import os import re -from comps import MegaServiceEndpoint, MicroService, ServiceOrchestrator, ServiceRoleType, ServiceType +from comps import CustomLogger, MegaServiceEndpoint, MicroService, ServiceOrchestrator, ServiceRoleType, ServiceType from comps.cores.mega.utils import handle_message from comps.cores.proto.api_protocol import ( ChatCompletionRequest, @@ -20,6 +21,10 @@ from fastapi.responses import StreamingResponse from langchain_core.prompts import PromptTemplate +logger = CustomLogger(__name__) +log_level = logging.DEBUG if os.getenv("LOGFLAG", "").lower() == "true" else logging.INFO +logging.basicConfig(level=log_level, format="%(asctime)s - %(name)s - %(levelname)s - %(message)s") + class ChatTemplate: @staticmethod @@ -62,6 +67,10 @@ def generate_rag_prompt(question, documents): def align_inputs(self, inputs, cur_node, runtime_graph, llm_parameters_dict, **kwargs): + logger.debug( + f"Aligning inputs for service: {self.services[cur_node].name}, type: {self.services[cur_node].service_type}" + ) + if self.services[cur_node].service_type == ServiceType.EMBEDDING: inputs["inputs"] = inputs["text"] del inputs["text"] @@ -83,6 +92,9 @@ def align_inputs(self, inputs, cur_node, runtime_graph, llm_parameters_dict, **k # next_inputs["repetition_penalty"] = inputs["repetition_penalty"] next_inputs["temperature"] = inputs["temperature"] inputs = next_inputs + + # Log the aligned inputs (be careful with sensitive data) + logger.debug(f"Aligned inputs for {self.services[cur_node].name}: 
{type(inputs)}") return inputs @@ -123,7 +135,9 @@ def align_outputs(self, data, cur_node, inputs, runtime_graph, llm_parameters_di elif input_variables == ["question"]: prompt = prompt_template.format(question=data["initial_query"]) else: - print(f"{prompt_template} not used, we only support 2 input variables ['question', 'context']") + logger.warning( + f"{prompt_template} not used, we only support 2 input variables ['question', 'context']" + ) prompt = ChatTemplate.generate_rag_prompt(data["initial_query"], docs) else: prompt = ChatTemplate.generate_rag_prompt(data["initial_query"], docs) @@ -152,7 +166,7 @@ def align_outputs(self, data, cur_node, inputs, runtime_graph, llm_parameters_di elif input_variables == ["question"]: prompt = prompt_template.format(question=prompt) else: - print(f"{prompt_template} not used, we only support 2 input variables ['question', 'context']") + logger.warning(f"{prompt_template} not used, we only support 2 input variables ['question', 'context']") prompt = ChatTemplate.generate_rag_prompt(prompt, reranked_docs) else: prompt = ChatTemplate.generate_rag_prompt(prompt, reranked_docs) @@ -171,27 +185,65 @@ def align_outputs(self, data, cur_node, inputs, runtime_graph, llm_parameters_di def align_generator(self, gen, **kwargs): - # OpenAI response format - # b'data:{"id":"","object":"text_completion","created":1725530204,"model":"meta-llama/Meta-Llama-3-8B-Instruct","system_fingerprint":"2.0.1-native","choices":[{"index":0,"delta":{"role":"assistant","content":"?"},"logprobs":null,"finish_reason":null}]}\n\n' + """Aligns the generator output to match ChatQnA's format of sending bytes. + + Handles different LLM output formats (TGI, OpenAI) and properly filters + empty or null content chunks to avoid UI display issues. + """ + # OpenAI response format example: + # b'data:{"id":"","object":"text_completion","created":1725530204,"model":"meta-llama/Meta-Llama-3-8B-Instruct", + # "system_fingerprint":"2.0.1-native","choices":[{"index":0,"delta":{"role":"assistant","content":"?"}, + # "logprobs":null,"finish_reason":null}]}\n\n' + for line in gen: - line = line.decode("utf-8") - chunks = [chunk.strip() for chunk in line.split("\n\n") if chunk.strip()] - for line in chunks: + try: + line = line.decode("utf-8") start = line.find("{") end = line.rfind("}") + 1 + + # Skip lines with invalid JSON structure + if start == -1 or end <= start: + logger.debug("Skipping line with invalid JSON structure") + continue + json_str = line[start:end] - try: - # sometimes yield empty chunk, do a fallback here - json_data = json.loads(json_str) - if "ops" in json_data and "op" in json_data["ops"][0]: - if "value" in json_data["ops"][0] and isinstance(json_data["ops"][0]["value"], str): - yield f"data: {repr(json_data['ops'][0]['value'].encode('utf-8'))}\n\n" - else: - pass - elif "content" in json_data["choices"][0]["delta"]: - yield f"data: {repr(json_data['choices'][0]['delta']['content'].encode('utf-8'))}\n\n" - except Exception as e: - yield f"data: {repr(json_str.encode('utf-8'))}\n\n" + + # Parse the JSON data + json_data = json.loads(json_str) + + # Handle TGI format responses + if "ops" in json_data and "op" in json_data["ops"][0]: + if "value" in json_data["ops"][0] and isinstance(json_data["ops"][0]["value"], str): + yield f"data: {repr(json_data['ops'][0]['value'].encode('utf-8'))}\n\n" + # Empty value chunks are silently skipped + + # Handle OpenAI format responses + elif "choices" in json_data and len(json_data["choices"]) > 0: + # Only yield content if it exists and is 
not null + if ( + "delta" in json_data["choices"][0] + and "content" in json_data["choices"][0]["delta"] + and json_data["choices"][0]["delta"]["content"] is not None + ): + content = json_data["choices"][0]["delta"]["content"] + yield f"data: {repr(content.encode('utf-8'))}\n\n" + # Null content chunks are silently skipped + elif ( + "delta" in json_data["choices"][0] + and "content" in json_data["choices"][0]["delta"] + and json_data["choices"][0]["delta"]["content"] is None + ): + logger.debug("Skipping null content chunk") + + except json.JSONDecodeError as e: + # Log the error with the problematic JSON string for better debugging + logger.error(f"JSON parsing error in align_generator: {e}\nProblematic JSON: {json_str[:200]}") + # Skip sending invalid JSON to avoid UI issues + continue + except Exception as e: + logger.error(f"Unexpected error in align_generator: {e}, line snippet: {line[:100]}...") + # Skip sending to avoid UI issues + continue yield "data: [DONE]\n\n" diff --git a/ChatQnA/docker_compose/amd/cpu/epyc/compose.yaml b/ChatQnA/docker_compose/amd/cpu/epyc/compose.yaml index ee5e810900..9b44783b5b 100644 --- a/ChatQnA/docker_compose/amd/cpu/epyc/compose.yaml +++ b/ChatQnA/docker_compose/amd/cpu/epyc/compose.yaml @@ -90,7 +90,7 @@ services: HF_HUB_ENABLE_HF_TRANSFER: 0 command: --model-id ${RERANK_MODEL_ID} --auto-truncate vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-service ports: - "9009:80" diff --git a/ChatQnA/docker_compose/amd/cpu/epyc/compose_faqgen.yaml b/ChatQnA/docker_compose/amd/cpu/epyc/compose_faqgen.yaml index 13888c3e81..61580e1865 100644 --- a/ChatQnA/docker_compose/amd/cpu/epyc/compose_faqgen.yaml +++ b/ChatQnA/docker_compose/amd/cpu/epyc/compose_faqgen.yaml @@ -83,7 +83,7 @@ services: HF_HUB_ENABLE_HF_TRANSFER: 0 command: --model-id ${RERANK_MODEL_ID} --auto-truncate vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-server ports: - ${LLM_ENDPOINT_PORT:-9009}:80 diff --git a/ChatQnA/docker_compose/amd/cpu/epyc/compose_milvus.yaml b/ChatQnA/docker_compose/amd/cpu/epyc/compose_milvus.yaml index ef1b271d76..7936c11135 100644 --- a/ChatQnA/docker_compose/amd/cpu/epyc/compose_milvus.yaml +++ b/ChatQnA/docker_compose/amd/cpu/epyc/compose_milvus.yaml @@ -147,7 +147,7 @@ services: command: --model-id ${RERANK_MODEL_ID} --auto-truncate vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-service ports: - "9009:80" diff --git a/ChatQnA/docker_compose/amd/cpu/epyc/compose_pinecone.yaml b/ChatQnA/docker_compose/amd/cpu/epyc/compose_pinecone.yaml index 2681a92642..514a8803f6 100644 --- a/ChatQnA/docker_compose/amd/cpu/epyc/compose_pinecone.yaml +++ b/ChatQnA/docker_compose/amd/cpu/epyc/compose_pinecone.yaml @@ -77,7 +77,7 @@ services: HF_HUB_ENABLE_HF_TRANSFER: 0 command: --model-id ${RERANK_MODEL_ID} --auto-truncate vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-service ports: - "9009:80" diff --git a/ChatQnA/docker_compose/amd/cpu/epyc/compose_qdrant.yaml b/ChatQnA/docker_compose/amd/cpu/epyc/compose_qdrant.yaml index 821bc02450..2850318d50 100644 --- a/ChatQnA/docker_compose/amd/cpu/epyc/compose_qdrant.yaml +++ b/ChatQnA/docker_compose/amd/cpu/epyc/compose_qdrant.yaml @@ -83,7 +83,7 @@ 
services: HF_HUB_ENABLE_HF_TRANSFER: 0 command: --model-id ${RERANK_MODEL_ID} --auto-truncate vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-service ports: - "6042:80" diff --git a/ChatQnA/docker_compose/amd/cpu/epyc/compose_without_rerank.yaml b/ChatQnA/docker_compose/amd/cpu/epyc/compose_without_rerank.yaml index 1b701c0279..296546e986 100644 --- a/ChatQnA/docker_compose/amd/cpu/epyc/compose_without_rerank.yaml +++ b/ChatQnA/docker_compose/amd/cpu/epyc/compose_without_rerank.yaml @@ -67,7 +67,7 @@ services: RETRIEVER_COMPONENT_NAME: "OPEA_RETRIEVER_REDIS" restart: unless-stopped vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-service ports: - "9009:80" diff --git a/ChatQnA/docker_compose/intel/cpu/xeon/README.md b/ChatQnA/docker_compose/intel/cpu/xeon/README.md index 08b61642db..899ee51db2 100644 --- a/ChatQnA/docker_compose/intel/cpu/xeon/README.md +++ b/ChatQnA/docker_compose/intel/cpu/xeon/README.md @@ -190,7 +190,7 @@ docker compose -f compose_remote.yaml up -d ## ChatQnA with Conversational UI (Optional) -To access the Conversational UI (react based) frontend, modify the UI service in the `compose` file used to deploy. Replace `chaqna-xeon-ui-server` service with the `chatqna-xeon-conversation-ui-server` service as per the config below: +To access the Conversational UI (react based) frontend, modify the UI service in the `compose` file used to deploy. Replace `chatqna-xeon-ui-server` service with the `chatqna-xeon-conversation-ui-server` service as per the config below: ```yaml chatqna-xeon-conversation-ui-server: @@ -202,7 +202,7 @@ chatqna-xeon-conversation-ui-server: ports: - "5174:80" depends_on: - - chaqna-xeon-backend-server + - chatqna-xeon-backend-server ipc: host restart: always ``` @@ -210,7 +210,7 @@ chatqna-xeon-conversation-ui-server: Once the services are up, open the following URL in the browser: http://{host_ip}:5174. By default, the UI runs on port 80 internally. If the developer prefers to use a different host port to access the frontend, it can be modified by port mapping in the `compose.yaml` file as shown below: ```yaml - chaqna-gaudi-conversation-ui-server: + chatqna-gaudi-conversation-ui-server: image: opea/chatqna-conversation-ui:latest ... ports: diff --git a/ChatQnA/docker_compose/intel/cpu/xeon/README_endpoint_openai.md b/ChatQnA/docker_compose/intel/cpu/xeon/README_endpoint_openai.md new file mode 100644 index 0000000000..f9e84d07ec --- /dev/null +++ b/ChatQnA/docker_compose/intel/cpu/xeon/README_endpoint_openai.md @@ -0,0 +1,453 @@ +# Build Mega Service of ChatQnA on Xeon with an LLM Endpoint + +This document outlines the single node deployment process for a ChatQnA application utilizing the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservices on Intel Xeon server. The steps include pulling Docker images, container deployment via Docker Compose, and service execution to integrate microservices such as `embedding`, `retriever`, `rerank` and `llm`. + +## Table of contents + +1. [ChatQnA Quick Start Deployment](#chatqna-quick-start-Deployment) +2. [ChatQnA Docker Compose file Options](#chatqna-docker-compose-files) +3. [ChatQnA with Conversational UI](#chatqna-with-conversational-ui-optional) + +## ChatQnA Quick Start Deployment + +This section describes how to quickly deploy and test the ChatQnA service manually on an Intel® Xeon® processor. 
The basic steps are:
+
+1. [Access the Code](#access-the-code)
+2. [Generate a HuggingFace Access Token](#generate-a-huggingface-access-token)
+3. [Configure the Deployment Environment](#configure-the-deployment-environment)
+4. [Deploy the Services Using Docker Compose](#deploy-the-services-using-docker-compose)
+5. [Check the Deployment Status](#check-the-deployment-status)
+6. [Test the Pipeline](#test-the-pipeline)
+7. [Cleanup the Deployment](#cleanup-the-deployment)
+
+### Access the Code
+
+First clone the GenAIComps repository and build the `opea/llm-textgen` image, then clone the GenAIExamples repository and change into the ChatQnA Intel® Xeon® platform Docker Compose directory:
+
+```bash
+git clone https://github.com/opea-project/GenAIComps
+cd GenAIComps
+
+# Build the opea/llm-textgen image.
+
+docker build \
+  --no-cache \
+  --build-arg https_proxy=$https_proxy \
+  --build-arg http_proxy=$http_proxy \
+  -t opea/llm-textgen:latest \
+  -f comps/llms/src/text-generation/Dockerfile .
+
+cd ../
+git clone https://github.com/opea-project/GenAIExamples.git
+cd GenAIExamples/ChatQnA/docker_compose/intel/cpu/xeon/
+```
+
+### Generate a HuggingFace Access Token
+
+Some HuggingFace resources, such as certain models, are only accessible with an access token. If the developer does not have one, they can create a [HuggingFace](https://huggingface.co/) account and then generate a [user access token](https://huggingface.co/docs/transformers.js/en/guides/private#step-1-generating-a-user-access-token).
+
+### Endpoint Access
+
+An OpenAI-compatible endpoint is required, e.g., OpenRouter.ai. Obtain a valid API key for it.
+
+### Configure the Deployment Environment
+
+To set up environment variables for deploying ChatQnA services, source the _set_env.sh_ script in this directory and then override the parameters specific to the endpoint-based deployment:
+
+```bash
+cd GenAIExamples/ChatQnA/docker_compose/intel/cpu/xeon
+source set_env.sh # source environment variables, then override below.
+
+export host_ip="External_Public_IP" # e.g. export host_ip=$(hostname -I | awk '{print $1}')
+export HF_TOKEN="Your_Huggingface_API_Token"
+export OPENAI_API_KEY="key for the OpenAI-like endpoint"
+
+export LLM_MODEL_ID="" # e.g. "google/gemma-3-1b-it:free"
+export LLM_ENDPOINT="" # e.g. "https://openrouter.ai/api" (please make sure to omit the /v1 suffix)
+export no_proxy="" # Set if any no_proxy entries are needed. See set_env.sh
+```
+
+Consult the section on [ChatQnA Docker Compose Files](#chatqna-docker-compose-files) for information on how service-specific configuration parameters affect deployments.
+
+### Deploy the Services Using Docker Compose
+
+To deploy the ChatQnA services, execute the `docker compose up` command with the appropriate arguments. For this endpoint-based deployment, execute the command below. It uses the `compose_endpoint_openai.yaml` file.
+
+```bash
+NGINX_PORT=8080 docker compose -f compose_endpoint_openai.yaml up -d
+```
+
+Setting `NGINX_PORT=8080` exposes the chat console on `localhost:8080`, which is useful when port 80 is already in use on the host.
+
+To enable OpenTelemetry tracing, merge the `compose.telemetry.yaml` file with the compose file used above. CPU example with the OpenTelemetry feature:
+
+> NOTE: To get the supported Grafana dashboards, run `download_opea_dashboard.sh` as shown in the commands below.
+ +```bash +./grafana/dashboards/download_opea_dashboard.sh +NGINX_PORT=8080 docker compose -f compose_endpoint_openai.yaml -f compose.telemetry.yaml up -d +``` + +**Note**: developers should build docker image from source when: + +- Developing off the git main branch (as the container's ports in the repo may be different from the published docker image). +- Unable to download the docker image. +- Use a specific version of Docker image. + +Please refer to the table below to build different microservices from source: + +| Microservice | Deployment Guide | +| ------------ | --------------------------------------------------------------------------------------------- | +| Dataprep | https://github.com/opea-project/GenAIComps/tree/main/comps/dataprep | +| Embedding | https://github.com/opea-project/GenAIComps/tree/main/comps/embeddings | +| Retriever | https://github.com/opea-project/GenAIComps/tree/main/comps/retrievers | +| Reranker | https://github.com/opea-project/GenAIComps/tree/main/comps/rerankings | +| LLM | https://github.com/opea-project/GenAIComps/tree/main/comps/llms | +| Megaservice | [Megaservice build guide](../../../../README_miscellaneous.md#build-megaservice-docker-image) | +| UI | [Basic UI build guide](../../../../README_miscellaneous.md#build-ui-docker-image) | + +### Check the Deployment Status + +After running docker compose, check if all the containers launched via docker compose have started: + +``` +docker ps -a +``` + +For the endpoint-based deployment, the following 9 containers should be running: + +```bash +CONTAINER ID IMAGE COMMAND CREATED STATUS PORTS NAMES +04f0e3607457 opea/nginx:${RELEASE_VERSION} "/docker-entrypoint.…" 17 minutes ago Up 16 minutes 0.0.0.0:8080->80/tcp, [::]:8080->80/tcp chatqna-xeon-nginx-server +6d7fe1bfd0a5 opea/chatqna-ui:${RELEASE_VERSION} "docker-entrypoint.s…" 17 minutes ago Up 16 minutes 0.0.0.0:5173->5173/tcp, :::5173->5173/tcp chatqna-xeon-ui-server +71d01fe8bc94 opea/chatqna:${RELEASE_VERSION} "python chatqna.py" 17 minutes ago Up 16 minutes 0.0.0.0:8888->8888/tcp, :::8888->8888/tcp chatqna-xeon-backend-server +ea12fab1c70e opea/retriever:${RELEASE_VERSION} "python opea_retriev…" 17 minutes ago Up 17 minutes 0.0.0.0:7000->7000/tcp, :::7000->7000/tcp retriever-redis-server +253622403ed6 opea/dataprep:${RELEASE_VERSION} "sh -c 'python $( [ …" 17 minutes ago Up 17 minutes (healthy) 0.0.0.0:6007->5000/tcp, [::]:6007->5000/tcp dataprep-redis-server +a552cf4f0dd0 redis/redis-stack:7.2.0-v9 "/entrypoint.sh" 17 minutes ago Up 17 minutes (healthy) 0.0.0.0:6379->6379/tcp, :::6379->6379/tcp, 0.0.0.0:8001->8001/tcp, :::8001->8001/tcp redis-vector-db +6795a52137f7 ghcr.io/huggingface/text-embeddings-inference:cpu-1.5 "text-embeddings-rou…" 17 minutes ago Up 17 minutes 0.0.0.0:6006->80/tcp, [::]:6006->80/tcp tei-embedding-server +3e55313e714b opea/llm-textgen:${RELEASE_VERSION} "bash entrypoint.sh" 17 minutes ago Up 17 minutes 0.0.0.0:9000->9000/tcp, :::9000->9000/tcp textgen-service-endpoint-openai +10318f82c943 ghcr.io/huggingface/text-embeddings-inference:cpu-1.5 "text-embeddings-rou…" 17 minutes ago Up 17 minutes 0.0.0.0:8808->80/tcp, [::]:8808->80/tcp tei-reranking-server +``` + +If any issues are encountered during deployment, refer to the [troubleshooting](../../../../README_miscellaneous.md##troubleshooting) section. + +### Test the Pipeline + +Once the ChatQnA services are running, test the pipeline using the following command. This will send a sample query to the ChatQnA service and return a response. 
+ +```bash +curl http://${host_ip}:8888/v1/chatqna \ + -H "Content-Type: application/json" \ + -d '{ + "messages": "What is the revenue of Nike in 2023?" + }' +``` + +**Note** : Access the ChatQnA UI by web browser through this URL: `http://${host_ip}:8080`. Please confirm the `8080` port is opened in the firewall. To validate each microservice used in the pipeline refer to the [Validate microservices](#validate-microservices) section. + +### Cleanup the Deployment + +To stop the containers associated with the deployment, execute the following command: + +``` +docker compose -f compose.yaml down +``` + +## ChatQnA Docker Compose Files + +In the context of deploying a ChatQnA pipeline on an Intel® Xeon® platform, we can pick and choose different vector databases, large language model serving frameworks, and remove pieces of the pipeline such as the reranker. The table below outlines the various configurations that are available as part of the application. These configurations can be used as templates and can be extended to different components available in [GenAIComps](https://github.com/opea-project/GenAIComps.git). + +| File | Description | +| -------------------------------------------------------------- | --------------------------------------------------------------------------------------------------------------------------------------------------------------------- | +| [compose.yaml](./compose.yaml) | Default compose file using vllm as serving framework and redis as vector database | +| [compose_endpoint_openai.yaml](./compose_endpoint_openai.yaml) | Uses OpenAI-compatible endpoint (remote or local) as LLM serving framework with redis as vector database. | +| [compose_milvus.yaml](./compose_milvus.yaml) | Uses Milvus as the vector database. All other configurations remain the same as the default | +| [compose_pinecone.yaml](./compose_pinecone.yaml) | Uses Pinecone as the vector database. All other configurations remain the same as the default. For more details, refer to [README_pinecone.md](./README_pinecone.md). | +| [compose_qdrant.yaml](./compose_qdrant.yaml) | Uses Qdrant as the vector database. All other configurations remain the same as the default. For more details, refer to [README_qdrant.md](./README_qdrant.md). | +| [compose_tgi.yaml](./compose_tgi.yaml) | Uses TGI as the LLM serving framework. All other configurations remain the same as the default | +| [compose_without_rerank.yaml](./compose_without_rerank.yaml) | Default configuration without the reranker | +| [compose_faqgen.yaml](./compose_faqgen.yaml) | Enables FAQ generation using vLLM as the LLM serving framework. For more details, refer to [README_faqgen.md](./README_faqgen.md). | +| [compose_faqgen_tgi.yaml](./compose_faqgen_tgi.yaml) | Enables FAQ generation using TGI as the LLM serving framework. For more details, refer to [README_faqgen.md](./README_faqgen.md). | +| [compose.telemetry.yaml](./compose.telemetry.yaml) | Helper file for telemetry features for vllm. Can be used along with any compose files that serves vllm | +| [compose_tgi.telemetry.yaml](./compose_tgi.telemetry.yaml) | Helper file for telemetry features for tgi. Can be used along with any compose files that serves tgi | +| [compose_mariadb.yaml](./compose_mariadb.yaml) | Uses MariaDB Server as the vector database. All other configurations remain the same as the default | + +## ChatQnA with Conversational UI (Optional) + +To access the Conversational UI (react based) frontend, modify the UI service in the `compose` file used to deploy. 
Replace `chatqna-xeon-ui-server` service with the `chatqna-xeon-conversation-ui-server` service as per the config below: + +```yaml +chatqna-xeon-conversation-ui-server: + image: opea/chatqna-conversation-ui:latest + container_name: chatqna-xeon-conversation-ui-server + environment: + - APP_BACKEND_SERVICE_ENDPOINT=${BACKEND_SERVICE_ENDPOINT} + - APP_DATA_PREP_SERVICE_URL=${DATAPREP_SERVICE_ENDPOINT} + ports: + - "5174:80" + depends_on: + - chatqna-xeon-backend-server + ipc: host + restart: always +``` + +Once the services are up, open the following URL in the browser: http://{host_ip}:5174. By default, the UI runs on port 80 internally. If the developer prefers to use a different host port to access the frontend, it can be modified by port mapping in the `compose.yaml` file as shown below: + +```yaml + chatqna-xeon-conversation-ui-server: + image: opea/chatqna-conversation-ui:latest + ... + ports: + - "80:80" +``` + +Here is an example of running ChatQnA (default UI): + +![project-screenshot](../../../../assets/img/chat_ui_response.png) + +Here is an example of running ChatQnA with Conversational UI (React): + +![project-screenshot](../../../../assets/img/conversation_ui_response.png) + +### Validate Microservices + +Note, when verifying the microservices by curl or API from remote client, please make sure the **ports** of the microservices are opened in the firewall of the cloud node. +Follow the instructions to validate MicroServices. +For details on how to verify the correctness of the response, refer to [how-to-validate_service](../../hpu/gaudi/how_to_validate_service.md). + +1. **TEI Embedding Service** + Send a test request to the TEI Embedding Service to ensure it is running correctly: + + ```bash + curl http://${host_ip}:6006/embed \ + -X POST \ + -d '{"inputs":"What is Deep Learning?"}' \ + -H 'Content-Type: application/json' + ``` + + If you receive a connection error, ensure that the service is running and the port 6006 is open in the firewall. + +2. **Retriever Microservice** + + To consume the retriever microservice, you need to generate a mock embedding vector by Python script. The length of embedding vector + is determined by the embedding model. + Here we use the model `EMBEDDING_MODEL_ID="BAAI/bge-base-en-v1.5"`, which vector size is 768. + + Check the vector dimension of your embedding model, set `your_embedding` dimension equal to it. + + ```bash + export your_embedding=$(python3 -c "import random; embedding = [random.uniform(-1, 1) for _ in range(768)]; print(embedding)") + curl http://${host_ip}:7000/v1/retrieval \ + -X POST \ + -d "{\"text\":\"test\",\"embedding\":${your_embedding}}" \ + -H 'Content-Type: application/json' + ``` + + If the response indicates an invalid embedding vector, verify that the vector size matches the model's expected dimension. + +3. **TEI Reranking Service** + + To test the TEI Reranking Service, use the following `curl` command: + + > Skip for ChatQnA without Rerank pipeline + + ```bash + curl http://${host_ip}:8808/rerank \ + -X POST \ + -d '{"query":"What is Deep Learning?", "texts": ["Deep Learning is not...", "Deep learning is..."]}' \ + -H 'Content-Type: application/json' + ``` + +4. **LLM Backend Service** + + In the first startup, this service will take more time to download, load and warm up the model. After it's finished, the service will be ready. + + Try the command below to check whether the LLM serving is ready. 
+
+   ```bash
+   docker logs textgen-service-endpoint-openai 2>&1 | grep complete
+   # If the service is ready, you will get a response like below.
+   INFO:     Application startup complete.
+   ```
+
+   Then try the `cURL` commands below to validate the services.
+
+You may also test the underlying LLM endpoint directly. For example, with OpenRouter.ai:
+
+```bash
+# The "'"..."'" quoting closes the single-quoted JSON so ${LLM_MODEL_ID} expands.
+curl https://openrouter.ai/api/v1/chat/completions \
+  -H "Content-Type: application/json" \
+  -H "Authorization: Bearer $OPENAI_API_KEY" \
+  -d '{
+  "model": "'"${LLM_MODEL_ID}"'",
+  "messages": [
+    {
+      "role": "user",
+      "content": "What is the meaning of life?"
+    }
+  ]
+}'
+```
+
+To test the OPEA service that is built on top of it:
+
+```bash
+curl http://${host_ip}:9000/v1/chat/completions \
+  -X POST \
+  -d '{"model": "'"${LLM_MODEL_ID}"'", "messages": [{"role": "user", "content": "What is Deep Learning?"}], "max_tokens":17}' \
+  -H 'Content-Type: application/json'
+```
+
+5. **MegaService**
+
+   Use the following `curl` command to test the MegaService:
+
+   ```bash
+   curl http://${host_ip}:8888/v1/chatqna -H "Content-Type: application/json" -d '{
+        "messages": "What is the revenue of Nike in 2023?"
+        }'
+   ```
+
+6. **Nginx Service**
+
+   Use the following curl command to test the Nginx Service:
+
+   ```bash
+   curl http://${host_ip}:${NGINX_PORT}/v1/chatqna \
+       -H "Content-Type: application/json" \
+       -d '{"messages": "What is the revenue of Nike in 2023?"}'
+   ```
+
+7. **Dataprep Microservice (Optional)**
+
+   If you want to update the default knowledge base, you can use the following commands:
+
+   Update the knowledge base via the local file [nke-10k-2023.pdf](https://github.com/opea-project/GenAIComps/blob/v1.1/comps/retrievers/redis/data/nke-10k-2023.pdf). Either click [here](https://raw.githubusercontent.com/opea-project/GenAIComps/v1.1/comps/retrievers/redis/data/nke-10k-2023.pdf) to download the file via a web browser, or run this command in a terminal:
+
+   ```bash
+   wget https://raw.githubusercontent.com/opea-project/GenAIComps/v1.1/comps/retrievers/redis/data/nke-10k-2023.pdf
+   ```
+
+   Upload:
+
+   ```bash
+   curl -X POST "http://${host_ip}:6007/v1/dataprep/ingest" \
+     -H "Content-Type: multipart/form-data" \
+     -F "files=@./nke-10k-2023.pdf"
+   ```
+
+   This command updates a knowledge base by uploading a local file for processing. Update the file path according to your environment.
+
+   Add knowledge base content via HTTP links:
+
+   ```bash
+   curl -X POST "http://${host_ip}:6007/v1/dataprep/ingest" \
+     -H "Content-Type: multipart/form-data" \
+     -F 'link_list=["https://opea.dev"]'
+   ```
+
+   This command updates a knowledge base by submitting a list of HTTP links for processing.
+
+   You can also list the files that have been uploaded:
+
+   ```bash
+   curl -X POST "http://${host_ip}:6007/v1/dataprep/get" \
+     -H "Content-Type: application/json"
+   ```
+
+   The response is JSON like the following. Notice that the returned `name`/`id` of an uploaded link ends in `.txt`, e.g. `https://xxx.txt`.
+
+   ```json
+   [
+     {
+       "name": "nke-10k-2023.pdf",
+       "id": "nke-10k-2023.pdf",
+       "type": "File",
+       "parent": ""
+     },
+     {
+       "name": "https://opea.dev.txt",
+       "id": "https://opea.dev.txt",
+       "type": "File",
+       "parent": ""
+     }
+   ]
+   ```
+
+   To delete a file or link you uploaded, use the `id` returned by the `/v1/dataprep/get` API as the `file_path`:
+
+   ```bash
+   # delete link
+   curl -X POST "http://${host_ip}:6007/v1/dataprep/delete" \
+     -d '{"file_path": "https://opea.dev.txt"}' \
+     -H "Content-Type: application/json"
+
+   # delete file
+   curl -X POST "http://${host_ip}:6007/v1/dataprep/delete" \
+     -d '{"file_path": "nke-10k-2023.pdf"}' \
+     -H "Content-Type: application/json"
+
+   # delete all uploaded files and links
+   curl -X POST "http://${host_ip}:6007/v1/dataprep/delete" \
+     -d '{"file_path": "all"}' \
+     -H "Content-Type: application/json"
+   ```
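+
+   As a convenience, the dataprep calls above can also be scripted. The snippet below is a minimal sketch using the third-party Python `requests` package (not part of this deployment); it assumes the default dataprep port `6007` used throughout this guide and reads `host_ip` from the environment, so adjust both for your setup.
+
+   ```python
+   import os
+
+   import requests
+
+   # Assumption: host_ip exported as in this guide; 6007 is the default dataprep port.
+   base_url = f"http://{os.environ.get('host_ip', 'localhost')}:6007/v1/dataprep"
+
+   # Upload a local file (multipart upload, same as the curl -F "files=@..." example above).
+   with open("nke-10k-2023.pdf", "rb") as f:
+       resp = requests.post(f"{base_url}/ingest", files={"files": f})
+       resp.raise_for_status()
+
+   # Ingest a list of HTTP links (same as the curl -F 'link_list=[...]' example above).
+   resp = requests.post(f"{base_url}/ingest", files={"link_list": (None, '["https://opea.dev"]')})
+   resp.raise_for_status()
+
+   # List everything that has been ingested so far.
+   resp = requests.post(f"{base_url}/get", headers={"Content-Type": "application/json"})
+   print(resp.json())
+   ```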
+
+### Profile Microservices
+
+To further analyze microservice performance, users can follow the instructions below to profile the microservices.
+
+#### 1. LLM Endpoint Service
+
+Users can profile the performance of the endpoint service using standard HTTP/network profiling tools such as:
+
+- cURL timing statistics
+- Browser developer tools
+- Network monitoring tools
+
+Example using cURL with timing data:
+
+```bash
+curl -w "\nTime Statistics:\n-----------------\n\
+DNS Lookup: %{time_namelookup}s\n\
+TCP Connect: %{time_connect}s\n\
+TLS Handshake: %{time_appconnect}s\n\
+First Byte: %{time_starttransfer}s\n\
+Total Time: %{time_total}s\n" \
+-H "Content-Type: application/json" \
+-H "Authorization: Bearer $OPENAI_API_KEY" \
+-d '{
+  "model": "'"${LLM_MODEL_ID}"'",
+  "messages": [
+    {
+      "role": "user",
+      "content": "What is machine learning?"
+    }
+  ]
+}' \
+${LLM_ENDPOINT}/v1/chat/completions
+```
+
+You can also use tools like `ab` (Apache Benchmark) for load testing, where `payload.json` contains the JSON request body shown above:
+
+```bash
+ab -n 100 -c 10 -p payload.json -T 'application/json' \
+   -H "Authorization: Bearer $OPENAI_API_KEY" \
+   ${LLM_ENDPOINT}/v1/chat/completions
+```
+
+For detailed API latency monitoring, consider using:
+
+- Grafana for visualization
+- Prometheus for metrics collection
+- OpenTelemetry for distributed tracing
+
+## Conclusion
+
+This guide should enable developers to deploy the default configuration or any of the other compose YAML files for different configurations. It also highlights the configurable parameters that can be set before deployment.
diff --git a/ChatQnA/docker_compose/intel/cpu/xeon/README_opengauss.md b/ChatQnA/docker_compose/intel/cpu/xeon/README_opengauss.md
new file mode 100644
index 0000000000..4cf2670150
--- /dev/null
+++ b/ChatQnA/docker_compose/intel/cpu/xeon/README_opengauss.md
@@ -0,0 +1,424 @@
+# Deploying ChatQnA with openGauss on Intel® Xeon® Processors
+
+This document outlines the deployment process for a ChatQnA application utilizing the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservice pipeline on Intel® Xeon® servers. The pipeline integrates **openGauss** as the vector database (VectorDB) and includes microservices such as `embedding`, `retriever`, `rerank`, and `llm`.
+
+---
+
+## Table of Contents
+
+1. [Quick Start](#quick-start)
+2. [Build Docker Images](#build-docker-images)
+3. [Validate Microservices](#validate-microservices)
+4. [Launch the UI](#launch-the-ui)
+5. [Launch the Conversational UI (Optional)](#launch-the-conversational-ui-optional)
+
+---
+
+## Quick Start
+
+### 1. Set up Environment Variables
+
+To set up environment variables for deploying ChatQnA services, follow these steps:
+
+1.
Set the required environment variables: + + ```bash + # Example: host_ip="192.168.1.1" + export host_ip="External_Public_IP" + export HF_TOKEN="Your_Huggingface_API_Token" + export GS_USER="gaussdb" + export GS_PASSWORD="openGauss@123" + export GS_DB="postgres" + export GS_CONNECTION_STRING="opengauss+psycopg2://${GS_USER}:${GS_PASSWORD}@${ip_address}:5432/${GS_DB}" + ``` + +2. If you are in a proxy environment, also set the proxy-related environment variables: + + ```bash + export http_proxy="Your_HTTP_Proxy" + export https_proxy="Your_HTTPS_Proxy" + # Example: no_proxy="localhost,127.0.0.1,192.168.1.1" + export no_proxy="Your_No_Proxy",chatqna-xeon-ui-server,chatqna-xeon-backend-server,dataprep-opengauss-service,tei-embedding-service,retriever,tei-reranking-service,tgi-service,vllm-service + ``` + +3. Set up other environment variables: + ```bash + source ./set_env.sh + ``` + +### 2.Run Docker Compose + +```bash +docker compose -f compose_opengauss.yaml up -d +``` + +It will automatically download the Docker image on `Docker hub`: + +```bash +docker pull opea/chatqna:latest +docker pull opea/chatqna-ui:latest +``` + +Note: You should build docker image from source by yourself if: + +- You are developing off the git main branch (as the container's ports in the repo may be different from the published docker image). +- You can't download the docker image. +- You want to use a specific version of Docker image. + +Please refer to ['Build Docker Images'](#build-docker-images) in below. + +### 3.Consume the ChatQnA Service + +```bash +curl http://${host_ip}:8888/v1/chatqna \ + -H "Content-Type: application/json" \ + -d '{ + "messages": "What is the revenue of Nike in 2023?" + }' +``` + +## Build Docker Images + +First of all, you need to build Docker Images locally and install the python package of it. + +```bash +git clone https://github.com/opea-project/GenAIComps.git +cd GenAIComps +``` + +### 1. Build Retriever Image + +```bash +docker build --no-cache -t opea/retriever:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/retrievers/src/Dockerfile . +``` + +### 2. Build Dataprep Image + +```bash +docker build --no-cache -t opea/dataprep:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/dataprep/src/Dockerfile . +cd .. +``` + +### 3. Build MegaService Docker Image + +1. MegaService with Rerank + + To construct the Mega Service with Rerank, we utilize the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservice pipeline within the `chatqna.py` Python script. Build MegaService Docker image via below command: + + ```bash + git clone https://github.com/opea-project/GenAIExamples.git + cd GenAIExamples/ChatQnA + docker build --no-cache -t opea/chatqna:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . + ``` + +2. MegaService without Rerank + + To construct the Mega Service without Rerank, we utilize the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservice pipeline within the `chatqna_without_rerank.py` Python script. Build MegaService Docker image via below command: + + ```bash + git clone https://github.com/opea-project/GenAIExamples.git + cd GenAIExamples/ChatQnA + docker build --no-cache -t opea/chatqna-without-rerank:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile.without_rerank . + ``` + +### 4. 
Build UI Docker Image + +Build frontend Docker image via below command: + +```bash +cd GenAIExamples/ChatQnA/ui +docker build --no-cache -t opea/chatqna-ui:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f ./docker/Dockerfile . +``` + +### 5. Build Conversational React UI Docker Image (Optional) + +Build frontend Docker image that enables Conversational experience with ChatQnA megaservice via below command: + +**Export the value of the public IP address of your Xeon server to the `host_ip` environment variable** + +```bash +cd GenAIExamples/ChatQnA/ui +docker build --no-cache -t opea/chatqna-conversation-ui:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f ./docker/Dockerfile.react . +``` + +### 6. Build Nginx Docker Image + +```bash +cd GenAIComps +docker build -t opea/nginx:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/third_parties/nginx/src/Dockerfile . +``` + +Then run the command `docker images`, you will have the following 5 Docker Images: + +1. `opea/dataprep:latest` +2. `opea/retriever:latest` +3. `opea/chatqna:latest` or `opea/chatqna-without-rerank:latest` +4. `opea/chatqna-ui:latest` +5. `opea/nginx:latest` + +## 🚀 Start Microservices + +### Required Models + +By default, the embedding, reranking and LLM models are set to a default value as listed below: + +| Service | Model | +| --------- | ----------------------------------- | +| Embedding | BAAI/bge-base-en-v1.5 | +| Reranking | BAAI/bge-reranker-base | +| LLM | meta-llama/Meta-Llama-3-8B-Instruct | + +Change the `xxx_MODEL_ID` below for your needs. + +For users in China who are unable to download models directly from Huggingface, you can use [ModelScope](https://www.modelscope.cn/models) or a Huggingface mirror to download models. The vLLM can load the models either online or offline as described below: + +1. Online + + ```bash + export HF_TOKEN=${your_hf_token} + export HF_ENDPOINT="https://hf-mirror.com" + model_name="meta-llama/Meta-Llama-3-8B-Instruct" + docker run -p 8008:80 -v ./data:/root/.cache/huggingface/hub --name vllm-service -e HF_ENDPOINT=$HF_ENDPOINT -e http_proxy=$http_proxy -e https_proxy=$https_proxy --shm-size 128g opea/vllm:latest --model $model_name --host 0.0.0.0 --port 80 + ``` + +2. Offline + + - Search your model name in ModelScope. For example, check [this page](https://modelscope.cn/models/LLM-Research/Meta-Llama-3-8B-Instruct/files) for model `Meta-Llama-3-8B-Instruct`. + + - Click on `Download this model` button, and choose one way to download the model to your local path `/path/to/model`. + + - Run the following command to start the LLM service. + + ```bash + export HF_TOKEN=${your_hf_token} + export model_path="/path/to/model" + docker run -p 8008:80 -v $model_path:/root/.cache/huggingface/hub --name vllm-service --shm-size 128g opea/vllm:latest --model /root/.cache/huggingface/hub --host 0.0.0.0 --port 80 + ``` + +### Set up Environment Variables + +1. Set the required environment variables: + + ```bash + # Example: host_ip="192.168.1.1" + export host_ip="External_Public_IP" + export HF_TOKEN="Your_Huggingface_API_Token" + # Example: NGINX_PORT=80 + export NGINX_PORT=${your_nginx_port} + export GS_USER="gaussdb" + export GS_PASSWORD="openGauss@123" + export GS_DB="postgres" + export GS_CONNECTION_STRING="opengauss+psycopg2://${GS_USER}:${GS_PASSWORD}@${ip_address}:5432/${GS_DB}" + ``` + +2. 
If you are in a proxy environment, also set the proxy-related environment variables: + + ```bash + export http_proxy="Your_HTTP_Proxy" + export https_proxy="Your_HTTPs_Proxy" + # Example: no_proxy="localhost, 127.0.0.1, 192.168.1.1" + export no_proxy="Your_No_Proxy",chatqna-xeon-ui-server,chatqna-xeon-backend-server,dataprep-opengauss-service,tei-embedding-service,retriever,tei-reranking-service,tgi-service,vllm-service + ``` + +3. Set up other environment variables, make sure to update the INDEX_NAME variable to use openGauss Index name: + + ```bash + source ./set_env.sh + ``` + +### Start all the services Docker Containers + +> Before running the docker compose command, you need to be in the folder that has the docker compose yaml file + +```bash +cd GenAIExamples/ChatQnA/docker_compose/intel/cpu/xeon/ +``` + +If use vLLM backend. + +```bash +# Start ChatQnA with Rerank Pipeline +docker compose -f compose_opengauss.yaml up -d +``` + +## Validate Microservices + +Note, when verify the microservices by curl or API from remote client, please make sure the **ports** of the microservices are opened in the firewall of the cloud node. +Follow the instructions to validate MicroServices. +For details on how to verify the correctness of the response, refer to [how-to-validate_service](../../hpu/gaudi/how_to_validate_service.md). + +1. TEI Embedding Service + + ```bash + curl ${host_ip}:6006/embed \ + -X POST \ + -d '{"inputs":"What is Deep Learning?"}' \ + -H 'Content-Type: application/json' + ``` + +2. Retriever Microservice + + To consume the retriever microservice, you need to generate a mock embedding vector by Python script. The length of embedding vector + is determined by the embedding model. + Here we use the model `EMBEDDING_MODEL_ID="BAAI/bge-base-en-v1.5"`, which vector size is 768. + + Check the vector dimension of your embedding model, set `your_embedding` dimension equals to it. + + ```bash + export your_embedding=$(python3 -c "import random; embedding = [random.uniform(-1, 1) for _ in range(768)]; print(embedding)") + curl http://${host_ip}:7000/v1/retrieval \ + -X POST \ + -d "{\"text\":\"test\",\"embedding\":${your_embedding}}" \ + -H 'Content-Type: application/json' + ``` + +3. TEI Reranking Service + + > Skip for ChatQnA without Rerank pipeline + + ```bash + curl http://${host_ip}:8808/rerank \ + -X POST \ + -d '{"query":"What is Deep Learning?", "texts": ["Deep Learning is not...", "Deep learning is..."]}' \ + -H 'Content-Type: application/json' + ``` + +4. LLM backend Service + + In the first startup, this service will take more time to download, load and warm up the model. After it's finished, the service will be ready. + + Try the command below to check whether the LLM serving is ready. + + ```bash + docker logs vllm-service 2>&1 | grep complete + ``` + + If the service is ready, you will get the response like below. + + ```text + INFO: Application startup complete. + ``` + + Then try the `cURL` command below to validate services. + + ```bash + curl http://${host_ip}:9009/v1/chat/completions \ + -X POST \ + -d '{"model": "meta-llama/Meta-Llama-3-8B-Instruct", "messages": [{"role": "user", "content": "What is Deep Learning?"}], "max_tokens":17}' \ + -H 'Content-Type: application/json' + ``` + +5. MegaService + + ```bash + curl http://${host_ip}:8888/v1/chatqna -H "Content-Type: application/json" -d '{ + "messages": "What is the revenue of Nike in 2023?" + }' + ``` + +6. 
Nginx Service + + ```bash + curl http://${host_ip}:${NGINX_PORT}/v1/chatqna \ + -H "Content-Type: application/json" \ + -d '{"messages": "What is the revenue of Nike in 2023?"}' + ``` + +7. Dataprep Microservice(Optional) + +If you want to update the default knowledge base, you can use the following commands: + +Update Knowledge Base via Local File [nke-10k-2023.pdf](https://raw.githubusercontent.com/opea-project/GenAIComps/v1.3/comps/third_parties/pathway/src/data/nke-10k-2023.pdf). Or +click [here](https://raw.githubusercontent.com/opea-project/GenAIComps/v1.3/comps/third_parties/pathway/src/data/nke-10k-2023.pdf) to download the file via any web browser. +Or run this command to get the file on a terminal. + +```bash +wget https://raw.githubusercontent.com/opea-project/GenAIComps/v1.3/comps/third_parties/pathway/src/data/nke-10k-2023.pdf + +``` + +Upload: + +```bash +curl -X POST "http://${host_ip}:6007/v1/dataprep/ingest" \ + -H "Content-Type: multipart/form-data" \ + -F "files=@./nke-10k-2023.pdf" +``` + +This command updates a knowledge base by uploading a local file for processing. Update the file path according to your environment. + +Add Knowledge Base via HTTP Links: + +```bash +curl -X POST "http://${host_ip}:6007/v1/dataprep/ingest" \ + -H "Content-Type: multipart/form-data" \ + -F 'link_list=["https://opea.dev"]' +``` + +This command updates a knowledge base by submitting a list of HTTP links for processing. + +To delete the files/link you uploaded: + +```bash +# delete all uploaded files and links +curl -X POST "http://${host_ip}:6007/v1/dataprep/delete" \ + -d '{"file_path": "all"}' \ + -H "Content-Type: application/json" +``` + +## Launch the UI + +### Launch with origin port + +To access the frontend, open the following URL in your browser: http://{host_ip}:5173. By default, the UI runs on port 5173 internally. If you prefer to use a different host port to access the frontend, you can modify the port mapping in the `compose.yaml` file as shown below: + +```yaml + chaqna-gaudi-ui-server: + image: opea/chatqna-ui:latest + ... + ports: + - "80:5173" +``` + +### Launch with Nginx + +If you want to launch the UI using Nginx, open this URL: `http://${host_ip}:${NGINX_PORT}` in your browser to access the frontend. + +## Launch the Conversational UI (Optional) + +To access the Conversational UI (react based) frontend, modify the UI service in the `compose.yaml` file. Replace `chaqna-xeon-ui-server` service with the `chatqna-xeon-conversation-ui-server` service as per the config below: + +```yaml +chaqna-xeon-conversation-ui-server: + image: opea/chatqna-conversation-ui:latest + container_name: chatqna-xeon-conversation-ui-server + environment: + - APP_BACKEND_SERVICE_ENDPOINT=${BACKEND_SERVICE_ENDPOINT} + - APP_DATA_PREP_SERVICE_URL=${DATAPREP_SERVICE_ENDPOINT} + ports: + - "5174:80" + depends_on: + - chaqna-xeon-backend-server + ipc: host + restart: always +``` + +Once the services are up, open the following URL in your browser: http://{host_ip}:5174. By default, the UI runs on port 80 internally. If you prefer to use a different host port to access the frontend, you can modify the port mapping in the `compose.yaml` file as shown below: + +```yaml + chaqna-gaudi-conversation-ui-server: + image: opea/chatqna-conversation-ui:latest + ... 
+ ports: + - "80:80" +``` + +![project-screenshot](../../../../assets/img/chat_ui_init.png) + +Here is an example of running ChatQnA: + +![project-screenshot](../../../../assets/img/chat_ui_response.png) + +Here is an example of running ChatQnA with Conversational UI (React): + +![project-screenshot](../../../../assets/img/conversation_ui_response.png) diff --git a/ChatQnA/docker_compose/intel/cpu/xeon/compose.yaml b/ChatQnA/docker_compose/intel/cpu/xeon/compose.yaml index fb9d4ce9c8..e276089e36 100644 --- a/ChatQnA/docker_compose/intel/cpu/xeon/compose.yaml +++ b/ChatQnA/docker_compose/intel/cpu/xeon/compose.yaml @@ -89,7 +89,7 @@ services: HF_HUB_ENABLE_HF_TRANSFER: 0 command: --model-id ${RERANK_MODEL_ID} --auto-truncate vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-service ports: - "9009:80" diff --git a/ChatQnA/docker_compose/intel/cpu/xeon/compose_endpoint_openai.yaml b/ChatQnA/docker_compose/intel/cpu/xeon/compose_endpoint_openai.yaml new file mode 100644 index 0000000000..ed8045276e --- /dev/null +++ b/ChatQnA/docker_compose/intel/cpu/xeon/compose_endpoint_openai.yaml @@ -0,0 +1,173 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +services: + redis-vector-db: + image: redis/redis-stack:7.2.0-v9 + container_name: redis-vector-db + ports: + - "6379:6379" + - "8001:8001" + healthcheck: + test: ["CMD", "redis-cli", "ping"] + interval: 5s + timeout: 3s + retries: 10 + dataprep-redis-service: + image: ${REGISTRY:-opea}/dataprep:${TAG:-latest} + container_name: dataprep-redis-server + depends_on: + redis-vector-db: + condition: service_healthy + tei-embedding-service: + condition: service_started + ports: + - "6007:5000" + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + REDIS_URL: redis://redis-vector-db:6379 + REDIS_HOST: redis-vector-db + INDEX_NAME: ${INDEX_NAME} + TEI_ENDPOINT: http://tei-embedding-service:80 + HUGGINGFACEHUB_API_TOKEN: ${HF_TOKEN} + healthcheck: + test: ["CMD-SHELL", "curl -f http://localhost:5000/v1/health_check || exit 1"] + interval: 10s + timeout: 5s + retries: 50 + restart: unless-stopped + tei-embedding-service: + image: ghcr.io/huggingface/text-embeddings-inference:cpu-1.7 + container_name: tei-embedding-server + ports: + - "6006:80" + volumes: + - "${MODEL_CACHE:-./data}:/data" + shm_size: 1g + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + command: --model-id ${EMBEDDING_MODEL_ID} --auto-truncate + retriever: + image: ${REGISTRY:-opea}/retriever:${TAG:-latest} + container_name: retriever-redis-server + depends_on: + - redis-vector-db + ports: + - "7000:7000" + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + REDIS_URL: redis://redis-vector-db:6379 + REDIS_HOST: redis-vector-db + INDEX_NAME: ${INDEX_NAME} + TEI_EMBEDDING_ENDPOINT: http://tei-embedding-service:80 + HUGGINGFACEHUB_API_TOKEN: ${HF_TOKEN} + LOGFLAG: ${LOGFLAG} + RETRIEVER_COMPONENT_NAME: "OPEA_RETRIEVER_REDIS" + restart: unless-stopped + tei-reranking-service: + image: ghcr.io/huggingface/text-embeddings-inference:cpu-1.7 + container_name: tei-reranking-server + ports: + - "8808:80" + volumes: + - "${MODEL_CACHE:-./data}:/data" + shm_size: 1g + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + command: --model-id ${RERANK_MODEL_ID} --auto-truncate + # Substitute 
vllm with OpeaTextGenService + textgen-service-endpoint-openai: # Used instead of vllm + image: opea/llm-textgen:${TAG:-latest} # Changed image + container_name: textgen-service-endpoint-openai # Updated container name + ipc: host + ports: + - "9000:9000" # Changed port mapping + environment: + LLM_COMPONENT_NAME: OpeaTextGenService + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + LLM_MODEL_ID: ${LLM_MODEL_ID} # Set to model ID + LLM_ENDPOINT: ${LLM_ENDPOINT} # An openai compatible endpoint, e.g. Hugging Face, OpenRouter, OpenAI + OPENAI_API_KEY: ${OPENAI_API_KEY} # Add OpenRouter API Key + chatqna-xeon-backend-server: + image: ${REGISTRY:-opea}/chatqna:${TAG:-latest} + container_name: chatqna-xeon-backend-server + depends_on: + redis-vector-db: + condition: service_started + dataprep-redis-service: + condition: service_healthy + tei-embedding-service: + condition: service_started + retriever: + condition: service_started + tei-reranking-service: + condition: service_started + textgen-service-endpoint-openai: + condition: service_started + ports: + - "8888:8888" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - MEGA_SERVICE_HOST_IP=chatqna-xeon-backend-server + - EMBEDDING_SERVER_HOST_IP=tei-embedding-service + - EMBEDDING_SERVER_PORT=${EMBEDDING_SERVER_PORT:-80} + - RETRIEVER_SERVICE_HOST_IP=retriever + - RERANK_SERVER_HOST_IP=tei-reranking-service + - RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80} + - LLM_SERVER_HOST_IP=textgen-service-endpoint-openai # Updated host IP + - LLM_SERVER_PORT=${LLM_SERVER_PORT:-9000} + - LLM_MODEL=${LLM_MODEL_ID} + - LOGFLAG=${LOGFLAG} + ipc: host + restart: always + chatqna-xeon-ui-server: + image: ${REGISTRY:-opea}/chatqna-ui:${TAG:-latest} + container_name: chatqna-xeon-ui-server + depends_on: + - chatqna-xeon-backend-server + ports: + - "5173:5173" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + ipc: host + restart: always + chatqna-xeon-nginx-server: + image: ${REGISTRY:-opea}/nginx:${TAG:-latest} + container_name: chatqna-xeon-nginx-server + depends_on: + - chatqna-xeon-backend-server + - chatqna-xeon-ui-server + ports: + - "${NGINX_PORT:-80}:80" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - FRONTEND_SERVICE_IP=chatqna-xeon-ui-server + - FRONTEND_SERVICE_PORT=5173 + - BACKEND_SERVICE_NAME=chatqna + - BACKEND_SERVICE_IP=chatqna-xeon-backend-server + - BACKEND_SERVICE_PORT=8888 + - DATAPREP_SERVICE_IP=dataprep-redis-service + - DATAPREP_SERVICE_PORT=5000 + ipc: host + restart: always + +networks: + default: + driver: bridge diff --git a/ChatQnA/docker_compose/intel/cpu/xeon/compose_faqgen.yaml b/ChatQnA/docker_compose/intel/cpu/xeon/compose_faqgen.yaml index e34f6f0062..a1a7d05fba 100644 --- a/ChatQnA/docker_compose/intel/cpu/xeon/compose_faqgen.yaml +++ b/ChatQnA/docker_compose/intel/cpu/xeon/compose_faqgen.yaml @@ -81,7 +81,7 @@ services: HF_HUB_ENABLE_HF_TRANSFER: 0 command: --model-id ${RERANK_MODEL_ID} --auto-truncate vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-server ports: - ${LLM_ENDPOINT_PORT:-9009}:80 diff --git a/ChatQnA/docker_compose/intel/cpu/xeon/compose_mariadb.yaml b/ChatQnA/docker_compose/intel/cpu/xeon/compose_mariadb.yaml index ccd55bbce3..ab5217f359 100644 --- a/ChatQnA/docker_compose/intel/cpu/xeon/compose_mariadb.yaml +++ 
b/ChatQnA/docker_compose/intel/cpu/xeon/compose_mariadb.yaml @@ -90,7 +90,7 @@ services: HF_HUB_ENABLE_HF_TRANSFER: 0 command: --model-id ${RERANK_MODEL_ID} --auto-truncate vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-service ports: - "9009:80" diff --git a/ChatQnA/docker_compose/intel/cpu/xeon/compose_milvus.yaml b/ChatQnA/docker_compose/intel/cpu/xeon/compose_milvus.yaml index 67226bd404..2f6fe6d439 100644 --- a/ChatQnA/docker_compose/intel/cpu/xeon/compose_milvus.yaml +++ b/ChatQnA/docker_compose/intel/cpu/xeon/compose_milvus.yaml @@ -144,7 +144,7 @@ services: command: --model-id ${RERANK_MODEL_ID} --auto-truncate vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-service ports: - "9009:80" diff --git a/ChatQnA/docker_compose/intel/cpu/xeon/compose_openeuler.yaml b/ChatQnA/docker_compose/intel/cpu/xeon/compose_openeuler.yaml index 44fef78971..679ddd2fd8 100644 --- a/ChatQnA/docker_compose/intel/cpu/xeon/compose_openeuler.yaml +++ b/ChatQnA/docker_compose/intel/cpu/xeon/compose_openeuler.yaml @@ -88,14 +88,13 @@ services: HF_HUB_ENABLE_HF_TRANSFER: 0 command: --model-id ${RERANK_MODEL_ID} --auto-truncate vllm-service: - image: openeuler/vllm-cpu:0.9.1-oe2403lts + image: openeuler/vllm-cpu:0.10.1-oe2403lts container_name: vllm-service ports: - "9009:80" volumes: - "${MODEL_CACHE:-./data}:/root/.cache/huggingface/hub" shm_size: 128g - privileged: true environment: no_proxy: ${no_proxy} http_proxy: ${http_proxy} diff --git a/ChatQnA/docker_compose/intel/cpu/xeon/compose_opengauss.yaml b/ChatQnA/docker_compose/intel/cpu/xeon/compose_opengauss.yaml new file mode 100644 index 0000000000..de131ba873 --- /dev/null +++ b/ChatQnA/docker_compose/intel/cpu/xeon/compose_opengauss.yaml @@ -0,0 +1,185 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +services: + opengauss-db: + image: opengauss/opengauss:7.0.0-RC2.B015 + container_name: opengauss-db + ports: + - "${GS_PORT:-5432}:5432" + restart: always + environment: + - GS_PASSWORD=${GS_PASSWORD} + healthcheck: + test: ["CMD-SHELL", "sleep 10 && exit 0"] + interval: 1s + timeout: 15s + retries: 1 + dataprep-opengauss-service: + image: ${REGISTRY:-opea}/dataprep:${TAG:-latest} + container_name: dataprep-opengauss-server + depends_on: + opengauss-db: + condition: service_healthy + tei-embedding-service: + condition: service_started + ports: + - "6007:5000" + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + GS_CONNECTION_STRING: ${GS_CONNECTION_STRING} + DATAPREP_COMPONENT_NAME: "OPEA_DATAPREP_OPENGAUSS" + TEI_ENDPOINT: http://tei-embedding-service:80 + TEI_EMBEDDING_ENDPOINT: http://tei-embedding-service:80 + HF_TOKEN: ${HF_TOKEN} + healthcheck: + test: ["CMD-SHELL", "curl -f http://localhost:5000/v1/health_check || exit 1"] + interval: 10s + timeout: 5s + retries: 50 + restart: unless-stopped + tei-embedding-service: + image: ghcr.io/huggingface/text-embeddings-inference:cpu-1.7 + container_name: tei-embedding-server + ports: + - "6006:80" + volumes: + - "${MODEL_CACHE:-./data}:/data" + shm_size: 1g + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + command: --model-id ${EMBEDDING_MODEL_ID} --auto-truncate + retriever: + image: ${REGISTRY:-opea}/retriever:${TAG:-latest} + container_name: retriever-opengauss-server + depends_on: + 
opengauss-db: + condition: service_healthy + ports: + - "7000:7000" + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + TEI_EMBEDDING_ENDPOINT: http://tei-embedding-service:80 + HF_TOKEN: ${HF_TOKEN} + LOGFLAG: ${LOGFLAG} + GS_CONNECTION_STRING: ${GS_CONNECTION_STRING} + RETRIEVER_COMPONENT_NAME: "OPEA_RETRIEVER_OPENGAUSS" + restart: unless-stopped + tei-reranking-service: + image: ghcr.io/huggingface/text-embeddings-inference:cpu-1.7 + container_name: tei-reranking-server + ports: + - "8808:80" + volumes: + - "${MODEL_CACHE:-./data}:/data" + shm_size: 1g + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + HF_TOKEN: ${HF_TOKEN} + HF_HUB_DISABLE_PROGRESS_BARS: 1 + HF_HUB_ENABLE_HF_TRANSFER: 0 + command: --model-id ${RERANK_MODEL_ID} --auto-truncate + vllm-service: + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 + container_name: vllm-service + ports: + - "9009:80" + volumes: + - "${MODEL_CACHE:-./data}:/root/.cache/huggingface/hub" + shm_size: 128g + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + HF_TOKEN: ${HF_TOKEN} + LLM_MODEL_ID: ${LLM_MODEL_ID} + VLLM_TORCH_PROFILER_DIR: "/mnt" + HF_HUB_OFFLINE: ${HF_HUB_OFFLINE:-0} + VLLM_CPU_KVCACHE_SPACE: 40 + healthcheck: + test: ["CMD-SHELL", "curl -f http://$host_ip:9009/health || exit 1"] + interval: 10s + timeout: 10s + retries: 100 + command: --model $LLM_MODEL_ID --host 0.0.0.0 --port 80 + chatqna-xeon-backend-server: + image: ${REGISTRY:-opea}/chatqna:${TAG:-latest} + container_name: chatqna-xeon-backend-server + depends_on: + opengauss-db: + condition: service_started + dataprep-opengauss-service: + condition: service_healthy + tei-embedding-service: + condition: service_started + retriever: + condition: service_started + tei-reranking-service: + condition: service_started + vllm-service: + condition: service_healthy + ports: + - "8888:8888" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - MEGA_SERVICE_HOST_IP=chatqna-xeon-backend-server + - EMBEDDING_SERVER_HOST_IP=tei-embedding-service + - EMBEDDING_SERVER_PORT=${EMBEDDING_SERVER_PORT:-80} + - RETRIEVER_SERVICE_HOST_IP=retriever + - RERANK_SERVER_HOST_IP=tei-reranking-service + - RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80} + - LLM_SERVER_HOST_IP=vllm-service + - LLM_SERVER_PORT=80 + - LLM_MODEL=${LLM_MODEL_ID} + - LOGFLAG=${LOGFLAG} + ipc: host + restart: always + chatqna-xeon-ui-server: + image: ${REGISTRY:-opea}/chatqna-ui:${TAG:-latest} + container_name: chatqna-xeon-ui-server + depends_on: + - chatqna-xeon-backend-server + ports: + - "5173:5173" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + ipc: host + restart: always + chatqna-xeon-nginx-server: + image: ${REGISTRY:-opea}/nginx:${TAG:-latest} + container_name: chatqna-xeon-nginx-server + depends_on: + - chatqna-xeon-backend-server + - chatqna-xeon-ui-server + ports: + - "${NGINX_PORT:-80}:80" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - FRONTEND_SERVICE_IP=chatqna-xeon-ui-server + - FRONTEND_SERVICE_PORT=5173 + - BACKEND_SERVICE_NAME=chatqna + - BACKEND_SERVICE_IP=chatqna-xeon-backend-server + - BACKEND_SERVICE_PORT=8888 + - DATAPREP_SERVICE_IP=dataprep-opengauss-service + - DATAPREP_SERVICE_PORT=5000 + ipc: host + restart: always + +networks: + default: + driver: bridge diff --git 
a/ChatQnA/docker_compose/intel/cpu/xeon/compose_pinecone.yaml b/ChatQnA/docker_compose/intel/cpu/xeon/compose_pinecone.yaml index cfa6c5aebe..ffa4dd67f8 100644 --- a/ChatQnA/docker_compose/intel/cpu/xeon/compose_pinecone.yaml +++ b/ChatQnA/docker_compose/intel/cpu/xeon/compose_pinecone.yaml @@ -76,7 +76,7 @@ services: HF_HUB_ENABLE_HF_TRANSFER: 0 command: --model-id ${RERANK_MODEL_ID} --auto-truncate vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-service ports: - "9009:80" diff --git a/ChatQnA/docker_compose/intel/cpu/xeon/compose_qdrant.yaml b/ChatQnA/docker_compose/intel/cpu/xeon/compose_qdrant.yaml index fb12b77e1a..3fdd295374 100644 --- a/ChatQnA/docker_compose/intel/cpu/xeon/compose_qdrant.yaml +++ b/ChatQnA/docker_compose/intel/cpu/xeon/compose_qdrant.yaml @@ -81,7 +81,7 @@ services: HF_HUB_ENABLE_HF_TRANSFER: 0 command: --model-id ${RERANK_MODEL_ID} --auto-truncate vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-service ports: - "6042:80" diff --git a/ChatQnA/docker_compose/intel/cpu/xeon/compose_without_rerank.yaml b/ChatQnA/docker_compose/intel/cpu/xeon/compose_without_rerank.yaml index 841a0ad531..00e6474b86 100644 --- a/ChatQnA/docker_compose/intel/cpu/xeon/compose_without_rerank.yaml +++ b/ChatQnA/docker_compose/intel/cpu/xeon/compose_without_rerank.yaml @@ -65,7 +65,7 @@ services: RETRIEVER_COMPONENT_NAME: "OPEA_RETRIEVER_REDIS" restart: unless-stopped vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-service ports: - "9009:80" diff --git a/ChatQnA/docker_compose/intel/hpu/gaudi/README.md b/ChatQnA/docker_compose/intel/hpu/gaudi/README.md index 9a1cd54bb8..40d282cc43 100644 --- a/ChatQnA/docker_compose/intel/hpu/gaudi/README.md +++ b/ChatQnA/docker_compose/intel/hpu/gaudi/README.md @@ -294,6 +294,43 @@ The `tgi-guardrails-service` uses the `GUARDRAILS_MODEL_ID` parameter to select The `vllm-guardrails-service` uses the `GUARDRAILS_MODEL_ID` parameter to select a [supported model](https://docs.vllm.ai/en/latest/models/supported_models.html) for the associated `opea/vllm-gaudi:latest` image. It uses the `NUM_CARDS` parameter. +## ChatQnA with Conversational UI (Optional) + +To access the Conversational UI (react based) frontend, modify the UI service in the `compose` file used to deploy. Replace `chatqna-xeon-ui-server` service with the `chatqna-xeon-conversation-ui-server` service as per the config below: + +```yaml +chatqna-xeon-conversation-ui-server: + image: opea/chatqna-conversation-ui:latest + container_name: chatqna-xeon-conversation-ui-server + environment: + - APP_BACKEND_SERVICE_ENDPOINT=${BACKEND_SERVICE_ENDPOINT} + - APP_DATA_PREP_SERVICE_URL=${DATAPREP_SERVICE_ENDPOINT} + ports: + - "5174:80" + depends_on: + - chatqna-xeon-backend-server + ipc: host + restart: always +``` + +Once the services are up, open the following URL in the browser: http://{host_ip}:5174. By default, the UI runs on port 80 internally. If the developer prefers to use a different host port to access the frontend, it can be modified by port mapping in the `compose.yaml` file as shown below: + +```yaml + chatqna-gaudi-conversation-ui-server: + image: opea/chatqna-conversation-ui:latest + ... 
+ ports: + - "80:80" +``` + +Here is an example of running ChatQnA (default UI): + +![project-screenshot](../../../../assets/img/chat_ui_response.png) + +Here is an example of running ChatQnA with Conversational UI (React): + +![project-screenshot](../../../../assets/img/conversation_ui_response.png) + ## Conclusion In examining the various services and configurations across different deployments, developers should gain a comprehensive understanding of how each component contributes to the overall functionality and performance of a ChatQnA pipeline on an Intel® Gaudi® platform. Key services such as the `vllm-service`, `tei-embedding-service`, `tei-reranking-service`, `tgi-guardrails-service`and `vllm-guardrails-service` each consume Gaudi accelerators, leveraging specific models and hardware resources to optimize their respective tasks. The `LLM_MODEL_ID`, `EMBEDDING_MODEL_ID`, `RERANK_MODEL_ID`, and `GUARDRAILS_MODEL_ID` parameters specify the models used, directly impacting the quality and effectiveness of language processing, embedding, reranking, and safety operations. diff --git a/ChatQnA/docker_compose/intel/hpu/gaudi/compose.telemetry.yaml b/ChatQnA/docker_compose/intel/hpu/gaudi/compose.telemetry.yaml index 00ace1e451..428271991c 100644 --- a/ChatQnA/docker_compose/intel/hpu/gaudi/compose.telemetry.yaml +++ b/ChatQnA/docker_compose/intel/hpu/gaudi/compose.telemetry.yaml @@ -62,7 +62,7 @@ services: command: - '--path.procfs=/host/proc' - '--path.sysfs=/host/sys' - - --collector.filesystem.ignored-mount-points + - --collector.filesystem.mount-points-exclude - "^/(sys|proc|dev|host|etc|rootfs/var/lib/docker/containers|rootfs/var/lib/docker/overlay2|rootfs/run/docker/netns|rootfs/var/lib/docker/aufs)($$|/)" ports: - 9100:9100 diff --git a/ChatQnA/docker_compose/intel/hpu/gaudi/compose.yaml b/ChatQnA/docker_compose/intel/hpu/gaudi/compose.yaml index 23e7cee19b..a762b21767 100644 --- a/ChatQnA/docker_compose/intel/hpu/gaudi/compose.yaml +++ b/ChatQnA/docker_compose/intel/hpu/gaudi/compose.yaml @@ -92,7 +92,7 @@ services: MAX_WARMUP_SEQUENCE_LENGTH: 512 command: --model-id ${RERANK_MODEL_ID} --auto-truncate vllm-service: - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} + image: opea/vllm-gaudi:1.22.0 container_name: vllm-gaudi-server ports: - "8007:80" diff --git a/ChatQnA/docker_compose/intel/hpu/gaudi/compose_faqgen.yaml b/ChatQnA/docker_compose/intel/hpu/gaudi/compose_faqgen.yaml index 3fa1b5c4af..182c2b5bc2 100644 --- a/ChatQnA/docker_compose/intel/hpu/gaudi/compose_faqgen.yaml +++ b/ChatQnA/docker_compose/intel/hpu/gaudi/compose_faqgen.yaml @@ -85,7 +85,7 @@ services: MAX_WARMUP_SEQUENCE_LENGTH: 512 command: --model-id ${RERANK_MODEL_ID} --auto-truncate vllm-service: - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} + image: opea/vllm-gaudi:1.22.0 container_name: vllm-gaudi-server ports: - ${LLM_ENDPOINT_PORT:-8007}:80 diff --git a/ChatQnA/docker_compose/intel/hpu/gaudi/compose_guardrails.yaml b/ChatQnA/docker_compose/intel/hpu/gaudi/compose_guardrails.yaml index e2ec071f1e..46ccee4773 100644 --- a/ChatQnA/docker_compose/intel/hpu/gaudi/compose_guardrails.yaml +++ b/ChatQnA/docker_compose/intel/hpu/gaudi/compose_guardrails.yaml @@ -32,7 +32,7 @@ services: retries: 50 restart: unless-stopped vllm-guardrails-service: - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} + image: opea/vllm-gaudi:1.22.0 container_name: vllm-guardrails-server ports: - "8088:80" @@ -130,7 +130,7 @@ services: MAX_WARMUP_SEQUENCE_LENGTH: 512 command: --model-id ${RERANK_MODEL_ID} --auto-truncate 
vllm-service: - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} + image: opea/vllm-gaudi:1.22.0 container_name: vllm-gaudi-server ports: - "8008:80" diff --git a/ChatQnA/docker_compose/intel/hpu/gaudi/compose_without_rerank.yaml b/ChatQnA/docker_compose/intel/hpu/gaudi/compose_without_rerank.yaml index 9c38b38772..017bf8d204 100644 --- a/ChatQnA/docker_compose/intel/hpu/gaudi/compose_without_rerank.yaml +++ b/ChatQnA/docker_compose/intel/hpu/gaudi/compose_without_rerank.yaml @@ -65,7 +65,7 @@ services: RETRIEVER_COMPONENT_NAME: "OPEA_RETRIEVER_REDIS" restart: unless-stopped vllm-service: - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} + image: opea/vllm-gaudi:1.22.0 container_name: vllm-gaudi-server ports: - "8007:80" diff --git a/ChatQnA/docker_image_build/build.yaml b/ChatQnA/docker_image_build/build.yaml index 3a5f6d4be3..2a5f8ccd62 100644 --- a/ChatQnA/docker_image_build/build.yaml +++ b/ChatQnA/docker_image_build/build.yaml @@ -114,18 +114,6 @@ services: context: GenAIComps dockerfile: comps/third_parties/vllm/src/Dockerfile.amd_gpu image: ${REGISTRY:-opea}/vllm-rocm:${TAG:-latest} - vllm: - build: - context: vllm - dockerfile: docker/Dockerfile.cpu - extends: chatqna - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} - vllm-gaudi: - build: - context: vllm-fork - dockerfile: Dockerfile.hpu - extends: chatqna - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} nginx: build: context: GenAIComps diff --git a/ChatQnA/kubernetes/helm/README.md b/ChatQnA/kubernetes/helm/README.md index 8ada19b070..5186fe3c8d 100644 --- a/ChatQnA/kubernetes/helm/README.md +++ b/ChatQnA/kubernetes/helm/README.md @@ -14,7 +14,7 @@ helm install chatqna oci://ghcr.io/opea-project/charts/chatqna --set global.HUG ``` export HFTOKEN="insert-your-huggingface-token-here" -helm install chatqna oci://ghcr.io/opea-project/charts/chatqna --set global.HUGGINGFACEHUB_API_TOKEN=${HFTOKEN} -f gaudi-vllm-values.yaml +helm install chatqna oci://ghcr.io/opea-project/charts/chatqna --set global.HUGGINGFACEHUB_API_TOKEN=${HFTOKEN} -f gaudi-values.yaml ``` ## Deploy variants of ChatQnA diff --git a/ChatQnA/kubernetes/helm/cpu-openeuler-values.yaml b/ChatQnA/kubernetes/helm/cpu-openeuler-values.yaml new file mode 100644 index 0000000000..5206d1abf9 --- /dev/null +++ b/ChatQnA/kubernetes/helm/cpu-openeuler-values.yaml @@ -0,0 +1,58 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. +# SPDX-License-Identifier: Apache-2.0 + +# This file is based on cpu-values.yaml and overrides image tags to 'latest-openeuler' +# for all enabled services to run on openEuler. + +# Overrides for the main chart image +image: + tag: latest-openeuler + +# Overrides from cpu-values.yaml +vllm: + image: + repository: openeuler/vllm-cpu + tag: 0.10.1-oe2403lts + LLM_MODEL_ID: meta-llama/Meta-Llama-3-8B-Instruct + + # Uncomment the following model specific settings for DeepSeek models + #VLLM_CPU_KVCACHE_SPACE: 40 + #resources: + # requests: + # memory: 60Gi # 40G for KV cache, and 20G for DeepSeek-R1-Distill-Qwen-7B, need to adjust it for other models + +# Overrides for subchart images +# Based on the default values in opea-project/GenAIInfra/helm-charts/chatqna/values.yaml, +# the following services are enabled by default. 
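+
+# Usage sketch (hypothetical; follows the helm install pattern shown in
+# ChatQnA/kubernetes/helm/README.md, so verify the chart reference and token for your cluster):
+#   export HFTOKEN="insert-your-huggingface-token-here"
+#   helm install chatqna oci://ghcr.io/opea-project/charts/chatqna \
+#     --set global.HUGGINGFACEHUB_API_TOKEN=${HFTOKEN} -f cpu-openeuler-values.yaml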
+ +# data-prep service +data-prep: + image: + tag: latest-openeuler + +# retriever-usvc service +retriever-usvc: + image: + tag: latest-openeuler + +# tei-rerank service +teirerank: + image: + repository: openeuler/text-embeddings-inference-cpu + tag: 1.7.0-oe2403lts + +# tei service +tei: + image: + repository: openeuler/text-embeddings-inference-cpu + tag: 1.7.0-oe2403lts + +# nginx service +nginx: + image: + tag: latest-openeuler + +# chatqna-ui service +chatqna-ui: + image: + tag: latest-openeuler diff --git a/ChatQnA/kubernetes/helm/faqgen-gaudi-tgi-values.yaml b/ChatQnA/kubernetes/helm/faqgen-gaudi-tgi-values.yaml index 88fca4ed55..99b7fb5c58 100644 --- a/ChatQnA/kubernetes/helm/faqgen-gaudi-tgi-values.yaml +++ b/ChatQnA/kubernetes/helm/faqgen-gaudi-tgi-values.yaml @@ -49,8 +49,8 @@ teirerank: OMPI_MCA_btl_vader_single_copy_mechanism: "none" MAX_WARMUP_SEQUENCE_LENGTH: "512" image: - repository: ghcr.io/huggingface/tei-gaudi - tag: 1.5.0 + repository: ghcr.io/huggingface/text-embeddings-inference + tag: hpu-1.7 resources: limits: habana.ai/gaudi: 1 diff --git a/ChatQnA/kubernetes/helm/faqgen-gaudi-values.yaml b/ChatQnA/kubernetes/helm/faqgen-gaudi-values.yaml index 7dd455e112..6e34ab4b09 100644 --- a/ChatQnA/kubernetes/helm/faqgen-gaudi-values.yaml +++ b/ChatQnA/kubernetes/helm/faqgen-gaudi-values.yaml @@ -42,8 +42,8 @@ teirerank: OMPI_MCA_btl_vader_single_copy_mechanism: "none" MAX_WARMUP_SEQUENCE_LENGTH: "512" image: - repository: ghcr.io/huggingface/tei-gaudi - tag: 1.5.0 + repository: ghcr.io/huggingface/text-embeddings-inference + tag: hpu-1.7 resources: limits: habana.ai/gaudi: 1 diff --git a/ChatQnA/kubernetes/helm/faqgen-rocm-tgi-values.yaml b/ChatQnA/kubernetes/helm/faqgen-rocm-tgi-values.yaml new file mode 100644 index 0000000000..19ca79f10a --- /dev/null +++ b/ChatQnA/kubernetes/helm/faqgen-rocm-tgi-values.yaml @@ -0,0 +1,52 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +CHATQNA_TYPE: "CHATQNA_FAQGEN" +llm-uservice: + enabled: true + image: + repository: opea/llm-faqgen + LLM_MODEL_ID: meta-llama/Meta-Llama-3-8B-Instruct + FAQGEN_BACKEND: "TGI" + service: + port: 80 +tgi: + enabled: true + accelDevice: "rocm" + image: + repository: ghcr.io/huggingface/text-generation-inference + tag: "3.0.0-rocm" + LLM_MODEL_ID: meta-llama/Meta-Llama-3-8B-Instruct + MAX_INPUT_LENGTH: "2048" + MAX_TOTAL_TOKENS: "4096" + USE_FLASH_ATTENTION: "true" + FLASH_ATTENTION_RECOMPUTE: "false" + PYTORCH_TUNABLEOP_ENABLED: "0" + HIP_VISIBLE_DEVICES: "0,1" + MAX_BATCH_SIZE: "4" + extraCmdArgs: [ "--num-shard","2" ] + resources: + limits: + amd.com/gpu: "2" + requests: + cpu: 1 + memory: 16Gi + securityContext: + readOnlyRootFilesystem: false + runAsNonRoot: false + runAsUser: 0 + capabilities: + add: + - SYS_PTRACE + readinessProbe: + initialDelaySeconds: 60 + periodSeconds: 5 + timeoutSeconds: 1 + failureThreshold: 120 + startupProbe: + initialDelaySeconds: 60 + periodSeconds: 5 + timeoutSeconds: 1 + failureThreshold: 120 +vllm: + enabled: false diff --git a/ChatQnA/kubernetes/helm/faqgen-rocm-values.yaml b/ChatQnA/kubernetes/helm/faqgen-rocm-values.yaml new file mode 100644 index 0000000000..e8941d8153 --- /dev/null +++ b/ChatQnA/kubernetes/helm/faqgen-rocm-values.yaml @@ -0,0 +1,45 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +CHATQNA_TYPE: "CHATQNA_FAQGEN" +llm-uservice: + enabled: true + image: + repository: opea/llm-faqgen + LLM_MODEL_ID: meta-llama/Meta-Llama-3-8B-Instruct + FAQGEN_BACKEND: "vLLM" + service: + port: 80 
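+
+# Backend selection: FAQGEN_BACKEND above is "vLLM", so tgi is disabled below and the ROCm
+# build of vLLM serves the FAQGen model; the TGI counterpart of this setup is
+# faqgen-rocm-tgi-values.yaml. To deploy, pass this file to helm install with
+# -f faqgen-rocm-values.yaml (a sketch that assumes the same install pattern as the other
+# values files in this directory).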
+tgi: + enabled: false +vllm: + enabled: true + accelDevice: "rocm" + image: + repository: opea/vllm-rocm + tag: latest + env: + HIP_VISIBLE_DEVICES: "0" + TENSOR_PARALLEL_SIZE: "1" + HF_HUB_DISABLE_PROGRESS_BARS: "1" + HF_HUB_ENABLE_HF_TRANSFER: "0" + VLLM_USE_TRITON_FLASH_ATTN: "0" + VLLM_WORKER_MULTIPROC_METHOD: "spawn" + PYTORCH_JIT: "0" + HF_HOME: "/data" + extraCmd: + command: [ "python3", "/workspace/api_server.py" ] + extraCmdArgs: [ "--swap-space", "16", + "--disable-log-requests", + "--dtype", "float16", + "--num-scheduler-steps", "1", + "--distributed-executor-backend", "mp" ] + resources: + limits: + amd.com/gpu: "1" + startupProbe: + failureThreshold: 180 + securityContext: + readOnlyRootFilesystem: false + runAsNonRoot: false + runAsUser: 0 diff --git a/ChatQnA/kubernetes/helm/gaudi-tgi-values.yaml b/ChatQnA/kubernetes/helm/gaudi-tgi-values.yaml index 027fecb3fd..c5fc0fa8f8 100644 --- a/ChatQnA/kubernetes/helm/gaudi-tgi-values.yaml +++ b/ChatQnA/kubernetes/helm/gaudi-tgi-values.yaml @@ -43,8 +43,8 @@ teirerank: OMPI_MCA_btl_vader_single_copy_mechanism: "none" MAX_WARMUP_SEQUENCE_LENGTH: "512" image: - repository: ghcr.io/huggingface/tei-gaudi - tag: 1.5.0 + repository: ghcr.io/huggingface/text-embeddings-inference + tag: hpu-1.7 resources: limits: habana.ai/gaudi: 1 @@ -60,8 +60,8 @@ teirerank: # OMPI_MCA_btl_vader_single_copy_mechanism: "none" # MAX_WARMUP_SEQUENCE_LENGTH: "512" # image: -# repository: ghcr.io/huggingface/tei-gaudi -# tag: 1.5.0 +# repository: ghcr.io/huggingface/text-embeddings-inference +# tag: hpu-1.7 # resources: # limits: # habana.ai/gaudi: 1 diff --git a/ChatQnA/kubernetes/helm/gaudi-values.yaml b/ChatQnA/kubernetes/helm/gaudi-values.yaml index 19471c0e43..36a1ee29de 100644 --- a/ChatQnA/kubernetes/helm/gaudi-values.yaml +++ b/ChatQnA/kubernetes/helm/gaudi-values.yaml @@ -37,8 +37,8 @@ teirerank: OMPI_MCA_btl_vader_single_copy_mechanism: "none" MAX_WARMUP_SEQUENCE_LENGTH: "512" image: - repository: ghcr.io/huggingface/tei-gaudi - tag: 1.5.0 + repository: ghcr.io/huggingface/text-embeddings-inference + tag: hpu-1.7 resources: limits: habana.ai/gaudi: 1 diff --git a/ChatQnA/kubernetes/helm/guardrails-gaudi-values.yaml b/ChatQnA/kubernetes/helm/guardrails-gaudi-values.yaml index 5c88e73d0f..bc2faef9a8 100644 --- a/ChatQnA/kubernetes/helm/guardrails-gaudi-values.yaml +++ b/ChatQnA/kubernetes/helm/guardrails-gaudi-values.yaml @@ -19,8 +19,8 @@ guardrails-usvc: # tei: # accelDevice: "gaudi" # image: -# repository: ghcr.io/huggingface/tei-gaudi -# tag: 1.5.0 +# repository: ghcr.io/huggingface/text-embeddings-inference +# tag: hpu-1.7 # resources: # limits: # habana.ai/gaudi: 1 @@ -32,8 +32,8 @@ teirerank: OMPI_MCA_btl_vader_single_copy_mechanism: "none" MAX_WARMUP_SEQUENCE_LENGTH: "512" image: - repository: ghcr.io/huggingface/tei-gaudi - tag: "1.5.0" + repository: ghcr.io/huggingface/text-embeddings-inference + tag: hpu-1.7 resources: limits: habana.ai/gaudi: 1 diff --git a/ChatQnA/kubernetes/helm/rocm-tgi-values.yaml b/ChatQnA/kubernetes/helm/rocm-tgi-values.yaml new file mode 100644 index 0000000000..1a76b460d3 --- /dev/null +++ b/ChatQnA/kubernetes/helm/rocm-tgi-values.yaml @@ -0,0 +1,47 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +# Accelerate inferencing in heaviest components to improve performance +# by overriding their subchart values + +tgi: + enabled: true + accelDevice: "rocm" + image: + repository: ghcr.io/huggingface/text-generation-inference + tag: "3.0.0-rocm" + LLM_MODEL_ID: 
meta-llama/Meta-Llama-3-8B-Instruct + MAX_INPUT_LENGTH: "2048" + MAX_TOTAL_TOKENS: "4096" + PYTORCH_TUNABLEOP_ENABLED: "0" + USE_FLASH_ATTENTION: "true" + FLASH_ATTENTION_RECOMPUTE: "true" + HIP_VISIBLE_DEVICES: "0,1" + MAX_BATCH_SIZE: "4" + extraCmdArgs: [ "--num-shard","2" ] + resources: + limits: + amd.com/gpu: "2" + requests: + cpu: 1 + memory: 16Gi + securityContext: + readOnlyRootFilesystem: false + runAsNonRoot: false + runAsUser: 0 + capabilities: + add: + - SYS_PTRACE + readinessProbe: + initialDelaySeconds: 60 + periodSeconds: 5 + timeoutSeconds: 1 + failureThreshold: 120 + startupProbe: + initialDelaySeconds: 60 + periodSeconds: 5 + timeoutSeconds: 1 + failureThreshold: 120 + +vllm: + enabled: false diff --git a/ChatQnA/kubernetes/helm/rocm-values.yaml b/ChatQnA/kubernetes/helm/rocm-values.yaml new file mode 100644 index 0000000000..4d637bd8c6 --- /dev/null +++ b/ChatQnA/kubernetes/helm/rocm-values.yaml @@ -0,0 +1,39 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +# Accelerate inferencing in heaviest components to improve performance +# by overriding their subchart values + +tgi: + enabled: false +vllm: + enabled: true + accelDevice: "rocm" + image: + repository: opea/vllm-rocm + tag: latest + env: + HIP_VISIBLE_DEVICES: "0" + TENSOR_PARALLEL_SIZE: "1" + HF_HUB_DISABLE_PROGRESS_BARS: "1" + HF_HUB_ENABLE_HF_TRANSFER: "0" + VLLM_USE_TRITON_FLASH_ATTN: "0" + VLLM_WORKER_MULTIPROC_METHOD: "spawn" + PYTORCH_JIT: "0" + HF_HOME: "/data" + extraCmd: + command: [ "python3", "/workspace/api_server.py" ] + extraCmdArgs: [ "--swap-space", "16", + "--disable-log-requests", + "--dtype", "float16", + "--num-scheduler-steps", "1", + "--distributed-executor-backend", "mp" ] + resources: + limits: + amd.com/gpu: "1" + startupProbe: + failureThreshold: 180 + securityContext: + readOnlyRootFilesystem: false + runAsNonRoot: false + runAsUser: 0 diff --git a/ChatQnA/tests/test_compose_faqgen_on_epyc.sh b/ChatQnA/tests/test_compose_faqgen_on_epyc.sh index 1571349095..c480fd1f2e 100644 --- a/ChatQnA/tests/test_compose_faqgen_on_epyc.sh +++ b/ChatQnA/tests/test_compose_faqgen_on_epyc.sh @@ -25,19 +25,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &>/dev/null - VLLM_REQ_FILE="requirements/cpu.txt" - if ! grep -q "^transformers" "$VLLM_REQ_FILE"; then - echo "Adding transformers<4.54.0 to $VLLM_REQ_FILE" - echo "transformers<4.54.0" >>"$VLLM_REQ_FILE" - fi - cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="chatqna chatqna-ui dataprep retriever llm-faqgen vllm nginx" + service_list="chatqna chatqna-ui dataprep retriever llm-faqgen nginx" docker compose -f build.yaml build ${service_list} --no-cache >${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -206,37 +196,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" 
- else - conda create -n ${conda_env_name} python=3.12 -y - fi - CONDA_ROOT=$(conda info --base) - source "${CONDA_ROOT}/etc/profile.d/conda.sh" - conda activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - # npm install && npm ci && npx playwright install --with-deps - npm install && npm ci && npx playwright install - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/amd/cpu/epyc docker compose -f compose_faqgen.yaml down @@ -264,10 +223,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_faqgen_on_gaudi.sh b/ChatQnA/tests/test_compose_faqgen_on_gaudi.sh index 58ab7526c2..08e718e1ca 100644 --- a/ChatQnA/tests/test_compose_faqgen_on_gaudi.sh +++ b/ChatQnA/tests/test_compose_faqgen_on_gaudi.sh @@ -23,12 +23,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork - VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0 - git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="chatqna chatqna-ui dataprep retriever llm-faqgen vllm-gaudi nginx" + service_list="chatqna chatqna-ui dataprep retriever llm-faqgen nginx" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -36,6 +33,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/hpu/gaudi + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env_faqgen.sh # Start Docker Containers @@ -187,34 +185,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/hpu/gaudi docker compose -f compose_faqgen.yaml down @@ -242,10 +212,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_faqgen_on_rocm.sh b/ChatQnA/tests/test_compose_faqgen_on_rocm.sh index 893807377f..e3248c7999 100644 --- a/ChatQnA/tests/test_compose_faqgen_on_rocm.sh +++ b/ChatQnA/tests/test_compose_faqgen_on_rocm.sh @@ -163,36 +163,6 @@ function validate_megaservice() { } -function validate_frontend() { - echo "[ TEST INFO ]: --------- frontend test started ---------" - cd "$WORKPATH"/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniconda3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - echo "[ TEST INFO ]: --------- conda env activated ---------" - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd "$WORKPATH"/docker_compose/amd/gpu/rocm docker compose -f compose_faqgen.yaml stop && docker compose rm -f @@ -220,10 +190,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_faqgen_on_xeon.sh b/ChatQnA/tests/test_compose_faqgen_on_xeon.sh index bb18e3db55..76270813a8 100644 --- a/ChatQnA/tests/test_compose_faqgen_on_xeon.sh +++ b/ChatQnA/tests/test_compose_faqgen_on_xeon.sh @@ -23,13 +23,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &> /dev/null && cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="chatqna chatqna-ui dataprep retriever llm-faqgen vllm nginx" + service_list="chatqna chatqna-ui dataprep retriever llm-faqgen nginx" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -198,34 +194,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" 
- else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/cpu/xeon docker compose -f compose_faqgen.yaml down @@ -253,10 +221,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_faqgen_tgi_on_epyc.sh b/ChatQnA/tests/test_compose_faqgen_tgi_on_epyc.sh index 75d86a4a6e..d9800d543e 100644 --- a/ChatQnA/tests/test_compose_faqgen_tgi_on_epyc.sh +++ b/ChatQnA/tests/test_compose_faqgen_tgi_on_epyc.sh @@ -25,16 +25,6 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &>/dev/null - VLLM_REQ_FILE="requirements/cpu.txt" - if ! grep -q "^transformers" "$VLLM_REQ_FILE"; then - echo "Adding transformers<4.54.0 to $VLLM_REQ_FILE" - echo "transformers<4.54.0" >>"$VLLM_REQ_FILE" - fi - cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." service_list="chatqna chatqna-ui dataprep retriever llm-faqgen nginx" @@ -206,37 +196,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - CONDA_ROOT=$(conda info --base) - source "${CONDA_ROOT}/etc/profile.d/conda.sh" - conda activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - # npm install && npm ci && npx playwright install --with-deps - npm install && npm ci && npx playwright install - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/amd/cpu/epyc docker compose -f compose_faqgen_tgi.yaml down @@ -264,10 +223,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_faqgen_tgi_on_gaudi.sh b/ChatQnA/tests/test_compose_faqgen_tgi_on_gaudi.sh index e9868e0052..b346d8018d 100644 --- a/ChatQnA/tests/test_compose_faqgen_tgi_on_gaudi.sh +++ b/ChatQnA/tests/test_compose_faqgen_tgi_on_gaudi.sh @@ -34,6 +34,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/hpu/gaudi export FAQGen_COMPONENT_NAME="OpeaFaqGenTgi" + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env_faqgen.sh # Start Docker Containers @@ -185,34 +186,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/hpu/gaudi docker compose -f compose_faqgen_tgi.yaml down @@ -240,10 +213,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_faqgen_tgi_on_xeon.sh b/ChatQnA/tests/test_compose_faqgen_tgi_on_xeon.sh index d0b823f204..ca3993b8be 100644 --- a/ChatQnA/tests/test_compose_faqgen_tgi_on_xeon.sh +++ b/ChatQnA/tests/test_compose_faqgen_tgi_on_xeon.sh @@ -198,34 +198,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/cpu/xeon docker compose -f compose_faqgen_tgi.yaml down @@ -253,10 +225,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_faqgen_vllm_on_rocm.sh b/ChatQnA/tests/test_compose_faqgen_vllm_on_rocm.sh index f344f0030a..8c24185f31 100644 --- a/ChatQnA/tests/test_compose_faqgen_vllm_on_rocm.sh +++ b/ChatQnA/tests/test_compose_faqgen_vllm_on_rocm.sh @@ -138,35 +138,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniconda3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/amd/gpu/rocm docker compose -f compose_vllm.yaml down @@ -194,10 +165,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_guardrails_on_gaudi.sh b/ChatQnA/tests/test_compose_guardrails_on_gaudi.sh index da8bc25b48..09bfffabe1 100644 --- a/ChatQnA/tests/test_compose_guardrails_on_gaudi.sh +++ b/ChatQnA/tests/test_compose_guardrails_on_gaudi.sh @@ -23,12 +23,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork - VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0 - git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="chatqna chatqna-ui dataprep retriever vllm-gaudi guardrails nginx" + service_list="chatqna chatqna-ui dataprep retriever guardrails nginx" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -154,34 +151,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" 
- else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/hpu/gaudi docker compose -f compose_guardrails.yaml down @@ -209,10 +178,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_mariadb_on_xeon.sh b/ChatQnA/tests/test_compose_mariadb_on_xeon.sh index 4d834e2abc..3c369357e4 100644 --- a/ChatQnA/tests/test_compose_mariadb_on_xeon.sh +++ b/ChatQnA/tests/test_compose_mariadb_on_xeon.sh @@ -23,15 +23,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &> /dev/null - # make sure NOT change the pwd - cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="chatqna chatqna-ui dataprep retriever vllm nginx" + service_list="chatqna chatqna-ui dataprep retriever nginx" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -40,6 +34,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/cpu/xeon export MARIADB_PASSWORD="test" + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env_mariadb.sh # Start Docker Containers diff --git a/ChatQnA/tests/test_compose_milvus_on_epyc.sh b/ChatQnA/tests/test_compose_milvus_on_epyc.sh index 851f6cb33d..efba619f58 100644 --- a/ChatQnA/tests/test_compose_milvus_on_epyc.sh +++ b/ChatQnA/tests/test_compose_milvus_on_epyc.sh @@ -26,19 +26,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &>/dev/null - VLLM_REQ_FILE="requirements/cpu.txt" - if ! grep -q "^transformers" "$VLLM_REQ_FILE"; then - echo "Adding transformers<4.54.0 to $VLLM_REQ_FILE" - echo "transformers<4.54.0" >>"$VLLM_REQ_FILE" - fi - cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
- service_list="chatqna chatqna-ui dataprep retriever vllm nginx" + service_list="chatqna chatqna-ui dataprep retriever nginx" docker compose -f build.yaml build ${service_list} --no-cache >${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -181,39 +171,6 @@ function validate_megaservice() { } -function validate_frontend() { - echo "[ TEST INFO ]: --------- frontend test started ---------" - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - CONDA_ROOT=$(conda info --base) - source "${CONDA_ROOT}/etc/profile.d/conda.sh" - conda activate ${conda_env_name} - echo "[ TEST INFO ]: --------- conda env activated ---------" - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - # npm install && npm ci && npx playwright install --with-deps - npm install && npm ci && npx playwright install - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { echo "In stop docker" echo $WORKPATH @@ -243,10 +200,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_milvus_on_xeon.sh b/ChatQnA/tests/test_compose_milvus_on_xeon.sh index 2bd97cb05a..338c5515dc 100644 --- a/ChatQnA/tests/test_compose_milvus_on_xeon.sh +++ b/ChatQnA/tests/test_compose_milvus_on_xeon.sh @@ -24,15 +24,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &> /dev/null - # make sure NOT change the pwd - cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="chatqna chatqna-ui dataprep retriever vllm nginx" + service_list="chatqna chatqna-ui dataprep retriever nginx" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -40,6 +34,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/cpu/xeon/ export LOGFLAG=true + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # Start Docker Containers @@ -175,36 +170,6 @@ function validate_megaservice() { } -function validate_frontend() { - echo "[ TEST INFO ]: --------- frontend test started ---------" - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" 
- else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - echo "[ TEST INFO ]: --------- conda env activated ---------" - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { echo "In stop docker" echo $WORKPATH @@ -234,10 +199,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_on_epyc.sh b/ChatQnA/tests/test_compose_on_epyc.sh index 851f6cb33d..efba619f58 100644 --- a/ChatQnA/tests/test_compose_on_epyc.sh +++ b/ChatQnA/tests/test_compose_on_epyc.sh @@ -26,19 +26,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &>/dev/null - VLLM_REQ_FILE="requirements/cpu.txt" - if ! grep -q "^transformers" "$VLLM_REQ_FILE"; then - echo "Adding transformers<4.54.0 to $VLLM_REQ_FILE" - echo "transformers<4.54.0" >>"$VLLM_REQ_FILE" - fi - cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="chatqna chatqna-ui dataprep retriever vllm nginx" + service_list="chatqna chatqna-ui dataprep retriever nginx" docker compose -f build.yaml build ${service_list} --no-cache >${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -181,39 +171,6 @@ function validate_megaservice() { } -function validate_frontend() { - echo "[ TEST INFO ]: --------- frontend test started ---------" - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - CONDA_ROOT=$(conda info --base) - source "${CONDA_ROOT}/etc/profile.d/conda.sh" - conda activate ${conda_env_name} - echo "[ TEST INFO ]: --------- conda env activated ---------" - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - # npm install && npm ci && npx playwright install --with-deps - npm install && npm ci && npx playwright install - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { echo "In stop docker" echo $WORKPATH @@ -243,10 +200,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_on_gaudi.sh b/ChatQnA/tests/test_compose_on_gaudi.sh index 221f59c6e5..ace8e10b41 100644 --- a/ChatQnA/tests/test_compose_on_gaudi.sh +++ b/ChatQnA/tests/test_compose_on_gaudi.sh @@ -23,12 +23,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork - VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0 - git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="chatqna chatqna-ui dataprep retriever vllm-gaudi nginx" + service_list="chatqna chatqna-ui dataprep retriever nginx" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -133,36 +130,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - export no_proxy="localhost,127.0.0.1,$ip_address" - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/hpu/gaudi docker compose -f compose.yaml -f compose.telemetry.yaml down @@ -190,10 +157,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_on_rocm.sh b/ChatQnA/tests/test_compose_on_rocm.sh index 5e31ea9969..63d978b92b 100644 --- a/ChatQnA/tests/test_compose_on_rocm.sh +++ b/ChatQnA/tests/test_compose_on_rocm.sh @@ -148,36 +148,6 @@ function validate_megaservice() { } -function validate_frontend() { - echo "[ TEST INFO ]: --------- frontend test started ---------" - cd "$WORKPATH"/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniconda3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" 
- else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - echo "[ TEST INFO ]: --------- conda env activated ---------" - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd "$WORKPATH"/docker_compose/amd/gpu/rocm docker compose stop && docker compose rm -f @@ -205,10 +175,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_on_xeon.sh b/ChatQnA/tests/test_compose_on_xeon.sh index 965ddb34dd..a241e4eeff 100644 --- a/ChatQnA/tests/test_compose_on_xeon.sh +++ b/ChatQnA/tests/test_compose_on_xeon.sh @@ -23,15 +23,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &> /dev/null - # make sure NOT change the pwd - cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="chatqna chatqna-ui dataprep retriever vllm nginx" + service_list="chatqna chatqna-ui dataprep retriever nginx" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -39,7 +33,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/cpu/xeon - + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # Start Docker Containers @@ -132,35 +126,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/cpu/xeon docker compose -f compose.yaml -f compose.telemetry.yaml down @@ -188,10 +153,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_openeuler_on_xeon.sh b/ChatQnA/tests/test_compose_openeuler_on_xeon.sh index 5f641f5d62..38c275dd9c 100644 --- a/ChatQnA/tests/test_compose_openeuler_on_xeon.sh +++ b/ChatQnA/tests/test_compose_openeuler_on_xeon.sh @@ -33,7 +33,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/cpu/xeon - + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # Start Docker Containers @@ -126,36 +126,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - - echo "[TEST INFO]: Preparing frontend test using Docker..." - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - echo "[TEST INFO]: Running frontend tests in Docker..." - exit_status=0 - - docker run --rm \ - --network="host" \ - -v $PWD:/work \ - -w /work \ - mcr.microsoft.com/playwright:v1.40.0-focal \ - /bin/bash -c " - npm install && - npm ci && - npx playwright install && - npx playwright test - " || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/cpu/xeon docker compose -f compose_openeuler.yaml -f compose.telemetry.yaml down @@ -183,10 +153,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_opengauss_on_xeon.sh b/ChatQnA/tests/test_compose_opengauss_on_xeon.sh new file mode 100644 index 0000000000..cda5c20b03 --- /dev/null +++ b/ChatQnA/tests/test_compose_opengauss_on_xeon.sh @@ -0,0 +1,215 @@ +#!/bin/bash +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +set -xe +IMAGE_REPO=${IMAGE_REPO:-"opea"} +IMAGE_TAG=${IMAGE_TAG:-"latest"} +echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" +echo "TAG=IMAGE_TAG=${IMAGE_TAG}" +export REGISTRY=${IMAGE_REPO} +export TAG=${IMAGE_TAG} +export MODEL_CACHE=${model_cache:-"./data"} + +WORKPATH=$(dirname "$PWD") +LOG_PATH="$WORKPATH/tests" +ip_address=$(hostname -I | awk '{print $1}') +export host_ip=$(hostname -I | awk '{print $1}') + +function build_docker_images() { + opea_branch=${opea_branch:-"main"} + cd $WORKPATH/docker_image_build + git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git + pushd GenAIComps + echo "GenAIComps test commit is $(git rev-parse HEAD)" + docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . + popd && sleep 1s + + echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
+ service_list="chatqna chatqna-ui dataprep retriever nginx" + docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log + + docker images && sleep 1s +} +function start_services() { + cd $WORKPATH/docker_compose/intel/cpu/xeon/ + export LOGFLAG=true + export no_proxy="localhost,127.0.0.1,$ip_address" + export GS_USER="gaussdb" + export GS_PASSWORD="openGauss@123" + export GS_DB="postgres" + export GS_CONNECTION_STRING="opengauss+psycopg2://${GS_USER}:${GS_PASSWORD}@$ip_address:5432/${GS_DB}" + + source set_env.sh + + # Start Docker Containers + docker compose -f compose_opengauss.yaml up -d --quiet-pull > ${LOG_PATH}/start_services_with_compose.log + + n=0 + until [[ "$n" -ge 100 ]]; do + docker logs vllm-service > ${LOG_PATH}/vllm_service_start.log 2>&1 + if grep -q complete ${LOG_PATH}/vllm_service_start.log; then + break + fi + sleep 5s + n=$((n+1)) + done +} + +function validate_service() { + local URL="$1" + local EXPECTED_RESULT="$2" + local SERVICE_NAME="$3" + local DOCKER_NAME="$4" + local INPUT_DATA="$5" + + if [[ $SERVICE_NAME == *"dataprep_upload_file"* ]]; then + cd $LOG_PATH + HTTP_RESPONSE=$(curl --silent --write-out "HTTPSTATUS:%{http_code}" -X POST -F 'files=@./dataprep_file.txt' -H 'Content-Type: multipart/form-data' "$URL") + elif [[ $SERVICE_NAME == *"dataprep_del"* ]]; then + HTTP_RESPONSE=$(curl --silent --write-out "HTTPSTATUS:%{http_code}" -X POST -d '{"file_path": "all"}' -H 'Content-Type: application/json' "$URL") + else + HTTP_RESPONSE=$(curl --silent --write-out "HTTPSTATUS:%{http_code}" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") + fi + HTTP_STATUS=$(echo $HTTP_RESPONSE | tr -d '\n' | sed -e 's/.*HTTPSTATUS://') + RESPONSE_BODY=$(echo $HTTP_RESPONSE | sed -e 's/HTTPSTATUS\:.*//g') + + docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log + + + # check response status + if [ "$HTTP_STATUS" -ne "200" ]; then + echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS" + exit 1 + else + echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." + fi + echo "Response" + echo $RESPONSE_BODY + echo "Expected Result" + echo $EXPECTED_RESULT + # check response body + if [[ "$RESPONSE_BODY" != *"$EXPECTED_RESULT"* ]]; then + echo "[ $SERVICE_NAME ] Content does not match the expected result: $RESPONSE_BODY" + exit 1 + else + echo "[ $SERVICE_NAME ] Content is as expected." + fi + + sleep 1s +} + +function validate_microservices() { + # Check if the microservices are running correctly. + + # tei for embedding service + validate_service \ + "${ip_address}:6006/embed" \ + "[[" \ + "tei-embedding" \ + "tei-embedding-server" \ + '{"inputs":"What is Deep Learning?"}' + + sleep 1m # retrieval can't curl as expected, try to wait for more time + + # test /v1/dataprep/ingest upload file + echo "Deep learning is a subset of machine learning that utilizes neural networks with multiple layers to analyze various levels of abstract data representations. It enables computers to identify patterns and make decisions with minimal human intervention by learning from large amounts of data." 
> $LOG_PATH/dataprep_file.txt
+    validate_service \
+        "http://${ip_address}:6007/v1/dataprep/ingest" \
+        "Data preparation succeeded" \
+        "dataprep_upload_file" \
+        "dataprep-opengauss-server"
+
+    # test /v1/dataprep/delete
+    validate_service \
+        "http://${ip_address}:6007/v1/dataprep/delete" \
+        '{"status":true}' \
+        "dataprep_del" \
+        "dataprep-opengauss-server"
+
+    # test /v1/dataprep/delete
+    validate_service \
+        "http://${ip_address}:6007/v1/dataprep/delete" \
+        '{"status":true}' \
+        "dataprep_del" \
+        "dataprep-opengauss-server"
+
+
+    # retrieval microservice
+    test_embedding=$(python3 -c "import random; embedding = [random.uniform(-1, 1) for _ in range(768)]; print(embedding)")
+    validate_service \
+        "${ip_address}:7000/v1/retrieval" \
+        " " \
+        "retrieval" \
+        "retriever-opengauss-server" \
+        "{\"text\":\"What is the revenue of Nike in 2023?\",\"embedding\":${test_embedding}}"
+
+    # tei for rerank microservice
+    echo "Validating reranking service"
+    validate_service \
+        "${ip_address}:8808/rerank" \
+        '{"index":1,"score":' \
+        "tei-rerank" \
+        "tei-reranking-server" \
+        '{"query":"What is Deep Learning?", "texts": ["Deep Learning is not...", "Deep learning is..."]}'
+
+
+    # vllm for llm service
+    echo "Validating llm service"
+    validate_service \
+        "${ip_address}:9009/v1/chat/completions" \
+        "content" \
+        "vllm-llm" \
+        "vllm-service" \
+        '{"model": "meta-llama/Meta-Llama-3-8B-Instruct", "messages": [{"role": "user", "content": "What is Deep Learning?"}], "max_tokens": 17}'
+}
+
+function validate_megaservice() {
+    # Curl the Mega Service
+    validate_service \
+        "${ip_address}:8888/v1/chatqna" \
+        "Nike" \
+        "chatqna-megaservice" \
+        "chatqna-xeon-backend-server" \
+        '{"messages": "What is the revenue of Nike in 2023?"}'
+
+}
+
+function stop_docker() {
+    echo "In stop docker"
+    echo $WORKPATH
+    cd $WORKPATH/docker_compose/intel/cpu/xeon/
+    docker compose -f compose_opengauss.yaml down
+}
+
+function main() {
+
+    echo "::group::stop_docker"
+    stop_docker
+    echo "::endgroup::"
+
+    echo "::group::build_docker_images"
+    if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi
+    echo "::endgroup::"
+
+    echo "::group::start_services"
+    start_services
+    echo "::endgroup::"
+
+    echo "::group::validate_microservices"
+    validate_microservices
+    echo "::endgroup::"
+
+    echo "::group::validate_megaservice"
+    validate_megaservice
+    echo "::endgroup::"
+
+    echo "::group::stop_docker"
+    stop_docker
+    echo "::endgroup::"
+
+    docker system prune -f
+
+}
+
+main
diff --git a/ChatQnA/tests/test_compose_pinecone_on_epyc.sh b/ChatQnA/tests/test_compose_pinecone_on_epyc.sh
index 02bddd1450..10bb819ca5 100755
--- a/ChatQnA/tests/test_compose_pinecone_on_epyc.sh
+++ b/ChatQnA/tests/test_compose_pinecone_on_epyc.sh
@@ -26,19 +26,9 @@ function build_docker_images() {
     echo "GenAIComps test commit is $(git rev-parse HEAD)"
     docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile .
     popd && sleep 1s
-    git clone https://github.com/vllm-project/vllm.git && cd vllm
-    VLLM_VER=v0.10.0
-    echo "Check out vLLM tag ${VLLM_VER}"
-    git checkout ${VLLM_VER} &>/dev/null
-    VLLM_REQ_FILE="requirements/cpu.txt"
-    if ! grep -q "^transformers" "$VLLM_REQ_FILE"; then
-        echo "Adding transformers<4.54.0 to $VLLM_REQ_FILE"
-        echo "transformers<4.54.0" >>"$VLLM_REQ_FILE"
-    fi
-    cd ../
 
     echo "Build all the images with --no-cache, check docker_image_build.log for details..."
- service_list="chatqna chatqna-ui dataprep retriever vllm nginx" + service_list="chatqna chatqna-ui dataprep retriever nginx" docker compose -f build.yaml build ${service_list} --no-cache >${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -176,39 +166,6 @@ function validate_megaservice() { } -function validate_frontend() { - echo "[ TEST INFO ]: --------- frontend test started ---------" - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - CONDA_ROOT=$(conda info --base) - source "${CONDA_ROOT}/etc/profile.d/conda.sh" - conda activate ${conda_env_name} - echo "[ TEST INFO ]: --------- conda env activated ---------" - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - # npm install && npm ci && npx playwright install --with-deps - npm install && npm ci && npx playwright install - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { echo "In stop docker" echo $WORKPATH diff --git a/ChatQnA/tests/test_compose_pinecone_on_xeon.sh b/ChatQnA/tests/test_compose_pinecone_on_xeon.sh index 64c8efc7df..f5efee6c80 100755 --- a/ChatQnA/tests/test_compose_pinecone_on_xeon.sh +++ b/ChatQnA/tests/test_compose_pinecone_on_xeon.sh @@ -24,15 +24,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &> /dev/null - # Not change the pwd - cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="chatqna chatqna-ui dataprep retriever vllm nginx" + service_list="chatqna chatqna-ui dataprep retriever nginx" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -174,36 +168,6 @@ function validate_megaservice() { } -function validate_frontend() { - echo "[ TEST INFO ]: --------- frontend test started ---------" - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - echo "[ TEST INFO ]: --------- conda env activated ---------" - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { echo "In stop docker" echo $WORKPATH diff --git a/ChatQnA/tests/test_compose_qdrant_on_epyc.sh b/ChatQnA/tests/test_compose_qdrant_on_epyc.sh index 1489a346c7..e93983ec31 100644 --- a/ChatQnA/tests/test_compose_qdrant_on_epyc.sh +++ b/ChatQnA/tests/test_compose_qdrant_on_epyc.sh @@ -24,19 +24,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &>/dev/null - VLLM_REQ_FILE="requirements/cpu.txt" - if ! grep -q "^transformers" "$VLLM_REQ_FILE"; then - echo "Adding transformers<4.54.0 to $VLLM_REQ_FILE" - echo "transformers<4.54.0" >>"$VLLM_REQ_FILE" - fi - cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="chatqna chatqna-ui dataprep retriever vllm nginx" + service_list="chatqna chatqna-ui dataprep retriever nginx" docker compose -f build.yaml build ${service_list} --no-cache >${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -167,36 +157,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - CONDA_ROOT=$(conda info --base) - source "${CONDA_ROOT}/etc/profile.d/conda.sh" - conda activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - # npm install && npm ci && npx playwright install --with-deps - npm install && npm ci && npx playwright install - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/amd/cpu/epyc docker compose -f compose_qdrant.yaml down @@ -224,10 +184,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_qdrant_on_xeon.sh b/ChatQnA/tests/test_compose_qdrant_on_xeon.sh index c7a17aac49..2a522fa7a8 100644 --- a/ChatQnA/tests/test_compose_qdrant_on_xeon.sh +++ b/ChatQnA/tests/test_compose_qdrant_on_xeon.sh @@ -23,15 +23,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &> /dev/null - # Not change the pwd - cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
- service_list="chatqna chatqna-ui dataprep retriever vllm nginx" + service_list="chatqna chatqna-ui dataprep retriever nginx" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -39,7 +33,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/cpu/xeon - + export no_proxy="localhost,127.0.0.1,$ip_address" export INDEX_NAME="rag-qdrant" source set_env.sh @@ -159,33 +153,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/cpu/xeon docker compose -f compose_qdrant.yaml down @@ -213,10 +180,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_tgi_on_epyc.sh b/ChatQnA/tests/test_compose_tgi_on_epyc.sh index 81cce137e9..98efb16223 100644 --- a/ChatQnA/tests/test_compose_tgi_on_epyc.sh +++ b/ChatQnA/tests/test_compose_tgi_on_epyc.sh @@ -178,39 +178,6 @@ function validate_megaservice() { } -function validate_frontend() { - echo "[ TEST INFO ]: --------- frontend test started ---------" - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - CONDA_ROOT=$(conda info --base) - source "${CONDA_ROOT}/etc/profile.d/conda.sh" - conda activate ${conda_env_name} - echo "[ TEST INFO ]: --------- conda env activated ---------" - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - # npm install && npm ci && npx playwright install --with-deps - npm install && npm ci && npx playwright install - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/amd/cpu/epyc docker compose -f compose_tgi.yaml -f compose_tgi.telemetry.yaml down @@ -238,10 +205,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_tgi_on_gaudi.sh b/ChatQnA/tests/test_compose_tgi_on_gaudi.sh index 356914ea1c..eb79b34440 100644 --- a/ChatQnA/tests/test_compose_tgi_on_gaudi.sh +++ b/ChatQnA/tests/test_compose_tgi_on_gaudi.sh @@ -35,6 +35,7 @@ function start_services() { export NON_INTERACTIVE=true export host_ip=${ip_address} export telemetry=yes + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # Start Docker Containers @@ -172,36 +173,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - export no_proxy="localhost,127.0.0.1,$ip_address" - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/hpu/gaudi docker compose -f compose_tgi.yaml -f compose_tgi.telemetry.yaml down @@ -229,10 +200,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_tgi_on_xeon.sh b/ChatQnA/tests/test_compose_tgi_on_xeon.sh index b2a56091a9..f3c1e8bffd 100644 --- a/ChatQnA/tests/test_compose_tgi_on_xeon.sh +++ b/ChatQnA/tests/test_compose_tgi_on_xeon.sh @@ -32,7 +32,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/cpu/xeon - + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # Start Docker Containers @@ -170,36 +170,6 @@ function validate_megaservice() { } -function validate_frontend() { - echo "[ TEST INFO ]: --------- frontend test started ---------" - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - echo "[ TEST INFO ]: --------- conda env activated ---------" - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/cpu/xeon docker compose -f compose_tgi.yaml -f compose_tgi.telemetry.yaml down @@ -227,10 +197,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_vllm_on_rocm.sh b/ChatQnA/tests/test_compose_vllm_on_rocm.sh index 9f61c05b89..d0e856960f 100644 --- a/ChatQnA/tests/test_compose_vllm_on_rocm.sh +++ b/ChatQnA/tests/test_compose_vllm_on_rocm.sh @@ -129,35 +129,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniconda3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/amd/gpu/rocm docker compose -f compose_vllm.yaml down @@ -185,10 +156,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_without_rerank_on_epyc.sh b/ChatQnA/tests/test_compose_without_rerank_on_epyc.sh index 06f96f9290..1f14c10d10 100644 --- a/ChatQnA/tests/test_compose_without_rerank_on_epyc.sh +++ b/ChatQnA/tests/test_compose_without_rerank_on_epyc.sh @@ -24,19 +24,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &>/dev/null - VLLM_REQ_FILE="requirements/cpu.txt" - if ! grep -q "^transformers" "$VLLM_REQ_FILE"; then - echo "Adding transformers<4.54.0 to $VLLM_REQ_FILE" - echo "transformers<4.54.0" >>"$VLLM_REQ_FILE" - fi - cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
- service_list="chatqna chatqna-ui dataprep retriever vllm nginx" + service_list="chatqna chatqna-ui dataprep retriever nginx" docker compose -f build.yaml build ${service_list} --no-cache >${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -176,39 +166,6 @@ function validate_megaservice() { } -function validate_frontend() { - echo "[ TEST INFO ]: --------- frontend test started ---------" - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - CONDA_ROOT=$(conda info --base) - source "${CONDA_ROOT}/etc/profile.d/conda.sh" - conda activate ${conda_env_name} - echo "[ TEST INFO ]: --------- conda env activated ---------" - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - # npm install && npm ci && npx playwright install --with-deps - npm install && npm ci && npx playwright install - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/amd/cpu/epyc/ docker compose -f compose_without_rerank.yaml down @@ -236,10 +193,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_without_rerank_on_gaudi.sh b/ChatQnA/tests/test_compose_without_rerank_on_gaudi.sh index b6fb222b39..62cbe30d3e 100644 --- a/ChatQnA/tests/test_compose_without_rerank_on_gaudi.sh +++ b/ChatQnA/tests/test_compose_without_rerank_on_gaudi.sh @@ -23,12 +23,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork - VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0 - git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="chatqna chatqna-ui dataprep retriever vllm-gaudi nginx" + service_list="chatqna chatqna-ui dataprep retriever nginx" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -166,36 +163,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - export no_proxy="localhost,127.0.0.1,$ip_address" - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/hpu/gaudi docker compose -f compose_without_rerank.yaml down @@ -223,10 +190,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_compose_without_rerank_on_xeon.sh b/ChatQnA/tests/test_compose_without_rerank_on_xeon.sh index f236a8ab76..7e2157cee7 100644 --- a/ChatQnA/tests/test_compose_without_rerank_on_xeon.sh +++ b/ChatQnA/tests/test_compose_without_rerank_on_xeon.sh @@ -23,16 +23,9 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &> /dev/null - # Not change the pwd - cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="chatqna chatqna-ui dataprep retriever vllm nginx" + service_list="chatqna chatqna-ui dataprep retriever nginx" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -40,7 +33,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/cpu/xeon - + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # Start Docker Containers @@ -169,36 +162,6 @@ function validate_megaservice() { } -function validate_frontend() { - echo "[ TEST INFO ]: --------- frontend test started ---------" - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - echo "[ TEST INFO ]: --------- conda env activated ---------" - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/cpu/xeon/ docker compose -f compose_without_rerank.yaml down @@ -226,10 +189,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/ChatQnA/tests/test_ui_on_xeon.sh b/ChatQnA/tests/test_ui_on_xeon.sh new file mode 100644 index 0000000000..5c3eb88d3f --- /dev/null +++ b/ChatQnA/tests/test_ui_on_xeon.sh @@ -0,0 +1,79 @@ +#!/bin/bash +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +set -xe +IMAGE_REPO=${IMAGE_REPO:-"opea"} +IMAGE_TAG=${IMAGE_TAG:-"latest"} +echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" +echo "TAG=IMAGE_TAG=${IMAGE_TAG}" +export REGISTRY=${IMAGE_REPO} +export TAG=${IMAGE_TAG} +export MODEL_CACHE=${model_cache:-"./data"} + +WORKPATH=$(dirname "$PWD") +LOG_PATH="$WORKPATH/tests" +ip_address=$(hostname -I | awk '{print $1}') + +function build_docker_images() { + opea_branch=${opea_branch:-"main"} + cd $WORKPATH/docker_image_build + git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git + pushd GenAIComps + echo "GenAIComps test commit is $(git rev-parse HEAD)" + docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . + popd && sleep 1s + + echo "Build all the images with --no-cache, check docker_image_build.log for details..." + service_list="chatqna chatqna-ui dataprep retriever nginx" + docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log + + docker images && sleep 1s +} + +function start_services() { + cd $WORKPATH/docker_compose/intel/cpu/xeon + + source set_env.sh + + # Start Docker Containers + docker compose -f compose.yaml -f compose.telemetry.yaml up -d --quiet-pull > ${LOG_PATH}/start_services_with_compose.log + n=0 + until [[ "$n" -ge 100 ]]; do + docker logs vllm-service > ${LOG_PATH}/vllm_service_start.log 2>&1 + if grep -q complete ${LOG_PATH}/vllm_service_start.log; then + break + fi + sleep 5s + n=$((n+1)) + done +} + +function stop_docker() { + cd $WORKPATH/docker_compose/intel/cpu/xeon + docker compose -f compose.yaml -f compose.telemetry.yaml down +} + +function main() { + + echo "::group::stop_docker" + stop_docker + echo "::endgroup::" + + echo "::group::build_docker_images" + if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi + echo "::endgroup::" + + echo "::group::start_services" + start_services + echo "::endgroup::" + + echo "::group::stop_docker" + stop_docker + echo "::endgroup::" + + docker system prune -f + +} + +main diff --git a/ChatQnA/ui/docker/Dockerfile.openEuler b/ChatQnA/ui/docker/Dockerfile.openEuler index cb594a33bb..b61654e440 100644 --- a/ChatQnA/ui/docker/Dockerfile.openEuler +++ b/ChatQnA/ui/docker/Dockerfile.openEuler @@ -2,7 +2,7 @@ # SPDX-License-Identifier: Apache-2.0 # Use node 20.11.1 as the base image -FROM openeuler/node:20.11.1-oe2403lts +FROM openeuler/node:20.11.1-oe2403lts@sha256:25c790f93c2243b361919620c069812319f614fd697e32e433402ae706a19ffd # Update package manager and install Git RUN yum update -y && \ diff --git a/ChatQnA/ui/docker/Dockerfile.react.openEuler b/ChatQnA/ui/docker/Dockerfile.react.openEuler 
index edd8a21bca..3a89471fda 100644 --- a/ChatQnA/ui/docker/Dockerfile.react.openEuler +++ b/ChatQnA/ui/docker/Dockerfile.react.openEuler @@ -2,13 +2,13 @@ # SPDX-License-Identifier: Apache-2.0 # Use node 20.11.1 as the base image -FROM openeuler/node:20.11.1-oe2403lts as vite-app +FROM openeuler/node:20.11.1-oe2403lts@sha256:25c790f93c2243b361919620c069812319f614fd697e32e433402ae706a19ffd as vite-app COPY react /usr/app/react WORKDIR /usr/app/react - -RUN ["npm", "install"] +RUN ["npm", "install", "--package-lock-only"] +RUN ["npm", "ci"] RUN ["npm", "run", "build"] diff --git a/ChatQnA/ui/svelte/package.json b/ChatQnA/ui/svelte/package.json index eaa981570a..d62d64712b 100644 --- a/ChatQnA/ui/svelte/package.json +++ b/ChatQnA/ui/svelte/package.json @@ -18,7 +18,7 @@ "@fortawesome/free-solid-svg-icons": "6.2.0", "@playwright/test": "^1.45.2", "@sveltejs/adapter-auto": "^3.0.0", - "@sveltejs/kit": "2.0.0", + "@sveltejs/kit": "2.20.6", "@sveltejs/vite-plugin-svelte": "^3.0.0", "@tailwindcss/typography": "0.5.7", "@types/debug": "4.1.7", diff --git a/ChatQnA/ui/svelte/src/lib/network/chat/Network.ts b/ChatQnA/ui/svelte/src/lib/network/chat/Network.ts index 060c5a5ffb..f7fb57c9b3 100644 --- a/ChatQnA/ui/svelte/src/lib/network/chat/Network.ts +++ b/ChatQnA/ui/svelte/src/lib/network/chat/Network.ts @@ -18,7 +18,7 @@ import { SSE } from "sse.js"; const CHAT_BASE_URL = env.CHAT_BASE_URL; const MODEL_ID = env.MODEL_ID; -export async function fetchTextStream(query: string) { +export async function fetchTextStream(query: object) { let payload = {}; let url = ""; let modelId = "meta-llama/Meta-Llama-3-8B-Instruct"; diff --git a/ChatQnA/ui/svelte/src/routes/+page.svelte b/ChatQnA/ui/svelte/src/routes/+page.svelte index bcd0b8b708..3d7f6afadf 100644 --- a/ChatQnA/ui/svelte/src/routes/+page.svelte +++ b/ChatQnA/ui/svelte/src/routes/+page.svelte @@ -102,7 +102,7 @@ return decoded; } - const callTextStream = async (query: string, startSendTime: number) => { + const callTextStream = async (query: object, startSendTime: number) => { try { const eventSource = await fetchTextStream(query); eventSource.addEventListener("error", (e: any) => { @@ -179,6 +179,22 @@ } }; + function mapRole(r: number): "user" | "assistant" | "system" { + if (r === 1) return "user"; + if (r === 0) return "assistant"; + return "system"; + } + + function multiMessages( + history: any[] + ): { role: "user" | "assistant" | "system"; content: string }[] { + return history.map((m) => ({ + role: mapRole(m.role), + content: + typeof m.content === "string" ? m.content : String(m.content ?? ""), + })); + } + const handleTextSubmit = async () => { loading = true; const newMessage = { @@ -192,7 +208,7 @@ storeMessages(); query = ""; - await callTextStream(newMessage.content, getCurrentTimeStamp()); + await callTextStream(multiMessages(chatMessages), getCurrentTimeStamp()); scrollToBottom(scrollToDiv); storeMessages(); diff --git a/CodeGen/Dockerfile.openEuler b/CodeGen/Dockerfile.openEuler new file mode 100644 index 0000000000..ef31614245 --- /dev/null +++ b/CodeGen/Dockerfile.openEuler @@ -0,0 +1,10 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. 
+# SPDX-License-Identifier: Apache-2.0 + +ARG IMAGE_REPO=opea +ARG BASE_TAG=latest +FROM $IMAGE_REPO/comps-base:$BASE_TAG-openeuler + +COPY ./codegen.py $HOME/codegen.py + +ENTRYPOINT ["python", "codegen.py"] diff --git a/CodeGen/README.md b/CodeGen/README.md index 479ad11f29..9aebba4472 100644 --- a/CodeGen/README.md +++ b/CodeGen/README.md @@ -106,19 +106,58 @@ flowchart LR This CodeGen example can be deployed manually on various hardware platforms using Docker Compose or Kubernetes. Select the appropriate guide based on your target environment: -| Hardware | Deployment Mode | Guide Link | -| :-------------- | :------------------- | :----------------------------------------------------------------------- | -| Intel Xeon CPU | Single Node (Docker) | [Xeon Docker Compose Guide](./docker_compose/intel/cpu/xeon/README.md) | -| Intel Gaudi HPU | Single Node (Docker) | [Gaudi Docker Compose Guide](./docker_compose/intel/hpu/gaudi/README.md) | -| AMD EPYC CPU | Single Node (Docker) | [EPYC Docker Compose Guide](./docker_compose/amd/cpu/epyc/README.md) | -| AMD ROCm GPU | Single Node (Docker) | [ROCm Docker Compose Guide](./docker_compose/amd/gpu/rocm/README.md) | -| Intel Xeon CPU | Kubernetes (Helm) | [Kubernetes Helm Guide](./kubernetes/helm/README.md) | -| Intel Gaudi HPU | Kubernetes (Helm) | [Kubernetes Helm Guide](./kubernetes/helm/README.md) | -| Intel Xeon CPU | Kubernetes (GMC) | [Kubernetes GMC Guide](./kubernetes/gmc/README.md) | -| Intel Gaudi HPU | Kubernetes (GMC) | [Kubernetes GMC Guide](./kubernetes/gmc/README.md) | +| Hardware | Deployment Mode | Guide Link | +| :-------------- | :----------------------------------- | :--------------------------------------------------------------------------------------- | +| Intel Xeon CPU | Single Node (Docker) | [Xeon Docker Compose Guide](./docker_compose/intel/cpu/xeon/README.md) | +| Intel Xeon CPU | Single Node (Docker) with Monitoring | [Xeon Docker Compose with Monitoring Guide](./docker_compose/intel/cpu/xeon/README.md) | +| Intel Gaudi HPU | Single Node (Docker) | [Gaudi Docker Compose Guide](./docker_compose/intel/hpu/gaudi/README.md) | +| Intel Gaudi HPU | Single Node (Docker) with Monitoring | [Gaudi Docker Compose with Monitoring Guide](./docker_compose/intel/hpu/gaudi/README.md) | +| AMD EPYC CPU | Single Node (Docker) | [EPYC Docker Compose Guide](./docker_compose/amd/cpu/epyc/README.md) | +| AMD ROCm GPU | Single Node (Docker) | [ROCm Docker Compose Guide](./docker_compose/amd/gpu/rocm/README.md) | +| Intel Xeon CPU | Kubernetes (Helm) | [Kubernetes Helm Guide](./kubernetes/helm/README.md) | +| Intel Gaudi HPU | Kubernetes (Helm) | [Kubernetes Helm Guide](./kubernetes/helm/README.md) | +| Intel Xeon CPU | Kubernetes (GMC) | [Kubernetes GMC Guide](./kubernetes/gmc/README.md) | +| Intel Gaudi HPU | Kubernetes (GMC) | [Kubernetes GMC Guide](./kubernetes/gmc/README.md) | _Note: Building custom microservice images can be done using the resources in [GenAIComps](https://github.com/opea-project/GenAIComps)._ +## Monitoring + +The CodeGen example supports monitoring capabilities for Intel Xeon and Intel Gaudi platforms. 
Monitoring includes: + +- **Prometheus**: For metrics collection and querying +- **Grafana**: For visualization and dashboards +- **Node Exporter**: For system metrics collection + +### Monitoring Features + +- Real-time metrics collection from all CodeGen microservices +- Pre-configured dashboards for: + - vLLM/TGI performance metrics + - CodeGen MegaService metrics + - System resource utilization + - Node-level metrics + +### Enabling Monitoring + +Monitoring can be enabled by using the `compose.monitoring.yaml` file along with the main compose file: + +```bash +# For Intel Xeon +docker compose -f compose.yaml -f compose.monitoring.yaml up -d + +# For Intel Gaudi +docker compose -f compose.yaml -f compose.monitoring.yaml up -d +``` + +### Accessing Monitoring Services + +Once deployed with monitoring, you can access: + +- **Prometheus**: `http://${HOST_IP}:9090` +- **Grafana**: `http://${HOST_IP}:3000` (username: `admin`, password: `admin`) +- **Node Exporter**: `http://${HOST_IP}:9100` + ## Benchmarking Guides for evaluating the performance and accuracy of this CodeGen deployment are available: diff --git a/CodeGen/docker_compose/amd/cpu/epyc/compose.yaml b/CodeGen/docker_compose/amd/cpu/epyc/compose.yaml index 3622248e0b..3c19a7e459 100644 --- a/CodeGen/docker_compose/amd/cpu/epyc/compose.yaml +++ b/CodeGen/docker_compose/amd/cpu/epyc/compose.yaml @@ -4,7 +4,7 @@ services: vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-server ports: - "8028:80" diff --git a/CodeGen/docker_compose/intel/cpu/xeon/README.md b/CodeGen/docker_compose/intel/cpu/xeon/README.md index f8cb1e03ff..ceda275bdc 100644 --- a/CodeGen/docker_compose/intel/cpu/xeon/README.md +++ b/CodeGen/docker_compose/intel/cpu/xeon/README.md @@ -49,7 +49,8 @@ This uses the default vLLM-based deployment using `compose.yaml`. # export https_proxy="your_https_proxy" # export no_proxy="localhost,127.0.0.1,${HOST_IP}" # Add other hosts if necessary source intel/set_env.sh - cd /intel/cpu/xeon + cd intel/cpu/xeon + bash grafana/dashboards/download_opea_dashboard.sh ``` _Note: The compose file might read additional variables from set_env.sh. Ensure all required variables like ports (`LLM_SERVICE_PORT`, `MEGA_SERVICE_PORT`, etc.) are set if not using defaults from the compose file._ @@ -83,13 +84,13 @@ Different Docker Compose files are available to select the LLM serving backend. - **Compose File:** `compose.yaml` - **Description:** Uses vLLM optimized for Intel CPUs as the LLM serving engine. This is the default deployment option used in the Quick Start. -- **Services Deployed:** `codegen-vllm-server`, `codegen-llm-server`, `codegen-tei-embedding-server`, `codegen-retriever-server`, `redis-vector-db`, `codegen-dataprep-server`, `codegen-backend-server`, `codegen-gradio-ui-server`. +- **Services Deployed:** `codegen-vllm-server`, `codegen-llm-server`, `codegen-tei-embedding-server`, `codegen-retriever-server`, `redis-vector-db`, `codegen-dataprep-server`, `codegen-backend-server`, `codegen-ui-server`. #### TGI-based Deployment (`compose_tgi.yaml`) - **Compose File:** `compose_tgi.yaml` - **Description:** Uses Hugging Face Text Generation Inference (TGI) optimized for Intel CPUs as the LLM serving engine. -- **Services Deployed:** `codegen-tgi-server`, `codegen-llm-server`, `codegen-tei-embedding-server`, `codegen-retriever-server`, `redis-vector-db`, `codegen-dataprep-server`, `codegen-backend-server`, `codegen-gradio-ui-server`. 
+- **Services Deployed:** `codegen-tgi-server`, `codegen-llm-server`, `codegen-tei-embedding-server`, `codegen-retriever-server`, `redis-vector-db`, `codegen-dataprep-server`, `codegen-backend-server`, `codegen-ui-server`. - **To Run:** ```bash @@ -101,7 +102,7 @@ Different Docker Compose files are available to select the LLM serving backend. - **Compose File:** `compose_remote.yaml` - **Description:** Uses remote endpoints to access the served LLM's. This is the default configurations except for the LLM serving engine. -- **Services Deployed:** `codegen-tei-embedding-server`, `codegen-retriever-server`, `redis-vector-db`, `codegen-dataprep-server`, `codegen-backend-server`, `codegen-gradio-ui-server`. +- **Services Deployed:** `codegen-tei-embedding-server`, `codegen-retriever-server`, `redis-vector-db`, `codegen-dataprep-server`, `codegen-backend-server`, `codegen-ui-server`. - **To Run:** When models are deployed on a remote server, a base URL and an API key are required to access them. To set up a remote server and acquire the base URL and API key, refer to [Intel® AI for Enterprise Inference](https://www.intel.com/content/www/us/en/developer/topic-technology/artificial-intelligence/enterprise-inference.html) offerings. @@ -146,7 +147,7 @@ Key parameters are configured via environment variables set before running `dock Most of these parameters are in `set_env.sh`, you can either modify this file or overwrite the env variables by setting them. ```shell -source CodeGen/docker_compose/set_env.sh +source CodeGen/docker_compose/intel/set_env.sh ``` #### Compose Files @@ -158,7 +159,7 @@ Different Docker Compose files (`compose.yaml`, `compose_tgi.yaml`) control whic If you need to modify the microservices: 1. Clone the [OPEA GenAIComps](https://github.com/opea-project/GenAIComps) repository. -2. Follow build instructions in the respective component directories (e.g., `comps/llms/text-generation`, `comps/codegen`, `comps/ui/gradio`, etc.). Use the provided Dockerfiles (e.g., `CodeGen/Dockerfile`, `CodeGen/ui/docker/Dockerfile.gradio`). +2. Follow build instructions in the respective component directories (e.g., `comps/llms/text-generation`, `comps/codegen`, etc.). Use the provided Dockerfiles (e.g., `CodeGen/Dockerfile`, `CodeGen/ui/docker/Dockerfile`). 3. Tag your custom images appropriately (e.g., `my-custom-codegen:latest`). 4. Update the `image:` fields in the compose files (`compose.yaml` or `compose_tgi.yaml`) to use your custom image tags. @@ -206,18 +207,17 @@ Use `curl` commands to test the main service endpoints. Ensure `HOST_IP` is corr Multiple UI options can be configured via the compose files. -### Gradio UI (Default) +### Svelte UI (Default) -Access the default Gradio UI by navigating to: +Access the default Svelte UI by navigating to: `http://{HOST_IP}:5173` -_(Port `5173` is the default host mapping for `codegen-gradio-ui-server`)_ +_(Port `5173` is the default host mapping for `codegen-ui-server`)_ -![Gradio UI - Code Generation](../../../../assets/img/codegen_gradio_ui_main.png) -![Gradio UI - Resource Management](../../../../assets/img/codegen_gradio_ui_dataprep.png) +![Svelte UI - Code Generation](../../../../assets/img/codeGen_ui_init.jpg) -### Svelte UI (Optional) +### Gradio UI (Optional) -1. Modify the compose file (either `compose.yaml` or `compose_tgi.yaml`): Comment out the `codegen-gradio-ui-server` service and uncomment/add the `codegen-xeon-ui-server` (Svelte) service definition, ensuring the port mapping is correct (e.g., `"- 5173:5173"`). +1. 
Modify the compose file (either `compose.yaml` or `compose_tgi.yaml`): Comment out the `codegen-xeon-ui-server` (Svelte) service and uncomment/add the `codegen-gradio-ui-server` service definition, ensuring the port mapping is correct (e.g., `"- 5173:5173"`).
 2. Restart Docker Compose: `docker compose up -d` or `docker compose -f compose_tgi.yaml up -d`
 3. Access: `http://{HOST_IP}:5173` (or the host port you mapped).
@@ -252,7 +252,63 @@ Users can interact with the backend service using the `Neural Copilot` VS Code e
 - **"Container name is in use"**: Stop existing containers (`docker compose down`) or change `container_name` in the compose file.
 - **Resource Issues:** CodeGen models can be memory-intensive. Monitor host RAM usage. Increase Docker resources if needed.
 
-## Stopping the Application
+## Monitoring Deployment
+
+To enable monitoring for the CodeGen application, you can use the monitoring Docker Compose file along with the main deployment.
+
+### Option #1: Default Deployment (without monitoring)
+
+To deploy the CodeGen services without monitoring, execute:
+
+```bash
+docker compose up -d
+```
+
+### Option #2: Deployment with Monitoring
+
+> NOTE: To enable monitoring, the `compose.monitoring.yaml` file needs to be merged with the default `compose.yaml` file.
+
+To deploy with monitoring:
+
+```bash
+bash grafana/dashboards/download_opea_dashboard.sh
+docker compose -f compose.yaml -f compose.monitoring.yaml up -d
+```
+
+### Accessing Monitoring Services
+
+Once deployed with monitoring, you can access:
+
+- **Prometheus**: `http://${HOST_IP}:9090`
+- **Grafana**: `http://${HOST_IP}:3000` (username: `admin`, password: `admin`)
+- **Node Exporter**: `http://${HOST_IP}:9100`
+
+### Monitoring Components
+
+The monitoring stack includes:
+
+- **Prometheus**: For metrics collection and querying
+- **Grafana**: For visualization and dashboards
+- **Node Exporter**: For system metrics collection
+
+### Monitoring Dashboards
+
+The following dashboards are automatically downloaded and configured:
+
+- vLLM Dashboard
+- TGI Dashboard
+- CodeGen MegaService Dashboard
+- Node Exporter Dashboard
+
+### Stopping the Application
+
+If monitoring is enabled, execute the following command:
+
+```bash
+docker compose -f compose.yaml -f compose.monitoring.yaml down
+```
+
+If monitoring is not enabled, execute:
 
 ```bash
 docker compose down # for vLLM (compose.yaml)
diff --git a/CodeGen/docker_compose/intel/cpu/xeon/compose.monitoring.yaml b/CodeGen/docker_compose/intel/cpu/xeon/compose.monitoring.yaml
new file mode 100644
index 0000000000..dea34085b3
--- /dev/null
+++ b/CodeGen/docker_compose/intel/cpu/xeon/compose.monitoring.yaml
@@ -0,0 +1,58 @@
+# Copyright (C) 2024 Intel Corporation
+# SPDX-License-Identifier: Apache-2.0
+
+services:
+  prometheus:
+    image: prom/prometheus:v2.52.0
+    container_name: opea_prometheus
+    user: root
+    volumes:
+      - ./prometheus.yaml:/etc/prometheus/prometheus.yaml
+      - ./prometheus_data:/prometheus
+    command:
+      - '--config.file=/etc/prometheus/prometheus.yaml'
+    ports:
+      - '9090:9090'
+    ipc: host
+    restart: unless-stopped
+
+  grafana:
+    image: grafana/grafana:11.0.0
+    container_name: grafana
+    volumes:
+      - ./grafana_data:/var/lib/grafana
+      - ./grafana/dashboards:/var/lib/grafana/dashboards
+      - ./grafana/provisioning:/etc/grafana/provisioning
+    user: root
+    environment:
+      GF_SECURITY_ADMIN_PASSWORD: admin
+      GF_RENDERING_CALLBACK_URL: http://grafana:3000/
+      GF_LOG_FILTERS: rendering:debug
+      no_proxy: ${no_proxy}
+      host_ip: ${host_ip}
+    depends_on:
+      - prometheus
ports: + - '3000:3000' + ipc: host + restart: unless-stopped + + node-exporter: + image: prom/node-exporter + container_name: node-exporter + volumes: + - /proc:/host/proc:ro + - /sys:/host/sys:ro + - /:/rootfs:ro + command: + - '--path.procfs=/host/proc' + - '--path.sysfs=/host/sys' + - --collector.filesystem.ignored-mount-points + - "^/(sys|proc|dev|host|etc|rootfs/var/lib/docker/containers|rootfs/var/lib/docker/overlay2|rootfs/run/docker/netns|rootfs/var/lib/docker/aufs)($$|/)" + environment: + no_proxy: ${no_proxy} + ports: + - 9100:9100 + restart: always + deploy: + mode: global diff --git a/CodeGen/docker_compose/intel/cpu/xeon/compose.yaml b/CodeGen/docker_compose/intel/cpu/xeon/compose.yaml index abb1933789..99cbe8a373 100644 --- a/CodeGen/docker_compose/intel/cpu/xeon/compose.yaml +++ b/CodeGen/docker_compose/intel/cpu/xeon/compose.yaml @@ -4,7 +4,7 @@ services: vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: vllm-server ports: - "8028:80" @@ -66,7 +66,7 @@ services: ipc: host restart: always codegen-xeon-ui-server: - image: ${REGISTRY:-opea}/codegen-gradio-ui:${TAG:-latest} + image: ${REGISTRY:-opea}/codegen-ui:${TAG:-latest} container_name: codegen-xeon-ui-server depends_on: - codegen-xeon-backend-server diff --git a/CodeGen/docker_compose/intel/cpu/xeon/compose_openeuler.yaml b/CodeGen/docker_compose/intel/cpu/xeon/compose_openeuler.yaml new file mode 100644 index 0000000000..fd2b9fc9ba --- /dev/null +++ b/CodeGen/docker_compose/intel/cpu/xeon/compose_openeuler.yaml @@ -0,0 +1,174 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. +# SPDX-License-Identifier: Apache-2.0 + +services: + + vllm-service: + image: openeuler/vllm-cpu:0.10.1-oe2403lts + container_name: vllm-server + ports: + - "8028:80" + volumes: + - "${MODEL_CACHE:-./data}:/root/.cache/huggingface/hub" + shm_size: 1g + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + HF_TOKEN: ${HF_TOKEN} + host_ip: ${host_ip} + healthcheck: + test: ["CMD-SHELL", "curl -f http://localhost:80/health || exit 1"] + interval: 10s + timeout: 10s + retries: 100 + command: --model ${LLM_MODEL_ID} --host 0.0.0.0 --port 80 + llm-base: + image: ${REGISTRY:-opea}/llm-textgen:${TAG:-latest}-openeuler + container_name: llm-textgen-server + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + LLM_ENDPOINT: ${LLM_ENDPOINT} + LLM_MODEL_ID: ${LLM_MODEL_ID} + HF_TOKEN: ${HF_TOKEN} + restart: unless-stopped + llm-vllm-service: + extends: llm-base + container_name: llm-codegen-vllm-server + ports: + - "9000:9000" + ipc: host + depends_on: + vllm-service: + condition: service_healthy + codegen-xeon-backend-server: + image: ${REGISTRY:-opea}/codegen:${TAG:-latest}-openeuler + container_name: codegen-xeon-backend-server + depends_on: + llm-base: + condition: service_started + dataprep-redis-server: + condition: service_healthy + ports: + - "7778:7778" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} + - LLM_SERVICE_HOST_IP=${LLM_SERVICE_HOST_IP} + - RETRIEVAL_SERVICE_HOST_IP=${RETRIEVAL_SERVICE_HOST_IP} + - REDIS_RETRIEVER_PORT=${REDIS_RETRIEVER_PORT} + - TEI_EMBEDDING_HOST_IP=${TEI_EMBEDDING_HOST_IP} + - EMBEDDER_PORT=${EMBEDDER_PORT} + ipc: host + restart: always + codegen-xeon-ui-server: + image: ${REGISTRY:-opea}/codegen-gradio-ui:${TAG:-latest}-openeuler + 
container_name: codegen-xeon-ui-server + depends_on: + - codegen-xeon-backend-server + ports: + - "5173:5173" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - BASIC_URL=${BACKEND_SERVICE_ENDPOINT} + - MEGA_SERVICE_PORT=${MEGA_SERVICE_PORT} + - host_ip=${host_ip} + - DATAPREP_ENDPOINT=${DATAPREP_ENDPOINT} + - DATAPREP_REDIS_PORT=${DATAPREP_REDIS_PORT} + ipc: host + restart: always + redis-vector-db: + image: redis/redis-stack:7.2.0-v9 + container_name: redis-vector-db + ports: + - "${REDIS_DB_PORT:-6379}:${REDIS_DB_PORT:-6379}" + - "${REDIS_INSIGHTS_PORT:-8001}:${REDIS_INSIGHTS_PORT:-8001}" + dataprep-redis-server: + image: ${REGISTRY:-opea}/dataprep:${TAG:-latest}-openeuler + container_name: dataprep-redis-server + depends_on: + - redis-vector-db + ports: + - "${DATAPREP_REDIS_PORT}:5000" + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + REDIS_URL: ${REDIS_URL} + REDIS_HOST: ${host_ip} + INDEX_NAME: ${INDEX_NAME} + HF_TOKEN: ${HF_TOKEN} + LOGFLAG: true + healthcheck: + test: ["CMD-SHELL", "curl -f http://localhost:5000/v1/health_check || exit 1"] + interval: 10s + timeout: 5s + retries: 10 + restart: unless-stopped + tei-embedding-serving: + image: openeuler/text-embeddings-inference-cpu:1.7.0-oe2403lts + container_name: tei-embedding-serving + entrypoint: /bin/sh -c "yum update -y && yum install -y curl && text-embeddings-router --json-output --model-id ${EMBEDDING_MODEL_ID} --auto-truncate" + ports: + - "${TEI_EMBEDDER_PORT:-12000}:80" + volumes: + - "./data:/data" + shm_size: 1g + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + host_ip: ${host_ip} + HF_TOKEN: ${HF_TOKEN} + healthcheck: + test: ["CMD", "curl", "-f", "http://localhost:80/health"] + interval: 10s + timeout: 6s + retries: 48 + tei-embedding-server: + image: ${REGISTRY:-opea}/embedding:${TAG:-latest}-openeuler + container_name: tei-embedding-server + ports: + - "${EMBEDDER_PORT:-10201}:6000" + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + TEI_EMBEDDING_ENDPOINT: ${TEI_EMBEDDING_ENDPOINT} + EMBEDDING_COMPONENT_NAME: "OPEA_TEI_EMBEDDING" + depends_on: + tei-embedding-serving: + condition: service_healthy + restart: unless-stopped + retriever-redis: + image: ${REGISTRY:-opea}/retriever:${TAG:-latest}-openeuler + container_name: retriever-redis + depends_on: + - redis-vector-db + ports: + - "${REDIS_RETRIEVER_PORT:-7000}:${REDIS_RETRIEVER_PORT:-7000}" + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + REDIS_URL: ${REDIS_URL} + REDIS_DB_PORT: ${REDIS_DB_PORT} + REDIS_INSIGHTS_PORT: ${REDIS_INSIGHTS_PORT} + REDIS_RETRIEVER_PORT: ${REDIS_RETRIEVER_PORT} + INDEX_NAME: ${INDEX_NAME} + TEI_EMBEDDING_ENDPOINT: ${TEI_EMBEDDING_ENDPOINT} + HF_TOKEN: ${HF_TOKEN} + LOGFLAG: ${LOGFLAG} + RETRIEVER_COMPONENT_NAME: ${RETRIEVER_COMPONENT_NAME:-OPEA_RETRIEVER_REDIS} + restart: unless-stopped +networks: + default: + driver: bridge diff --git a/CodeGen/docker_compose/intel/cpu/xeon/compose_remote.yaml b/CodeGen/docker_compose/intel/cpu/xeon/compose_remote.yaml index e4ad0fd364..62b79796ee 100644 --- a/CodeGen/docker_compose/intel/cpu/xeon/compose_remote.yaml +++ b/CodeGen/docker_compose/intel/cpu/xeon/compose_remote.yaml @@ -26,7 +26,7 @@ services: ipc: host restart: always codegen-xeon-ui-server: - image: ${REGISTRY:-opea}/codegen-gradio-ui:${TAG:-latest} + image: 
${REGISTRY:-opea}/codegen-ui:${TAG:-latest} container_name: codegen-xeon-ui-server depends_on: - codegen-xeon-backend-server diff --git a/CodeGen/docker_compose/intel/cpu/xeon/compose_tgi.yaml b/CodeGen/docker_compose/intel/cpu/xeon/compose_tgi.yaml index 7c1c3802e5..0da9cdddd3 100644 --- a/CodeGen/docker_compose/intel/cpu/xeon/compose_tgi.yaml +++ b/CodeGen/docker_compose/intel/cpu/xeon/compose_tgi.yaml @@ -66,7 +66,7 @@ services: ipc: host restart: always codegen-xeon-ui-server: - image: ${REGISTRY:-opea}/codegen-gradio-ui:${TAG:-latest} + image: ${REGISTRY:-opea}/codegen-ui:${TAG:-latest} container_name: codegen-xeon-ui-server depends_on: - codegen-xeon-backend-server diff --git a/CodeGen/docker_compose/intel/cpu/xeon/compose_tgi_openeuler.yaml b/CodeGen/docker_compose/intel/cpu/xeon/compose_tgi_openeuler.yaml new file mode 100644 index 0000000000..93e997371f --- /dev/null +++ b/CodeGen/docker_compose/intel/cpu/xeon/compose_tgi_openeuler.yaml @@ -0,0 +1,174 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. +# SPDX-License-Identifier: Apache-2.0 + +services: + + tgi-service: + image: openeuler/text-generation-inference-cpu:2.4.0-oe2403lts + container_name: tgi-server + ports: + - "8028:80" + volumes: + - "${MODEL_CACHE:-./data}:/data" + shm_size: 1g + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + HF_TOKEN: ${HF_TOKEN} + host_ip: ${host_ip} + healthcheck: + test: ["CMD-SHELL", "curl -f http://localhost:80/health || exit 1"] + interval: 10s + timeout: 10s + retries: 100 + command: --model-id ${LLM_MODEL_ID} --cuda-graphs 0 + llm-base: + image: ${REGISTRY:-opea}/llm-textgen:${TAG:-latest}-openeuler + container_name: llm-textgen-server + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + LLM_ENDPOINT: ${LLM_ENDPOINT} + LLM_MODEL_ID: ${LLM_MODEL_ID} + HF_TOKEN: ${HF_TOKEN} + restart: unless-stopped + llm-tgi-service: + extends: llm-base + container_name: llm-codegen-tgi-server + ports: + - "9000:9000" + ipc: host + depends_on: + tgi-service: + condition: service_healthy + codegen-xeon-backend-server: + image: ${REGISTRY:-opea}/codegen:${TAG:-latest}-openeuler + container_name: codegen-xeon-backend-server + depends_on: + llm-base: + condition: service_started + dataprep-redis-server: + condition: service_healthy + ports: + - "7778:7778" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} + - LLM_SERVICE_HOST_IP=${LLM_SERVICE_HOST_IP} + - RETRIEVAL_SERVICE_HOST_IP=${RETRIEVAL_SERVICE_HOST_IP} + - REDIS_RETRIEVER_PORT=${REDIS_RETRIEVER_PORT} + - TEI_EMBEDDING_HOST_IP=${TEI_EMBEDDING_HOST_IP} + - EMBEDDER_PORT=${EMBEDDER_PORT} + ipc: host + restart: always + codegen-xeon-ui-server: + image: ${REGISTRY:-opea}/codegen-gradio-ui:${TAG:-latest}-openeuler + container_name: codegen-xeon-ui-server + depends_on: + - codegen-xeon-backend-server + ports: + - "5173:5173" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - BASIC_URL=${BACKEND_SERVICE_ENDPOINT} + - MEGA_SERVICE_PORT=${MEGA_SERVICE_PORT} + - host_ip=${host_ip} + - DATAPREP_ENDPOINT=${DATAPREP_ENDPOINT} + - DATAPREP_REDIS_PORT=${DATAPREP_REDIS_PORT} + ipc: host + restart: always + redis-vector-db: + image: redis/redis-stack:7.2.0-v9 + container_name: redis-vector-db + ports: + - "${REDIS_DB_PORT}:${REDIS_DB_PORT}" + - "${REDIS_INSIGHTS_PORT}:${REDIS_INSIGHTS_PORT}" + dataprep-redis-server: + image: 
${REGISTRY:-opea}/dataprep:${TAG:-latest}-openeuler + container_name: dataprep-redis-server + depends_on: + - redis-vector-db + ports: + - "${DATAPREP_REDIS_PORT}:5000" + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + REDIS_URL: ${REDIS_URL} + REDIS_HOST: ${host_ip} + INDEX_NAME: ${INDEX_NAME} + HF_TOKEN: ${HF_TOKEN} + LOGFLAG: true + healthcheck: + test: ["CMD-SHELL", "curl -f http://localhost:5000/v1/health_check || exit 1"] + interval: 10s + timeout: 5s + retries: 10 + restart: unless-stopped + tei-embedding-serving: + image: openeuler/text-embeddings-inference-cpu:1.7.0-oe2403lts + container_name: tei-embedding-serving + entrypoint: /bin/sh -c "yum update -y && yum install -y curl && text-embeddings-router --json-output --model-id ${EMBEDDING_MODEL_ID} --auto-truncate" + ports: + - "${TEI_EMBEDDER_PORT:-12000}:80" + volumes: + - "./data:/data" + shm_size: 1g + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + host_ip: ${host_ip} + HF_TOKEN: ${HF_TOKEN} + healthcheck: + test: ["CMD", "curl", "-f", "http://localhost:80/health"] + interval: 10s + timeout: 6s + retries: 48 + tei-embedding-server: + image: ${REGISTRY:-opea}/embedding:${TAG:-latest}-openeuler + container_name: tei-embedding-server + ports: + - "${EMBEDDER_PORT:-10201}:6000" + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + TEI_EMBEDDING_ENDPOINT: ${TEI_EMBEDDING_ENDPOINT} + EMBEDDING_COMPONENT_NAME: "OPEA_TEI_EMBEDDING" + depends_on: + tei-embedding-serving: + condition: service_healthy + restart: unless-stopped + retriever-redis: + image: ${REGISTRY:-opea}/retriever:${TAG:-latest}-openeuler + container_name: retriever-redis + depends_on: + - redis-vector-db + ports: + - "${REDIS_RETRIEVER_PORT}:${REDIS_RETRIEVER_PORT}" + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + REDIS_URL: ${REDIS_URL} + REDIS_DB_PORT: ${REDIS_DB_PORT} + REDIS_INSIGHTS_PORT: ${REDIS_INSIGHTS_PORT} + REDIS_RETRIEVER_PORT: ${REDIS_RETRIEVER_PORT} + INDEX_NAME: ${INDEX_NAME} + TEI_EMBEDDING_ENDPOINT: ${TEI_EMBEDDING_ENDPOINT} + HF_TOKEN: ${HF_TOKEN} + LOGFLAG: ${LOGFLAG} + RETRIEVER_COMPONENT_NAME: ${RETRIEVER_COMPONENT_NAME:-OPEA_RETRIEVER_REDIS} + restart: unless-stopped +networks: + default: + driver: bridge diff --git a/CodeGen/docker_compose/intel/cpu/xeon/grafana/dashboards/download_opea_dashboard.sh b/CodeGen/docker_compose/intel/cpu/xeon/grafana/dashboards/download_opea_dashboard.sh new file mode 100644 index 0000000000..48a4d78cf9 --- /dev/null +++ b/CodeGen/docker_compose/intel/cpu/xeon/grafana/dashboards/download_opea_dashboard.sh @@ -0,0 +1,13 @@ +#!/bin/bash +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)" +cd "$SCRIPT_DIR" +if ls *.json 1> /dev/null 2>&1; then + rm *.json +fi + +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/vllm_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/tgi_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/codegen_megaservice_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/node_grafana.json diff --git 
a/CodeGen/docker_compose/intel/cpu/xeon/grafana/provisioning/dashboards/local.yaml b/CodeGen/docker_compose/intel/cpu/xeon/grafana/provisioning/dashboards/local.yaml new file mode 100644 index 0000000000..13922a769b --- /dev/null +++ b/CodeGen/docker_compose/intel/cpu/xeon/grafana/provisioning/dashboards/local.yaml @@ -0,0 +1,14 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +apiVersion: 1 + +providers: +- name: 'default' + orgId: 1 + folder: '' + type: file + disableDeletion: false + updateIntervalSeconds: 10 #how often Grafana will scan for changed dashboards + options: + path: /var/lib/grafana/dashboards diff --git a/CodeGen/docker_compose/intel/cpu/xeon/grafana/provisioning/datasources/datasource.yml b/CodeGen/docker_compose/intel/cpu/xeon/grafana/provisioning/datasources/datasource.yml new file mode 100644 index 0000000000..a206521d67 --- /dev/null +++ b/CodeGen/docker_compose/intel/cpu/xeon/grafana/provisioning/datasources/datasource.yml @@ -0,0 +1,54 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +# config file version +apiVersion: 1 + +# list of datasources that should be deleted from the database +deleteDatasources: + - name: Prometheus + orgId: 1 + +# list of datasources to insert/update depending +# what's available in the database +datasources: + # name of the datasource. Required +- name: Prometheus + # datasource type. Required + type: prometheus + # access mode. direct or proxy. Required + access: proxy + # org id. will default to orgId 1 if not specified + orgId: 1 + # url + url: http://$host_ip:9090 + # database password, if used + password: + # database user, if used + user: + # database name, if used + database: + # enable/disable basic auth + basicAuth: false + # basic auth username, if used + basicAuthUser: + # basic auth password, if used + basicAuthPassword: + # enable/disable with credentials headers + withCredentials: + # mark as default datasource. Max one per org + isDefault: true + # fields that will be converted to json and stored in json_data + jsonData: + httpMethod: GET + graphiteVersion: "1.1" + tlsAuth: false + tlsAuthWithCACert: false + # json object of data that will be encrypted. + secureJsonData: + tlsCACert: "..." + tlsClientCert: "..." + tlsClientKey: "..." + version: 1 + # allow users to edit datasources from the UI. 
+ editable: true diff --git a/CodeGen/docker_compose/intel/cpu/xeon/prometheus.yaml b/CodeGen/docker_compose/intel/cpu/xeon/prometheus.yaml new file mode 100644 index 0000000000..27d0940e09 --- /dev/null +++ b/CodeGen/docker_compose/intel/cpu/xeon/prometheus.yaml @@ -0,0 +1,27 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +# [IP_ADDR]:{PORT_OUTSIDE_CONTAINER} -> {PORT_INSIDE_CONTAINER} / {PROTOCOL} +global: + scrape_interval: 5s + external_labels: + monitor: "my-monitor" +scrape_configs: + - job_name: "prometheus" + static_configs: + - targets: ["opea_prometheus:9090"] + - job_name: "vllm" + metrics_path: /metrics + static_configs: + - targets: ["vllm-server:80"] + - job_name: "tgi" + metrics_path: /metrics + static_configs: + - targets: [ "tgi-service:80" ] + - job_name: "codegen-backend-server" + metrics_path: /metrics + static_configs: + - targets: ["codegen-xeon-backend-server:7778"] + - job_name: "prometheus-node-exporter" + metrics_path: /metrics + static_configs: + - targets: ["node-exporter:9100"] diff --git a/CodeGen/docker_compose/intel/hpu/gaudi/README.md b/CodeGen/docker_compose/intel/hpu/gaudi/README.md index 0f1e438cf8..2d72155ff3 100644 --- a/CodeGen/docker_compose/intel/hpu/gaudi/README.md +++ b/CodeGen/docker_compose/intel/hpu/gaudi/README.md @@ -49,7 +49,10 @@ This uses the default vLLM-based deployment using `compose.yaml`. # export https_proxy="your_https_proxy" # export no_proxy="localhost,127.0.0.1,${HOST_IP}" # Add other hosts if necessary source intel/set_env.sh - cd /intel/hpu/gaudi + cd intel/hpu/gaudi + cd grafana/dashboards + bash download_opea_dashboard.sh + cd ../.. ``` _Note: The compose file might read additional variables from set_env.sh. Ensure all required variables like ports (`LLM_SERVICE_PORT`, `MEGA_SERVICE_PORT`, etc.) are set if not using defaults from the compose file._ @@ -83,7 +86,7 @@ There are two separate Docker Compose files to select the LLM serving backend ac - **Compose File:** `compose.yaml` - **Description:** Uses vLLM optimized for Intel Gaudi HPUs as the LLM serving engine. This is the default deployment used in the Quick Start. - **Gaudi Service:** `codegen-vllm-gaudi-server` -- **Other Services:** `codegen-llm-server`, `codegen-tei-embedding-server` (CPU), `codegen-retriever-server` (CPU), `redis-vector-db` (CPU), `codegen-dataprep-server` (CPU), `codegen-backend-server` (CPU), `codegen-gradio-ui-server` (CPU). +- **Other Services:** `codegen-llm-server`, `codegen-tei-embedding-server` (CPU), `codegen-retriever-server` (CPU), `redis-vector-db` (CPU), `codegen-dataprep-server` (CPU), `codegen-backend-server` (CPU), `codegen-ui-server` (CPU). ### TGI-based Deployment (`compose_tgi.yaml`) @@ -194,23 +197,23 @@ Use `curl` commands targeting the main service endpoints. Ensure `HOST_IP` is co UI options are similar to the Xeon deployment. -### Gradio UI (Default) +### Svelte UI (Default) -Access the default Gradio UI: +Access the default Svelte UI: `http://{HOST_IP}:5173` _(Port `5173` is the default host mapping)_ -![Gradio UI](../../../../assets/img/codegen_gradio_ui_main.png) +![Svelte UI](../../../../assets/img/codeGen_ui_init.jpg) -### Svelte UI (Optional) +### Gradio UI (Optional) -1. Modify the compose file (either `compose.yaml` or `compose_tgi.yaml`): Swap Gradio service for Svelte (`codegen-gaudi-ui-server`), check port map (e.g., `5173:5173`). +1. 
Modify the compose file (either `compose.yaml` or `compose_tgi.yaml`): Swap Svelte service for Gradio (`codegen-gradio-ui-server`), check port map (e.g., `5173:5173`). 2. Restart: `docker compose up -d` or `docker compose -f compose_tgi.yaml up -d` 3. Access: `http://{HOST_IP}:5173` ### React UI (Optional) -1. Modify the compose file (either `compose.yaml` or `compose_tgi.yaml`): Swap Gradio service for React (`codegen-gaudi-react-ui-server`), check port map (e.g., `5174:80`). +1. Modify the compose file (either `compose.yaml` or `compose_tgi.yaml`): Swap Svelte service for React (`codegen-gaudi-react-ui-server`), check port map (e.g., `5174:80`). 2. Restart: `docker compose up -d` or `docker compose -f compose_tgi.yaml up -d` 3. Access: `http://{HOST_IP}:5174` @@ -228,7 +231,62 @@ Use the `Neural Copilot` extension configured with the CodeGen backend URL: `htt - **Model Download Issues:** Check `HF_TOKEN`, internet access, proxy settings. Check LLM service logs. - **Connection Errors:** Verify `HOST_IP`, ports, and proxy settings. Use `docker ps` and check service logs. -## Stopping the Application +## Monitoring Deployment + +To enable monitoring for the CodeGen application on Gaudi, you can use the monitoring Docker Compose file along with the main deployment. + +### Option #1: Default Deployment (without monitoring) + +To deploy the CodeGen services without monitoring, execute: + +```bash +docker compose up -d +``` + +### Option #2: Deployment with Monitoring + +> NOTE: To enable monitoring, the `compose.monitoring.yaml` file needs to be merged with the default `compose.yaml` file. + +To deploy with monitoring: + +```bash +docker compose -f compose.yaml -f compose.monitoring.yaml up -d +``` + +### Accessing Monitoring Services + +Once deployed with monitoring, you can access: + +- **Prometheus**: `http://${HOST_IP}:9090` +- **Grafana**: `http://${HOST_IP}:3000` (username: `admin`, password: `admin`) +- **Node Exporter**: `http://${HOST_IP}:9100` + +### Monitoring Components + +The monitoring stack includes: + +- **Prometheus**: For metrics collection and querying +- **Grafana**: For visualization and dashboards +- **Node Exporter**: For system metrics collection + +### Monitoring Dashboards + +The following dashboards are automatically downloaded and configured: + +- vLLM Dashboard +- TGI Dashboard +- CodeGen MegaService Dashboard +- Node Exporter Dashboard +- Gaudi Dashboard (`gaudi_grafana_v2.json`) + +### Stopping the Application + +If monitoring is enabled, execute the following command: + +```bash +docker compose -f compose.yaml -f compose.monitoring.yaml down +``` + +If monitoring is not enabled, execute: ```bash docker compose down # for vLLM (compose.yaml) diff --git a/CodeGen/docker_compose/intel/hpu/gaudi/compose.monitoring.yaml b/CodeGen/docker_compose/intel/hpu/gaudi/compose.monitoring.yaml new file mode 100644 index 0000000000..cd891a445d --- /dev/null +++ b/CodeGen/docker_compose/intel/hpu/gaudi/compose.monitoring.yaml @@ -0,0 +1,73 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +services: + prometheus: + image: prom/prometheus:v2.52.0 + container_name: opea_prometheus + user: root + volumes: + - ./prometheus.yaml:/etc/prometheus/prometheus.yaml + - ./prometheus_data:/prometheus + command: + - '--config.file=/etc/prometheus/prometheus.yaml' + ports: + - '9090:9090' + ipc: host + restart: unless-stopped + + grafana: + image: grafana/grafana:11.0.0 + container_name: grafana + volumes: + - ./grafana_data:/var/lib/grafana + - ./grafana/dashboards:/var/lib/grafana/dashboards + -
./grafana/provisioning:/etc/grafana/provisioning + user: root + environment: + GF_SECURITY_ADMIN_PASSWORD: admin + GF_RENDERING_CALLBACK_URL: http://grafana:3000/ + GF_LOG_FILTERS: rendering:debug + no_proxy: ${no_proxy} + host_ip: ${host_ip} + depends_on: + - prometheus + ports: + - '3000:3000' + ipc: host + restart: unless-stopped + + node-exporter: + image: prom/node-exporter + container_name: node-exporter + volumes: + - /proc:/host/proc:ro + - /sys:/host/sys:ro + - /:/rootfs:ro + command: + - '--path.procfs=/host/proc' + - '--path.sysfs=/host/sys' + - --collector.filesystem.ignored-mount-points + - "^/(sys|proc|dev|host|etc|rootfs/var/lib/docker/containers|rootfs/var/lib/docker/overlay2|rootfs/run/docker/netns|rootfs/var/lib/docker/aufs)($$|/)" + environment: + no_proxy: ${no_proxy} + ports: + - 9100:9100 + restart: always + deploy: + mode: global + + gaudi-metrics-exporter: + image: vault.habana.ai/gaudi-metric-exporter/metric-exporter:latest + privileged: true + container_name: gaudi-metrics-exporter + volumes: + - /proc:/host/proc:ro + - /sys:/host/sys:ro + - /:/rootfs:ro + - /dev:/dev + deploy: + mode: global + ports: + - 41611:41611 + restart: unless-stopped diff --git a/CodeGen/docker_compose/intel/hpu/gaudi/compose.yaml b/CodeGen/docker_compose/intel/hpu/gaudi/compose.yaml index 2e56d1b913..6b33db7e82 100644 --- a/CodeGen/docker_compose/intel/hpu/gaudi/compose.yaml +++ b/CodeGen/docker_compose/intel/hpu/gaudi/compose.yaml @@ -3,7 +3,7 @@ services: vllm-service: - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} + image: opea/vllm-gaudi:1.4 container_name: vllm-gaudi-server ports: - "8028:80" @@ -74,7 +74,7 @@ services: ipc: host restart: always codegen-gaudi-ui-server: - image: ${REGISTRY:-opea}/codegen-gradio-ui:${TAG:-latest} + image: ${REGISTRY:-opea}/codegen-ui:${TAG:-latest} container_name: codegen-gaudi-ui-server depends_on: - codegen-gaudi-backend-server diff --git a/CodeGen/docker_compose/intel/hpu/gaudi/compose_tgi.yaml b/CodeGen/docker_compose/intel/hpu/gaudi/compose_tgi.yaml index 8339451000..aa8f4a51ea 100644 --- a/CodeGen/docker_compose/intel/hpu/gaudi/compose_tgi.yaml +++ b/CodeGen/docker_compose/intel/hpu/gaudi/compose_tgi.yaml @@ -74,7 +74,7 @@ services: ipc: host restart: always codegen-gaudi-ui-server: - image: ${REGISTRY:-opea}/codegen-gradio-ui:${TAG:-latest} + image: ${REGISTRY:-opea}/codegen-ui:${TAG:-latest} container_name: codegen-gaudi-ui-server depends_on: - codegen-gaudi-backend-server diff --git a/CodeGen/docker_compose/intel/hpu/gaudi/grafana/dashboards/download_opea_dashboard.sh b/CodeGen/docker_compose/intel/hpu/gaudi/grafana/dashboards/download_opea_dashboard.sh new file mode 100644 index 0000000000..40f2cb12a6 --- /dev/null +++ b/CodeGen/docker_compose/intel/hpu/gaudi/grafana/dashboards/download_opea_dashboard.sh @@ -0,0 +1,16 @@ +#!/bin/bash +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)" +cd "$SCRIPT_DIR" + +if ls *.json 1> /dev/null 2>&1; then + rm *.json +fi + +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/vllm_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/tgi_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/codegen_megaservice_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/node_grafana.json 
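+# The extra gaudi_grafana_v2.json dashboard below covers Gaudi accelerator metrics (presumably fed by the gaudi-metrics-exporter target scraped in prometheus.yaml).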
+wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/gaudi_grafana_v2.json diff --git a/CodeGen/docker_compose/intel/hpu/gaudi/grafana/provisioning/dashboards/local.yaml b/CodeGen/docker_compose/intel/hpu/gaudi/grafana/provisioning/dashboards/local.yaml new file mode 100644 index 0000000000..13922a769b --- /dev/null +++ b/CodeGen/docker_compose/intel/hpu/gaudi/grafana/provisioning/dashboards/local.yaml @@ -0,0 +1,14 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +apiVersion: 1 + +providers: +- name: 'default' + orgId: 1 + folder: '' + type: file + disableDeletion: false + updateIntervalSeconds: 10 #how often Grafana will scan for changed dashboards + options: + path: /var/lib/grafana/dashboards diff --git a/CodeGen/docker_compose/intel/hpu/gaudi/grafana/provisioning/datasources/datasource.yml b/CodeGen/docker_compose/intel/hpu/gaudi/grafana/provisioning/datasources/datasource.yml new file mode 100644 index 0000000000..a206521d67 --- /dev/null +++ b/CodeGen/docker_compose/intel/hpu/gaudi/grafana/provisioning/datasources/datasource.yml @@ -0,0 +1,54 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +# config file version +apiVersion: 1 + +# list of datasources that should be deleted from the database +deleteDatasources: + - name: Prometheus + orgId: 1 + +# list of datasources to insert/update depending +# what's available in the database +datasources: + # name of the datasource. Required +- name: Prometheus + # datasource type. Required + type: prometheus + # access mode. direct or proxy. Required + access: proxy + # org id. will default to orgId 1 if not specified + orgId: 1 + # url + url: http://$host_ip:9090 + # database password, if used + password: + # database user, if used + user: + # database name, if used + database: + # enable/disable basic auth + basicAuth: false + # basic auth username, if used + basicAuthUser: + # basic auth password, if used + basicAuthPassword: + # enable/disable with credentials headers + withCredentials: + # mark as default datasource. Max one per org + isDefault: true + # fields that will be converted to json and stored in json_data + jsonData: + httpMethod: GET + graphiteVersion: "1.1" + tlsAuth: false + tlsAuthWithCACert: false + # json object of data that will be encrypted. + secureJsonData: + tlsCACert: "..." + tlsClientCert: "..." + tlsClientKey: "..." + version: 1 + # allow users to edit datasources from the UI. 
+ editable: true diff --git a/CodeGen/docker_compose/intel/hpu/gaudi/prometheus.yaml b/CodeGen/docker_compose/intel/hpu/gaudi/prometheus.yaml new file mode 100644 index 0000000000..f259e2f7f9 --- /dev/null +++ b/CodeGen/docker_compose/intel/hpu/gaudi/prometheus.yaml @@ -0,0 +1,32 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +# [IP_ADDR]:{PORT_OUTSIDE_CONTAINER} -> {PORT_INSIDE_CONTAINER} / {PROTOCOL} +global: + scrape_interval: 5s + external_labels: + monitor: "my-monitor" +scrape_configs: + - job_name: "prometheus" + static_configs: + - targets: ["opea_prometheus:9090"] + - job_name: "vllm" + metrics_path: /metrics + static_configs: + - targets: ["codegen-vllm-gaudi-server:80"] + - job_name: "tgi" + metrics_path: /metrics + static_configs: + - targets: ["codegen-tgi-gaudi-server:80"] + - job_name: "codegen-backend-server" + metrics_path: /metrics + static_configs: + - targets: ["codegen-gaudi-backend-server:7778"] + - job_name: "prometheus-node-exporter" + metrics_path: /metrics + static_configs: + - targets: ["node-exporter:9100"] + - job_name: "gaudi-metrics-exporter" + scrape_interval: 30s + metrics_path: /metrics + static_configs: + - targets: [ "gaudi-metrics-exporter:41611" ] diff --git a/CodeGen/docker_compose/intel/set_env.sh b/CodeGen/docker_compose/intel/set_env.sh index 543e9fee88..5e08df213e 100644 --- a/CodeGen/docker_compose/intel/set_env.sh +++ b/CodeGen/docker_compose/intel/set_env.sh @@ -51,3 +51,9 @@ export DATAPREP_ENDPOINT="http://${HOST_IP}:${DATAPREP_REDIS_PORT}/v1/dataprep" export LOGFLAG=false export MODEL_CACHE=${model_cache:-"./data"} export NUM_CARDS=1 + + +# Set network proxy settings +export no_proxy="${no_proxy},${HOST_IP},vllm-server,codegen-xeon-backend-server,codegen-xeon-ui-server,redis-vector-db,dataprep-redis-server,tei-embedding-serving,tei-embedding-server,retriever-redis,opea_prometheus,grafana,node-exporter,$JAEGER_IP" # Example: no_proxy="localhost, 127.0.0.1, 192.168.1.1" +export http_proxy=$http_proxy +export https_proxy=$https_proxy diff --git a/CodeGen/docker_image_build/build.yaml b/CodeGen/docker_image_build/build.yaml index 282c29766c..f0bfa23580 100644 --- a/CodeGen/docker_image_build/build.yaml +++ b/CodeGen/docker_image_build/build.yaml @@ -31,45 +31,86 @@ services: dockerfile: ./docker/Dockerfile.gradio extends: codegen image: ${REGISTRY:-opea}/codegen-gradio-ui:${TAG:-latest} + codegen-openeuler: + build: + args: + IMAGE_REPO: ${REGISTRY} + BASE_TAG: ${TAG} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + no_proxy: ${no_proxy} + context: ../ + dockerfile: ./Dockerfile.openEuler + image: ${REGISTRY:-opea}/codegen:${TAG:-latest}-openeuler + codegen-ui-openeuler: + build: + context: ../ui + dockerfile: ./docker/Dockerfile.openEuler + extends: codegen + image: ${REGISTRY:-opea}/codegen-ui:${TAG:-latest}-openeuler + codegen-react-ui-openeuler: + build: + context: ../ui + dockerfile: ./docker/Dockerfile.react.openEuler + extends: codegen + image: ${REGISTRY:-opea}/codegen-react-ui:${TAG:-latest}-openeuler + codegen-gradio-ui-openeuler: + build: + context: ../ui + dockerfile: ./docker/Dockerfile.gradio.openEuler + extends: codegen + image: ${REGISTRY:-opea}/codegen-gradio-ui:${TAG:-latest}-openeuler llm-textgen: build: context: GenAIComps dockerfile: comps/llms/src/text-generation/Dockerfile extends: codegen image: ${REGISTRY:-opea}/llm-textgen:${TAG:-latest} + llm-textgen-openeuler: + build: + context: GenAIComps + dockerfile: comps/llms/src/text-generation/Dockerfile.openEuler + extends: 
codegen + image: ${REGISTRY:-opea}/llm-textgen:${TAG:-latest}-openeuler vllm-rocm: build: context: GenAIComps dockerfile: comps/third_parties/vllm/src/Dockerfile.amd_gpu extends: codegen image: ${REGISTRY:-opea}/vllm-rocm:${TAG:-latest} - vllm: - build: - context: vllm - dockerfile: docker/Dockerfile.cpu - extends: codegen - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} - vllm-gaudi: - build: - context: vllm-fork - dockerfile: Dockerfile.hpu - extends: codegen - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} dataprep: build: context: GenAIComps dockerfile: comps/dataprep/src/Dockerfile extends: codegen image: ${REGISTRY:-opea}/dataprep:${TAG:-latest} + dataprep-openeuler: + build: + context: GenAIComps + dockerfile: comps/dataprep/src/Dockerfile.openEuler + extends: codegen + image: ${REGISTRY:-opea}/dataprep:${TAG:-latest}-openeuler retriever: build: context: GenAIComps dockerfile: comps/retrievers/src/Dockerfile extends: codegen image: ${REGISTRY:-opea}/retriever:${TAG:-latest} + retriever-openeuler: + build: + context: GenAIComps + dockerfile: comps/retrievers/src/Dockerfile.openEuler + extends: codegen + image: ${REGISTRY:-opea}/retriever:${TAG:-latest}-openeuler embedding: build: context: GenAIComps dockerfile: comps/embeddings/src/Dockerfile extends: codegen image: ${REGISTRY:-opea}/embedding:${TAG:-latest} + embedding-openeuler: + build: + context: GenAIComps + dockerfile: comps/embeddings/src/Dockerfile.openEuler + extends: codegen + image: ${REGISTRY:-opea}/embedding:${TAG:-latest}-openeuler diff --git a/CodeGen/kubernetes/helm/cpu-openeuler-values.yaml b/CodeGen/kubernetes/helm/cpu-openeuler-values.yaml new file mode 100644 index 0000000000..884d7177c7 --- /dev/null +++ b/CodeGen/kubernetes/helm/cpu-openeuler-values.yaml @@ -0,0 +1,40 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. +# SPDX-License-Identifier: Apache-2.0 + +# This file is based on cpu-values.yaml and overrides image tags to 'latest-openeuler' +# for all enabled services to run on openEuler. +image: + tag: latest-openeuler + +tgi: + enabled: false +vllm: + image: + repository: openeuler/vllm-cpu + tag: 0.10.1-oe2403lts + enabled: true +llm-uservice: + image: + tag: latest-openeuler + TEXTGEN_BACKEND: vLLM + +tei: + image: + repository: openeuler/text-embeddings-inference-cpu + tag: 1.7.0-oe2403lts + +data-prep: + image: + tag: latest-openeuler + +retriever-usvc: + image: + tag: latest-openeuler + +embedding-usvc: + image: + tag: latest-openeuler + +codegen-ui: + image: + tag: latest-openeuler diff --git a/CodeGen/kubernetes/helm/cpu-tgi-openeuler-values.yaml b/CodeGen/kubernetes/helm/cpu-tgi-openeuler-values.yaml new file mode 100644 index 0000000000..42839003e0 --- /dev/null +++ b/CodeGen/kubernetes/helm/cpu-tgi-openeuler-values.yaml @@ -0,0 +1,42 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. +# SPDX-License-Identifier: Apache-2.0 + +# This file is based on cpu-values.yaml and overrides image tags to 'latest-openeuler' +# for all enabled services to run on openEuler. 
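+# Compared with cpu-openeuler-values.yaml, this profile enables TGI as the LLM serving backend and disables vLLM.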
+ +image: + tag: latest-openeuler + +tgi: + enabled: true + image: + repository: openeuler/text-generation-inference-cpu + tag: 2.4.0-oe2403lts + +vllm: + enabled: false +llm-uservice: + image: + tag: latest-openeuler + TEXTGEN_BACKEND: TGI + +tei: + image: + repository: openeuler/text-embeddings-inference-cpu + tag: 1.7.0-oe2403lts + +data-prep: + image: + tag: latest-openeuler + +retriever-usvc: + image: + tag: latest-openeuler + +embedding-usvc: + image: + tag: latest-openeuler + +codegen-ui: + image: + tag: latest-openeuler diff --git a/CodeGen/tests/test_compose_on_epyc.sh b/CodeGen/tests/test_compose_on_epyc.sh index efe3c25598..56dfb45b37 100644 --- a/CodeGen/tests/test_compose_on_epyc.sh +++ b/CodeGen/tests/test_compose_on_epyc.sh @@ -28,19 +28,8 @@ function build_docker_images() { docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &>/dev/null - VLLM_REQ_FILE="requirements/cpu.txt" - if ! grep -q "^transformers" "$VLLM_REQ_FILE"; then - echo "Adding transformers<4.54.0 to $VLLM_REQ_FILE" - echo "transformers<4.54.0" >>"$VLLM_REQ_FILE" - fi - cd ../ - echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="codegen codegen-gradio-ui llm-textgen vllm dataprep retriever embedding" + service_list="codegen codegen-ui llm-textgen dataprep retriever embedding" docker compose -f build.yaml build ${service_list} --no-cache >${LOG_PATH}/docker_image_build.log @@ -51,7 +40,7 @@ function build_docker_images() { function start_services() { local compose_file="$1" local llm_container_name="$2" - + export no_proxy="localhost,127.0.0.1,$ip_address" cd $WORKPATH/docker_compose/amd/cpu/epyc/ # Start Docker Containers @@ -170,47 +159,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - # npm install && npm ci && npx playwright install --with-deps - npm install && npm ci && npx playwright install - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - -function validate_gradio() { - local URL="http://${ip_address}:5173/health" - local HTTP_STATUS=$(curl "$URL") - local SERVICE_NAME="Gradio" - - if [ "$HTTP_STATUS" = '{"status":"ok"}' ]; then - echo "[ $SERVICE_NAME ] HTTP status is 200. UI server is running successfully..." - else - echo "[ $SERVICE_NAME ] UI server has failed..." 
- fi -} - function stop_docker() { local compose_file="$1" @@ -258,10 +206,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_gradio" - validate_gradio - echo "::endgroup::" - stop_docker "${docker_compose_files[${i}]}" sleep 5s done diff --git a/CodeGen/tests/test_compose_on_gaudi.sh b/CodeGen/tests/test_compose_on_gaudi.sh index 516624827f..88c2c9aeee 100644 --- a/CodeGen/tests/test_compose_on_gaudi.sh +++ b/CodeGen/tests/test_compose_on_gaudi.sh @@ -25,14 +25,8 @@ function build_docker_images() { docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - # Download Gaudi vllm of latest tag - git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork - VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0 - echo "Check out vLLM tag ${VLLM_FORK_VER}" - git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../ - echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="codegen codegen-gradio-ui llm-textgen vllm-gaudi dataprep retriever embedding" + service_list="codegen codegen-ui llm-textgen dataprep retriever embedding" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -41,11 +35,13 @@ function build_docker_images() { function start_services() { local compose_file="$1" local llm_container_name="$2" - + export no_proxy="localhost,127.0.0.1,$ip_address" cd $WORKPATH/docker_compose/intel/hpu/gaudi + # download grafana dashboard + bash grafana/dashboards/download_opea_dashboard.sh # Start Docker Containers - docker compose -f ${compose_file} up -d | tee ${LOG_PATH}/start_services_with_compose.log + docker compose -f ${compose_file} -f compose.monitoring.yaml up -d | tee ${LOG_PATH}/start_services_with_compose.log n=0 until [[ "$n" -ge 100 ]]; do @@ -152,51 +148,11 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - -function validate_gradio() { - local URL="http://${ip_address}:5173/health" - local HTTP_STATUS=$(curl "$URL") - local SERVICE_NAME="Gradio" - - if [ "$HTTP_STATUS" = '{"status":"ok"}' ]; then - echo "[ $SERVICE_NAME ] HTTP status is 200. UI server is running successfully..." - else - echo "[ $SERVICE_NAME ] UI server has failed..." 
- fi -} - function stop_docker() { local compose_file="$1" cd $WORKPATH/docker_compose/intel/hpu/gaudi - docker compose -f ${compose_file} down + docker compose -f ${compose_file} -f compose.monitoring.yaml down } function main() { @@ -240,10 +196,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_gradio" - validate_gradio - echo "::endgroup::" - stop_docker "${docker_compose_files[${i}]}" sleep 5s done diff --git a/CodeGen/tests/test_compose_on_rocm.sh b/CodeGen/tests/test_compose_on_rocm.sh index 173a0538fa..a0b9f5e024 100644 --- a/CodeGen/tests/test_compose_on_rocm.sh +++ b/CodeGen/tests/test_compose_on_rocm.sh @@ -111,35 +111,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniconda3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - - function stop_docker() { cd $WORKPATH/docker_compose/amd/gpu/rocm/ docker compose stop && docker compose rm -f @@ -167,10 +138,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/CodeGen/tests/test_compose_on_xeon.sh b/CodeGen/tests/test_compose_on_xeon.sh index 0b138b2235..678108c494 100644 --- a/CodeGen/tests/test_compose_on_xeon.sh +++ b/CodeGen/tests/test_compose_on_xeon.sh @@ -26,14 +26,8 @@ function build_docker_images() { docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &> /dev/null - cd ../ - echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
- service_list="codegen codegen-gradio-ui llm-textgen vllm dataprep retriever embedding" + service_list="codegen codegen-ui llm-textgen dataprep retriever embedding" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log @@ -44,11 +38,14 @@ function build_docker_images() { function start_services() { local compose_file="$1" local llm_container_name="$2" - + export no_proxy="localhost,127.0.0.1,$ip_address" cd $WORKPATH/docker_compose/intel/cpu/xeon/ + # download grafana dashboard + bash grafana/dashboards/download_opea_dashboard.sh + # Start Docker Containers - docker compose -f ${compose_file} up -d > ${LOG_PATH}/start_services_with_compose.log + docker compose -f ${compose_file} -f compose.monitoring.yaml up -d > ${LOG_PATH}/start_services_with_compose.log n=0 until [[ "$n" -ge 100 ]]; do @@ -163,51 +160,11 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - -function validate_gradio() { - local URL="http://${ip_address}:5173/health" - local HTTP_STATUS=$(curl "$URL") - local SERVICE_NAME="Gradio" - - if [ "$HTTP_STATUS" = '{"status":"ok"}' ]; then - echo "[ $SERVICE_NAME ] HTTP status is 200. UI server is running successfully..." - else - echo "[ $SERVICE_NAME ] UI server has failed..." - fi -} - function stop_docker() { local compose_file="$1" cd $WORKPATH/docker_compose/intel/cpu/xeon/ - docker compose -f ${compose_file} down + docker compose -f ${compose_file} -f compose.monitoring.yaml down } function main() { @@ -250,10 +207,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_gradio" - validate_gradio - echo "::endgroup::" - stop_docker "${docker_compose_files[${i}]}" sleep 5s done diff --git a/CodeGen/tests/test_compose_openeuler_on_xeon.sh b/CodeGen/tests/test_compose_openeuler_on_xeon.sh new file mode 100644 index 0000000000..b07dc99dcd --- /dev/null +++ b/CodeGen/tests/test_compose_openeuler_on_xeon.sh @@ -0,0 +1,214 @@ +#!/bin/bash +# Copyright (C) 2025 Huawei Technologies Co., Ltd. 
+# SPDX-License-Identifier: Apache-2.0 + +set -xe +IMAGE_REPO=${IMAGE_REPO:-"opea"} +IMAGE_TAG=${IMAGE_TAG:-"latest"} +echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" +echo "TAG=IMAGE_TAG=${IMAGE_TAG}" +export REGISTRY=${IMAGE_REPO} +export TAG=${IMAGE_TAG} +export MODEL_CACHE=${model_cache:-"./data"} + +WORKPATH=$(dirname "$PWD") +LOG_PATH="$WORKPATH/tests" +ip_address=$(hostname -I | awk '{print $1}') +source $WORKPATH/docker_compose/intel/set_env.sh + +function build_docker_images() { + opea_branch=${opea_branch:-"main"} + + cd $WORKPATH/docker_image_build + git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git + pushd GenAIComps + echo "GenAIComps test commit is $(git rev-parse HEAD)" + docker build --no-cache -t ${REGISTRY}/comps-base:${TAG}-openeuler --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile.openEuler . + popd && sleep 1s + + echo "Build all the images with --no-cache, check docker_image_build.log for details..." + service_list="codegen-openeuler codegen-gradio-ui-openeuler llm-textgen-openeuler dataprep-openeuler retriever-openeuler embedding-openeuler" + + docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log + + docker pull openeuler/text-generation-inference-cpu:2.4.0-oe2403lts + docker images && sleep 1s +} + +function start_services() { + local compose_file="$1" + local llm_container_name="$2" + export no_proxy="localhost,127.0.0.1,$ip_address" + cd $WORKPATH/docker_compose/intel/cpu/xeon/ + + # Start Docker Containers + docker compose -f ${compose_file} up -d > ${LOG_PATH}/start_services_with_compose.log + + n=0 + until [[ "$n" -ge 100 ]]; do + docker logs ${llm_container_name} > ${LOG_PATH}/llm_service_start.log 2>&1 + if grep -E "Connected|complete" ${LOG_PATH}/llm_service_start.log; then + break + fi + sleep 5s + n=$((n+1)) + done +} + +function validate_services() { + local URL="$1" + local EXPECTED_RESULT="$2" + local SERVICE_NAME="$3" + local DOCKER_NAME="$4" + local INPUT_DATA="$5" + + if [[ "$SERVICE_NAME" == "ingest" ]]; then + local HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" -X POST -F "$INPUT_DATA" -F index_name=test_redis -H 'Content-Type: multipart/form-data' "$URL") + + if [ "$HTTP_STATUS" -eq 200 ]; then + echo "[ $SERVICE_NAME ] HTTP status is 200. Data preparation succeeded..." + else + echo "[ $SERVICE_NAME ] Data preparation failed..." + fi + + else + local HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") + if [ "$HTTP_STATUS" -eq 200 ]; then + echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." + + local CONTENT=$(curl -s -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL" | tee ${LOG_PATH}/${SERVICE_NAME}.log) + + if echo "$CONTENT" | grep -q "$EXPECTED_RESULT"; then + echo "[ $SERVICE_NAME ] Content is as expected." + else + echo "[ $SERVICE_NAME ] Content does not match the expected result: $CONTENT" + docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log + exit 1 + fi + else + echo "[ $SERVICE_NAME ] HTTP status is not 200. 
Received status was $HTTP_STATUS" + docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log + exit 1 + fi + fi + sleep 5s +} + +function validate_microservices() { + local llm_container_name="$1" + + # tgi for llm service + validate_services \ + "${ip_address}:8028/v1/chat/completions" \ + "completion_tokens" \ + "llm-service" \ + "${llm_container_name}" \ + '{"model": "Qwen/Qwen2.5-Coder-7B-Instruct", "messages": [{"role": "user", "content": "What is Deep Learning?"}], "max_tokens": 256}' + + # llm microservice + validate_services \ + "${ip_address}:9000/v1/chat/completions" \ + "data: " \ + "llm" \ + "llm-textgen-server" \ + '{"query":"def print_hello_world():", "max_tokens": 256}' + + # Data ingest microservice + validate_services \ + "${ip_address}:6007/v1/dataprep/ingest" \ + "Data preparation succeeded" \ + "ingest" \ + "dataprep-redis-server" \ + 'link_list=["https://modin.readthedocs.io/en/latest/index.html"]' + +} + +function validate_megaservice() { + # Curl the Mega Service + validate_services \ + "${ip_address}:7778/v1/codegen" \ + "print" \ + "mega-codegen" \ + "codegen-xeon-backend-server" \ + '{"messages": "def print_hello_world():", "max_tokens": 256}' + + # Curl the Mega Service with stream as false + validate_services \ + "${ip_address}:7778/v1/codegen" \ + "" \ + "mega-codegen" \ + "codegen-xeon-backend-server" \ + '{ "messages": "def print_hello_world():", "max_tokens": 256, "stream": false}' + + # Curl the Mega Service with index_name and agents_flag + validate_services \ + "${ip_address}:7778/v1/codegen" \ + "" \ + "mega-codegen" \ + "codegen-xeon-backend-server" \ + '{ "index_name": "test_redis", "agents_flag": "True", "messages": "def print_hello_world():", "max_tokens": 256}' + + validate_services \ + "${ip_address}:7778/v1/codegen" \ + "class" \ + "mega-codegen" \ + "codegen-xeon-backend-server" \ + '{"model": "Qwen/Qwen2.5-Coder-7B-Instruct", "messages": [{"role": "user", "content": "Implement a basic Python class"}], "max_tokens":32}' + +} + +function stop_service() { + local compose_file="$1" + + cd $WORKPATH/docker_compose/intel/cpu/xeon/ + docker compose -f ${compose_file} down +} + +function main() { + # all docker docker compose files for Xeon Platform + docker_compose_files=("compose_openeuler.yaml") + docker_llm_container_names=( "vllm-server") + + # get number of compose files and LLM docker container names + len_compose_files=${#docker_compose_files[@]} + len_containers=${#docker_llm_container_names[@]} + + # number of compose files and docker container names must be matched + if [ ${len_compose_files} -ne ${len_containers} ]; then + echo "Error: number of docker compose files ${len_compose_files} and container names ${len_containers} mismatched" + exit 1 + fi + + # stop_service, stop all compose files + for ((i = 0; i < len_compose_files; i++)); do + stop_service "${docker_compose_files[${i}]}" + done + + # build docker images + if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi + + # loop all compose files + for ((i = 0; i < len_compose_files; i++)); do + echo "Process [${i}]: ${docker_compose_files[$i]}, ${docker_llm_container_names[${i}]}" + docker ps -a + + echo "::group::start_services" + start_services "${docker_compose_files[${i}]}" "${docker_llm_container_names[${i}]}" + echo "::endgroup::" + + echo "::group::validate_microservices" + validate_microservices "${docker_llm_container_names[${i}]}" + echo "::endgroup::" + + echo "::group::validate_megaservice" + validate_megaservice + echo "::endgroup::" + + stop_service 
"${docker_compose_files[${i}]}" + sleep 5s + done + + docker system prune -f +} + +main diff --git a/CodeGen/tests/test_compose_tgi_on_epyc.sh b/CodeGen/tests/test_compose_tgi_on_epyc.sh index 9476925d3f..347b322ccc 100644 --- a/CodeGen/tests/test_compose_tgi_on_epyc.sh +++ b/CodeGen/tests/test_compose_tgi_on_epyc.sh @@ -28,19 +28,8 @@ function build_docker_images() { docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &>/dev/null - VLLM_REQ_FILE="requirements/cpu.txt" - if ! grep -q "^transformers" "$VLLM_REQ_FILE"; then - echo "Adding transformers<4.54.0 to $VLLM_REQ_FILE" - echo "transformers<4.54.0" >>"$VLLM_REQ_FILE" - fi - cd ../ - echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="codegen codegen-gradio-ui llm-textgen vllm dataprep retriever embedding" + service_list="codegen codegen-ui llm-textgen dataprep retriever embedding" docker compose -f build.yaml build ${service_list} --no-cache >${LOG_PATH}/docker_image_build.log @@ -51,7 +40,7 @@ function build_docker_images() { function start_services() { local compose_file="$1" local llm_container_name="$2" - + export no_proxy="localhost,127.0.0.1,$ip_address" cd $WORKPATH/docker_compose/amd/cpu/epyc/ # Start Docker Containers @@ -170,47 +159,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - # npm install && npm ci && npx playwright install --with-deps - npm install && npm ci && npx playwright install - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - -function validate_gradio() { - local URL="http://${ip_address}:5173/health" - local HTTP_STATUS=$(curl "$URL") - local SERVICE_NAME="Gradio" - - if [ "$HTTP_STATUS" = '{"status":"ok"}' ]; then - echo "[ $SERVICE_NAME ] HTTP status is 200. UI server is running successfully..." - else - echo "[ $SERVICE_NAME ] UI server has failed..." - fi -} - function stop_docker() { local compose_file="$1" @@ -258,10 +206,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_gradio" - validate_gradio - echo "::endgroup::" - stop_docker "${docker_compose_files[${i}]}" sleep 5s done diff --git a/CodeGen/tests/test_compose_vllm_on_rocm.sh b/CodeGen/tests/test_compose_vllm_on_rocm.sh index 33fef0b279..053d8aeffb 100644 --- a/CodeGen/tests/test_compose_vllm_on_rocm.sh +++ b/CodeGen/tests/test_compose_vllm_on_rocm.sh @@ -110,35 +110,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniconda3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" 
- else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - - function stop_docker() { echo "OPENAI_API_KEY - ${OPENAI_API_KEY}" cd $WORKPATH/docker_compose/amd/gpu/rocm/ @@ -167,10 +138,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/CodeGen/tests/test_ui_on_xeon.sh b/CodeGen/tests/test_ui_on_xeon.sh new file mode 100644 index 0000000000..e83b6c4079 --- /dev/null +++ b/CodeGen/tests/test_ui_on_xeon.sh @@ -0,0 +1,193 @@ +#!/bin/bash +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +set -xe +IMAGE_REPO=${IMAGE_REPO:-"opea"} +IMAGE_TAG=${IMAGE_TAG:-"latest"} +echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" +echo "TAG=IMAGE_TAG=${IMAGE_TAG}" +export REGISTRY=${IMAGE_REPO} +export TAG=${IMAGE_TAG} +export MODEL_CACHE=${model_cache:-"./data"} + +WORKPATH=$(dirname "$PWD") +LOG_PATH="$WORKPATH/tests" +ip_address=$(hostname -I | awk '{print $1}') +source $WORKPATH/docker_compose/intel/set_env.sh + +function build_docker_images() { + opea_branch=${opea_branch:-"main"} + + cd $WORKPATH/docker_image_build + git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git + pushd GenAIComps + echo "GenAIComps test commit is $(git rev-parse HEAD)" + docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . + popd && sleep 1s + + echo "Build all the images with --no-cache, check docker_image_build.log for details..." + service_list="codegen codegen-ui llm-textgen dataprep retriever embedding" + + docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log + + docker pull ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu + docker images && sleep 1s +} + +function start_services() { + local compose_file="$1" + local llm_container_name="$2" + export no_proxy="localhost,127.0.0.1,$ip_address" + cd $WORKPATH/docker_compose/intel/cpu/xeon/ + + # Start Docker Containers + docker compose -f ${compose_file} up -d > ${LOG_PATH}/start_services_with_compose.log + + n=0 + until [[ "$n" -ge 200 ]]; do + docker logs ${llm_container_name} > ${LOG_PATH}/llm_service_start.log 2>&1 + if grep -E "Connected|complete|healthy" ${LOG_PATH}/llm_service_start.log; then + break + fi + sleep 5s + n=$((n+1)) + done +} + +function validate_frontend() { + cd $WORKPATH/ui/svelte + local conda_env_name="OPEA_e2e" + export PATH=${HOME}/miniforge3/bin/:$PATH + if conda info --envs | grep -q "$conda_env_name"; then + echo "$conda_env_name exist!" 
+ else + conda create -n ${conda_env_name} python=3.12 -y + fi + source activate ${conda_env_name} + + sed -i "s/localhost/$ip_address/g" playwright.config.ts + + conda install -c conda-forge nodejs=22.6.0 -y + npm install && npm ci && npx playwright install --with-deps + node -v && npm -v && pip list + + export no_proxy="localhost,127.0.0.1,$ip_address" + + # Wait for backend service to be ready + echo "Waiting for backend service to be ready..." + n=0 + until [[ "$n" -ge 60 ]]; do + HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" "http://${ip_address}:7778/v1/chatcompletions") + if [ "$HTTP_STATUS" = "200" ] || [ "$HTTP_STATUS" = "500" ]; then # 500 might be expected if model is loading + echo "Backend service is ready" + break + fi + echo "Waiting for backend service... (attempt $n/60), HTTP status: $HTTP_STATUS" + sleep 5s + n=$((n+1)) + done + + # Wait for UI service to be ready + echo "Waiting for UI service to be ready..." + n=0 + until [[ "$n" -ge 60 ]]; do + HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" "http://${ip_address}:5173/health") + if [ "$HTTP_STATUS" = "200" ]; then + echo "UI service is ready" + break + fi + echo "Waiting for UI service... (attempt $n/60), HTTP status: $HTTP_STATUS" + sleep 5s + n=$((n+1)) + done + + # Run tests with better logging + echo "Starting Playwright tests..." + exit_status=0 + npx playwright test --reporter=list > ${LOG_PATH}/frontend_test.log 2>&1 || exit_status=$? + + if [ $exit_status -ne 0 ]; then + echo "[TEST INFO]: ---------frontend test failed---------" + echo "Test logs:" + cat ${LOG_PATH}/frontend_test.log + exit $exit_status + else + echo "[TEST INFO]: ---------frontend test passed---------" + fi +} + +function validate_gradio() { + local URL="http://${ip_address}:5173/health" + local HTTP_STATUS=$(curl -s "$URL") + local SERVICE_NAME="CodeGen UI" + + if [ "$HTTP_STATUS" = '{"status":"ok"}' ] || [ "$HTTP_STATUS" = "200" ]; then + echo "[ $SERVICE_NAME ] HTTP status is 200. UI server is running successfully..." + else + echo "[ $SERVICE_NAME ] UI server health check failed. Response: $HTTP_STATUS" + fi +} + +function stop_docker() { + local compose_file="$1" + + cd $WORKPATH/docker_compose/intel/cpu/xeon/ + docker compose -f ${compose_file} down +} + +function main() { + # all docker docker compose files for Xeon Platform + docker_compose_files=("compose_tgi.yaml" "compose.yaml") + docker_llm_container_names=("tgi-server" "vllm-server") + + # get number of compose files and LLM docker container names + len_compose_files=${#docker_compose_files[@]} + len_containers=${#docker_llm_container_names[@]} + + # number of compose files and docker container names must be matched + if [ ${len_compose_files} -ne ${len_containers} ]; then + echo "Error: number of docker compose files ${len_compose_files} and container names ${len_containers} mismatched" + exit 1 + fi + + # stop_docker, stop all compose files + for ((i = 0; i < len_compose_files; i++)); do + stop_docker "${docker_compose_files[${i}]}" + done + + # build docker images + if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi + + # loop all compose files + for ((i = 0; i < len_compose_files; i++)); do + echo "Process [${i}]: ${docker_compose_files[$i]}, ${docker_llm_container_names[${i}]}" + docker ps -a + + echo "::group::start_services" + start_services "${docker_compose_files[${i}]}" "${docker_llm_container_names[${i}]}" + echo "::endgroup::" + + echo "::group::validate_ui" + validate_frontend + if [ $? 
-ne 0 ]; then + echo "Frontend validation failed, checking logs..." + if [ -f "${LOG_PATH}/frontend_test.log" ]; then + echo "Frontend test logs:" + cat "${LOG_PATH}/frontend_test.log" + fi + fi + echo "::endgroup::" + + echo "::group::validate_gradio" + validate_gradio + echo "::endgroup::" + + stop_docker "${docker_compose_files[${i}]}" + sleep 5s + done + + docker system prune -f +} + +main diff --git a/CodeGen/ui/docker/Dockerfile.gradio.openEuler b/CodeGen/ui/docker/Dockerfile.gradio.openEuler new file mode 100644 index 0000000000..a0605e33d2 --- /dev/null +++ b/CodeGen/ui/docker/Dockerfile.gradio.openEuler @@ -0,0 +1,30 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. +# SPDX-License-Identifier: Apache-2.0 + +FROM openeuler/python:3.11.13-oe2403lts@sha256:472759fb1852f35c9c0be20ff931aba6fbac1487175a0e46d6a73b6f6c33dd3c + +ENV LANG=C.UTF-8 + +ARG ARCH="cpu" + +RUN yum update -y && \ + yum install -y \ + gcc \ + g++ \ + make \ + java-21-openjdk \ + jemalloc-devel \ + ffmpeg \ + wget && \ + yum clean all && \ + rm -rf /var/cache/yum + +RUN mkdir -p /home/user + +COPY gradio /home/user/gradio + +RUN pip install --no-cache-dir --upgrade pip setuptools && \ +pip install --no-cache-dir -r /home/user/gradio/requirements.txt + +WORKDIR /home/user/gradio +ENTRYPOINT ["python", "codegen_ui_gradio.py"] diff --git a/CodeGen/ui/docker/Dockerfile.openEuler b/CodeGen/ui/docker/Dockerfile.openEuler new file mode 100644 index 0000000000..efa2cf2723 --- /dev/null +++ b/CodeGen/ui/docker/Dockerfile.openEuler @@ -0,0 +1,32 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. +# SPDX-License-Identifier: Apache-2.0 + +# Use node 20.11.1 as the base image + +FROM openeuler/node:20.11.1-oe2403lts@sha256:25c790f93c2243b361919620c069812319f614fd697e32e433402ae706a19ffd + +# Update package manager and install Git +RUN yum update -y && \ + yum install -y \ + git && \ + yum clean all && \ + rm -rf /var/cache/yum + +# Copy the front-end code repository +COPY svelte /home/user/svelte + +# Set the working directory +WORKDIR /home/user/svelte + +# Install front-end dependencies +RUN npm install --package-lock-only +RUN npm ci + +# Build the front-end application +RUN npm run build + +# Expose the port of the front-end application +EXPOSE 5173 + +# Run the front-end application in preview mode +CMD ["npm", "run", "preview", "--", "--port", "5173", "--host", "0.0.0.0"] diff --git a/CodeGen/ui/docker/Dockerfile.react.openEuler b/CodeGen/ui/docker/Dockerfile.react.openEuler new file mode 100644 index 0000000000..9cba915a56 --- /dev/null +++ b/CodeGen/ui/docker/Dockerfile.react.openEuler @@ -0,0 +1,21 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. 
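The new `test_ui_on_xeon.sh` above loops over both Xeon compose variants (TGI first, then vLLM), waits for the backend and UI health endpoints, and only then runs the Playwright suite, so it can double as a local smoke test. A minimal invocation sketch is below; the token value is a placeholder, and the script has to be launched from `CodeGen/tests` because it derives `WORKPATH` from its own working directory.

```bash
# Local run of the new CodeGen UI test (placeholder values are assumptions).
export HF_TOKEN=your_huggingface_token   # placeholder; needed by the model-serving containers
export IMAGE_REPO=opea                   # "opea" makes the script rebuild images with --no-cache
export IMAGE_TAG=latest

cd CodeGen/tests
bash test_ui_on_xeon.sh 2>&1 | tee local_ui_test.log
```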
+# SPDX-License-Identifier: Apache-2.0 + +# Use node 20.11.1 as the base image +FROM openeuler/node@sha256:25c790f93c2243b361919620c069812319f614fd697e32e433402ae706a19ffd as vite-app + +COPY react /usr/app/react +WORKDIR /usr/app/react + +RUN ["npm", "install", "--package-lock-only"] +RUN ["npm", "ci"] +RUN ["npm", "run", "build"] + + +FROM openeuler/nginx:1.29.0-oe2403lts@sha256:80dcb7274946ef6c0c5c6ccaac5c81b8ac9c4c7c49f1f0bf61d4d9371b165b18 + +COPY --from=vite-app /usr/app/react/dist /usr/share/nginx/html +COPY ./react/env.sh /docker-entrypoint.d/env.sh + +COPY ./react/nginx.conf /etc/nginx/conf.d/default.conf +RUN chmod +x /docker-entrypoint.d/env.sh diff --git a/CodeGen/ui/gradio/codegen_ui_gradio.py b/CodeGen/ui/gradio/codegen_ui_gradio.py index b84269a577..10207d1090 100644 --- a/CodeGen/ui/gradio/codegen_ui_gradio.py +++ b/CodeGen/ui/gradio/codegen_ui_gradio.py @@ -164,7 +164,13 @@ def generate_code(query, index=None, use_agent=False): def ingest_file(file, index=None, chunk_size=100, chunk_overlap=150): headers = {} - file_input = {"files": open(file, "rb")} + # Restrict file access to UPLOAD_ROOT directory + UPLOAD_ROOT = os.path.abspath("./") + normalized_path = os.path.normpath(os.path.join(UPLOAD_ROOT, file)) + # Ensure the constructed path is still within the upload root + if not normalized_path.startswith(UPLOAD_ROOT): + raise Exception("Access to the specified file is not allowed.") + file_input = {"files": open(normalized_path, "rb")} if index: data = {"index_name": index, "chunk_size": chunk_size, "chunk_overlap": chunk_overlap} diff --git a/CodeGen/ui/gradio/requirements.txt b/CodeGen/ui/gradio/requirements.txt index 2a4c8e1a30..14b3080e22 100644 --- a/CodeGen/ui/gradio/requirements.txt +++ b/CodeGen/ui/gradio/requirements.txt @@ -1,4 +1,4 @@ -gradio==5.22.0 +gradio>5.22.0,<=5.34.0 numpy==1.26.4 opencv-python==4.10.0.82 Pillow==10.3.0 diff --git a/CodeGen/ui/svelte/package.json b/CodeGen/ui/svelte/package.json index cb2f611c58..050bd5b351 100644 --- a/CodeGen/ui/svelte/package.json +++ b/CodeGen/ui/svelte/package.json @@ -18,7 +18,7 @@ "@fortawesome/free-solid-svg-icons": "6.2.0", "@playwright/test": "^1.45.2", "@sveltejs/adapter-auto": "^3.0.0", - "@sveltejs/kit": "2.0.0", + "@sveltejs/kit": "2.20.6", "@sveltejs/vite-plugin-svelte": "^3.0.0", "@tailwindcss/typography": "0.5.7", "@types/debug": "4.1.7", diff --git a/CodeGen/ui/svelte/src/lib/modules/chat/Output.svelte b/CodeGen/ui/svelte/src/lib/modules/chat/Output.svelte index 015375ad6f..5bf3012431 100644 --- a/CodeGen/ui/svelte/src/lib/modules/chat/Output.svelte +++ b/CodeGen/ui/svelte/src/lib/modules/chat/Output.svelte @@ -37,12 +37,24 @@ import bash from "svelte-highlight/languages/bash"; import sql from "svelte-highlight/languages/sql"; import { marked } from "marked"; - export let label = ""; + import { afterUpdate, onMount } from "svelte"; + export let output = ""; - export let languages = "Python"; + export let lang = "Python"; export let isCode = false; + export let md_output = ""; + export let segments: Segment[] = []; + let outputEl: HTMLDivElement; let copyText = "copy"; + let shouldAutoscroll = true; + + type Segment = { + id: number; + type: "text" | "code"; + content: string; + lang?: string; + }; const languagesTag = { Typescript: typescript, @@ -65,53 +77,194 @@ Lua: lua, Bash: bash, Sql: sql, - } as { [key: string]: any }; - - function copyToClipboard(text) { - const textArea = document.createElement("textarea"); - textArea.value = text; - document.body.appendChild(textArea); - textArea.select(); - 
document.execCommand("copy"); - document.body.removeChild(textArea); + } as const; + + type LangKey = keyof typeof languagesTag; + + const aliasMap: Record = { + javascript: "Javascript", + js: "Javascript", + jsx: "Javascript", + typescript: "Typescript", + ts: "Typescript", + tsx: "Typescript", + + python: "Python", + py: "Python", + + c: "C", + "c++": "Cpp", + cpp: "Cpp", + cxx: "Cpp", + csharp: "Csharp", + "c#": "Csharp", + + go: "Go", + golang: "Go", + java: "Java", + swift: "Swift", + ruby: "Ruby", + rust: "Rust", + php: "Php", + kotlin: "Kotlin", + objectivec: "Objectivec", + objc: "Objectivec", + "objective-c": "Objectivec", + perl: "Perl", + matlab: "Matlab", + r: "R", + lua: "Lua", + + bash: "Bash", + sh: "Bash", + shell: "Bash", + zsh: "Bash", + + sql: "Sql", + }; + + $: normalizedLangKey = (() => { + const raw = (lang ?? "").toString().trim(); + if (!raw) return null; + const lower = raw.toLowerCase(); + + if (lower in aliasMap) return aliasMap[lower]; + + const hit = (Object.keys(languagesTag) as LangKey[]).find( + (k) => k.toLowerCase() === lower + ); + return hit ?? null; + })(); + + $: fullText = buildFullText(); + + function atBottom(el: HTMLElement, threshold = 8) { + return el.scrollHeight - el.scrollTop - el.clientHeight <= threshold; + } + + function handleScroll() { + if (!outputEl) return; + shouldAutoscroll = atBottom(outputEl); } - function handelCopy() { - copyToClipboard(output); + function scrollToBottom() { + if (!outputEl) return; + requestAnimationFrame(() => + requestAnimationFrame(() => { + if (outputEl.scrollHeight) { + outputEl.scrollTop = outputEl.scrollHeight; + } + }) + ); + } + + onMount(() => { + scrollToBottom(); + }); + + afterUpdate(() => { + if (shouldAutoscroll) scrollToBottom(); + }); + async function copyAllFromDiv() { + await navigator.clipboard.writeText(outputEl.innerText); copyText = "copied!"; - setTimeout(() => { - copyText = "copy"; - }, 1000); + setTimeout(() => (copyText = "copy"), 1000); + } + + function copyToClipboard(text: string) { + if (navigator?.clipboard?.writeText) { + navigator.clipboard.writeText(text); + } else { + const textArea = document.createElement("textarea"); + textArea.value = text; + document.body.appendChild(textArea); + textArea.select(); + document.execCommand("copy"); + document.body.removeChild(textArea); + } + } + + function normalizeToKey(raw?: string | null) { + const s = (raw ?? "").trim().toLowerCase(); + if (!s) return null; + if (s in aliasMap) return aliasMap[s as keyof typeof aliasMap]; + const hit = ( + Object.keys(languagesTag) as (keyof typeof languagesTag)[] + ).find((k) => k.toLowerCase() === s); + return hit ?? null; + } + + function buildFullText(): string { + if (segments && segments.length > 0) { + return segments + .map((seg) => { + if (seg.type === "code") { + const key = normalizeToKey(seg.lang) ?? "text"; + return ["```" + key.toLowerCase(), seg.content, "```"].join("\n"); + } + return seg.content; + }) + .join("\n\n"); + } + + const parts: string[] = []; + if (isCode && output) { + const key = (normalizedLangKey ?? "text").toLowerCase(); + parts.push(["```" + key, output, "```"].join("\n")); + } + if (md_output) { + parts.push(md_output); + } + return parts.join("\n\n"); }
- {label} -
{copyText}
+
- {#if isCode} - - - + {#if segments && segments.length > 0} + {#each segments as seg (seg.id)} + {#if seg.type === "code"} +
+ + + +
+ {:else} +
{@html marked(seg.content)}
+ {/if} + {/each} {:else} -
- {@html marked(output)} -
+ {#if isCode && output} + + + + {/if} + {#if md_output} +
+ {@html marked(md_output)} +
+ {/if} {/if}
@@ -120,17 +273,8 @@ .hiddenScroll::-webkit-scrollbar { display: none; } - .hiddenScroll { -ms-overflow-style: none; /* IE and Edge */ scrollbar-width: none; /* Firefox */ } - - .code-format-style { - resize: none; - font-size: 16px; - border: solid rgba(128, 0, 128, 0) 4px; - box-shadow: 0 0 8px rgba(0, 0, 0, 0.19); - transition: 0.1s linear; - } diff --git a/CodeGen/ui/svelte/src/routes/+page.svelte b/CodeGen/ui/svelte/src/routes/+page.svelte index 0e7d43beaf..d927ea9322 100644 --- a/CodeGen/ui/svelte/src/routes/+page.svelte +++ b/CodeGen/ui/svelte/src/routes/+page.svelte @@ -23,38 +23,196 @@ import PaperAirplane from "$lib/assets/chat/svelte/PaperAirplane.svelte"; import Output from "$lib/modules/chat/Output.svelte"; - let code_output: string = ""; let query: string = ""; let loading: boolean = false; - let deleteFlag: boolean = false; + let inFence = false; + let tickRun = 0; + let skipLangLine = false; + let langBuf = ""; + let currentLang = ""; + + type Segment = { + id: number; + type: "text" | "code"; + content: string; + lang?: string; + }; + let segments: Segment[] = []; + let _sid = 0; + + const languageAliases: Record = { + javascript: "Javascript", + js: "Javascript", + jsx: "Javascript", + typescript: "Typescript", + ts: "Typescript", + tsx: "Typescript", + + python: "Python", + py: "Python", + + c: "C", + "c++": "Cpp", + cpp: "Cpp", + cxx: "Cpp", + csharp: "Csharp", + "c#": "Csharp", + + go: "Go", + golang: "Go", + java: "Java", + swift: "Swift", + ruby: "Ruby", + rust: "Rust", + php: "Php", + kotlin: "Kotlin", + objectivec: "Objectivec", + objc: "Objectivec", + "objective-c": "Objectivec", + perl: "Perl", + matlab: "Matlab", + r: "R", + lua: "Lua", + + bash: "Bash", + sh: "Bash", + shell: "Bash", + zsh: "Bash", + + sql: "Sql", + }; + + function canonicalLang(raw?: string | null): string | null { + const s = (raw ?? "").toString().trim(); + if (!s) return null; + const lower = s.toLowerCase(); + return languageAliases[lower] ?? s; + } + + function appendText(s: string) { + if (!s) return; + const last = segments[segments.length - 1]; + if (!last || last.type !== "text") { + segments = [...segments, { id: ++_sid, type: "text", content: "" }]; + } + segments[segments.length - 1].content += s; + } + + function appendCode(s: string) { + if (!s) return; + const last = segments[segments.length - 1]; + if (!last || last.type !== "code") { + segments = [ + ...segments, + { + id: ++_sid, + type: "code", + content: "", + lang: currentLang || "python", + }, + ]; + } + segments[segments.length - 1].content += s; + } + + function settleTicks() { + if (tickRun === 0) return; + + if (tickRun >= 3) { + const toggles = Math.floor(tickRun / 3); + for (let i = 0; i < toggles; i++) { + inFence = !inFence; + if (inFence) { + skipLangLine = true; + langBuf = ""; + currentLang = ""; + } else { + skipLangLine = false; + } + } + const leftovers = tickRun % 3; + if (leftovers) (inFence ? appendCode : appendText)("`".repeat(leftovers)); + } else { + (inFence ? appendCode : appendText)("`".repeat(tickRun)); + } + tickRun = 0; + } + + function consumeChunk(s: string) { + for (let i = 0; i < s.length; i++) { + const ch = s[i]; + + if (ch === "`") { + tickRun++; + continue; + } + + settleTicks(); + + if (skipLangLine) { + if (ch === "\n") { + skipLangLine = false; + const canon = canonicalLang(langBuf); + currentLang = canon ?? 
(langBuf.trim() || "python"); + langBuf = ""; + } else { + langBuf += ch; + } + continue; + } + + if (inFence) appendCode(ch); + else appendText(ch); + } + } const callTextStream = async (query: string) => { loading = true; - code_output = ""; + + segments = []; + _sid = 0; + inFence = false; + tickRun = 0; + skipLangLine = false; + langBuf = ""; + currentLang = ""; + const eventSource = await fetchTextStream(query); eventSource.addEventListener("message", (e: any) => { - let res = e.data; + const raw = String(e.data); + const payloads = raw + .split(/\r?\n/) + .map((l) => l.replace(/^data:\s*/, "").trim()) + .filter((l) => l.length > 0); - if (res === "[DONE]") { - deleteFlag = false; - loading = false; - query = ''; - } else { - let Msg = JSON.parse(res).choices[0].text; - if (Msg.includes("'''")) { - deleteFlag = true; - } else if (deleteFlag && Msg.includes("\\n")) { - deleteFlag = false; - } else if (Msg !== "" && !deleteFlag) { - code_output += Msg.replace(/\\n/g, "\n"); - } + for (const part of payloads) { + if (part === "[DONE]") { + settleTicks(); + loading = false; + return; } + try { + const json = JSON.parse(part); + const msg = + json.choices?.[0]?.delta?.content ?? json.choices?.[0]?.text ?? ""; + if (!msg || msg === "") continue; + consumeChunk(msg); + } catch (err) { + console.error("JSON chunk parse error:", err, part); + } + } + }); + + eventSource.addEventListener("error", () => { + loading = false; }); + eventSource.stream(); }; const handleTextSubmit = async () => { + if (!query) return; await callTextStream(query); }; @@ -62,48 +220,47 @@
-
-
-
- +
+
+ { - if (event.key === "Enter" && !event.shiftKey && query) { - event.preventDefault(); - handleTextSubmit(); - } - }} - /> - -
+ type="text" + data-testid="code-input" + placeholder="Enter prompt here" + disabled={loading} + maxlength="1200" + bind:value={query} + on:keydown={(event) => { + if (event.key === "Enter" && !event.shiftKey && query) { + event.preventDefault(); + handleTextSubmit(); + } + }} + /> + +
- {#if code_output !== ""} -
- -
+ {#if segments.length} +
+ +
{/if} {#if loading} diff --git a/CodeGen/ui/svelte/tests/codeGen.spec.ts b/CodeGen/ui/svelte/tests/codeGen.spec.ts index 751dd92b57..5c3de2789e 100644 --- a/CodeGen/ui/svelte/tests/codeGen.spec.ts +++ b/CodeGen/ui/svelte/tests/codeGen.spec.ts @@ -18,8 +18,12 @@ async function enterMessageToChat(page: Page, message: string) { await page.getByTestId("code-input").click(); await page.getByTestId("code-input").fill(message); await page.getByTestId("code-input").press("Enter"); - await page.waitForTimeout(10000); - await expect(page.getByTestId("code-output")).toContainText("copy"); + + // Wait for the output container to appear first + await expect(page.getByTestId("code-output")).toBeVisible({ timeout: 30000 }); + + // Wait for content to be loaded and copy button to appear + await expect(page.getByTestId("code-output")).toContainText("copy", { timeout: 30000 }); } // Test description: New Code Gen diff --git a/CodeTrans/Dockerfile.openEuler b/CodeTrans/Dockerfile.openEuler new file mode 100644 index 0000000000..9f62fe3280 --- /dev/null +++ b/CodeTrans/Dockerfile.openEuler @@ -0,0 +1,10 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. +# SPDX-License-Identifier: Apache-2.0 + +ARG IMAGE_REPO=opea +ARG BASE_TAG=latest +FROM $IMAGE_REPO/comps-base:$BASE_TAG-openeuler + +COPY ./code_translation.py $HOME/code_translation.py + +ENTRYPOINT ["python", "code_translation.py"] diff --git a/CodeTrans/docker_compose/amd/cpu/epyc/compose.yaml b/CodeTrans/docker_compose/amd/cpu/epyc/compose.yaml index 3b499de95b..d1b539e5f4 100644 --- a/CodeTrans/docker_compose/amd/cpu/epyc/compose.yaml +++ b/CodeTrans/docker_compose/amd/cpu/epyc/compose.yaml @@ -4,7 +4,7 @@ services: vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: codetrans-epyc-vllm-service ports: - "8008:80" diff --git a/CodeTrans/docker_compose/intel/cpu/xeon/README.md b/CodeTrans/docker_compose/intel/cpu/xeon/README.md index 131f03a999..43e76c8e6c 100755 --- a/CodeTrans/docker_compose/intel/cpu/xeon/README.md +++ b/CodeTrans/docker_compose/intel/cpu/xeon/README.md @@ -54,6 +54,8 @@ Consult the section on [CodeTrans Service configuration](#codetrans-configuratio ### Deploy the Services Using Docker Compose +#### Option #1 + To deploy the CodeTrans services, execute the `docker compose up` command with the appropriate arguments. For a default deployment, execute the command below. It uses the 'compose.yaml' file. ```bash @@ -61,6 +63,19 @@ cd cpu/xeon docker compose -f compose.yaml up -d ``` +#### Option #2 + +> NOTE : To enable monitoring, `compose.monitoring.yaml` file need to be merged along with default `compose.yaml` file. + +To deploy with monitoring: + +```bash +cd cpu/xeon/ +# download grafana dashboard +bash grafana/dashboards/download_opea_dashboard.sh +docker compose -f compose.yaml -f compose.monitoring.yaml up -d +``` + > **Note**: developers should build docker image from source when: > > - Developing off the git main branch (as the container's ports in the repo may be different > from the published docker image). 
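Once the merged monitoring deployment is up, it is worth confirming that the monitoring services actually respond before opening Grafana. A quick probe sketch, assuming the default host ports from `compose.monitoring.yaml` (Prometheus on 9090, Grafana on 3000, node-exporter on 9100):

```bash
#!/bin/bash
# Health probes for the optional monitoring stack (default ports assumed).
host_ip=${host_ip:-localhost}

# Prometheus liveness plus a summary of its scrape-target health
curl -sf "http://${host_ip}:9090/-/healthy" && echo
curl -s  "http://${host_ip}:9090/api/v1/targets" | grep -o '"health":"[a-z]*"' | sort | uniq -c

# Grafana API health (the compose file sets the admin password to "admin")
curl -sf "http://${host_ip}:3000/api/health" && echo

# Node exporter metrics endpoint
curl -sf "http://${host_ip}:9100/metrics" | head -n 3
```

A target reported as `"health":"down"` usually means the job name in `prometheus.yaml` does not match the corresponding container name in the compose files.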
@@ -117,6 +132,15 @@ To stop the containers associated with the deployment, execute the following com docker compose -f compose.yaml down ``` +If monitoring is enabled, execute the following command: + +```bash +cd cpu/xeon/ +# download grafana dashboard +bash grafana/dashboards/download_opea_dashboard.sh +docker compose -f compose.yaml -f compose.monitoring.yaml down +``` + ## Configuration Parameters Key parameters are configured via environment variables set before running `docker compose up`. @@ -137,11 +161,12 @@ Key parameters are configured via environment variables set before running `dock In the context of deploying a CodeTrans pipeline on an Intel® Xeon® platform, we can pick and choose different large language model serving frameworks. The table below outlines the various configurations that are available as part of the application. These configurations can be used as templates and can be extended to different components available in [GenAIComps](https://github.com/opea-project/GenAIComps.git). -| File | Description | -| -------------------------------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | -| [compose.yaml](./compose.yaml) | Default compose file using vllm as serving framework and redis as vector database. | -| [compose_tgi.yaml](./compose_tgi.yaml) | The LLM serving framework is TGI. All other configurations remain the same as the default. | -| [compose_remote.yaml](./compose_remote.yaml) | The LLM used is hosted on a remote server and an endpoint is used to access this model. vLLM is the serving framework. Additional environment variables need to be set before running. See [instructions](#running-llm-models-with-remote-endpoints) below. | +| File | Description | +| ---------------------------------------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | +| [compose.yaml](./compose.yaml) | Default compose file using vllm as serving framework and redis as vector database. | +| [compose_tgi.yaml](./compose_tgi.yaml) | The LLM serving framework is TGI. All other configurations remain the same as the default. | +| [compose_remote.yaml](./compose_remote.yaml) | The LLM used is hosted on a remote server and an endpoint is used to access this model. vLLM is the serving framework. Additional environment variables need to be set before running. See [instructions](#running-llm-models-with-remote-endpoints) below. | +| [compose.monitoring.yaml](./compose.monitoring.yaml) | Helper file for monitoring features. 
Can be used along with any compose files | ### Running LLM models with remote endpoints diff --git a/CodeTrans/docker_compose/intel/cpu/xeon/compose.monitoring.yaml b/CodeTrans/docker_compose/intel/cpu/xeon/compose.monitoring.yaml new file mode 100644 index 0000000000..dea34085b3 --- /dev/null +++ b/CodeTrans/docker_compose/intel/cpu/xeon/compose.monitoring.yaml @@ -0,0 +1,58 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +services: + prometheus: + image: prom/prometheus:v2.52.0 + container_name: opea_prometheus + user: root + volumes: + - ./prometheus.yaml:/etc/prometheus/prometheus.yaml + - ./prometheus_data:/prometheus + command: + - '--config.file=/etc/prometheus/prometheus.yaml' + ports: + - '9090:9090' + ipc: host + restart: unless-stopped + + grafana: + image: grafana/grafana:11.0.0 + container_name: grafana + volumes: + - ./grafana_data:/var/lib/grafana + - ./grafana/dashboards:/var/lib/grafana/dashboards + - ./grafana/provisioning:/etc/grafana/provisioning + user: root + environment: + GF_SECURITY_ADMIN_PASSWORD: admin + GF_RENDERING_CALLBACK_URL: http://grafana:3000/ + GF_LOG_FILTERS: rendering:debug + no_proxy: ${no_proxy} + host_ip: ${host_ip} + depends_on: + - prometheus + ports: + - '3000:3000' + ipc: host + restart: unless-stopped + + node-exporter: + image: prom/node-exporter + container_name: node-exporter + volumes: + - /proc:/host/proc:ro + - /sys:/host/sys:ro + - /:/rootfs:ro + command: + - '--path.procfs=/host/proc' + - '--path.sysfs=/host/sys' + - --collector.filesystem.ignored-mount-points + - "^/(sys|proc|dev|host|etc|rootfs/var/lib/docker/containers|rootfs/var/lib/docker/overlay2|rootfs/run/docker/netns|rootfs/var/lib/docker/aufs)($$|/)" + environment: + no_proxy: ${no_proxy} + ports: + - 9100:9100 + restart: always + deploy: + mode: global diff --git a/CodeTrans/docker_compose/intel/cpu/xeon/compose.yaml b/CodeTrans/docker_compose/intel/cpu/xeon/compose.yaml index f950c770ec..4e4464f220 100644 --- a/CodeTrans/docker_compose/intel/cpu/xeon/compose.yaml +++ b/CodeTrans/docker_compose/intel/cpu/xeon/compose.yaml @@ -3,7 +3,7 @@ services: vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: codetrans-xeon-vllm-service ports: - "8008:80" diff --git a/CodeTrans/docker_compose/intel/cpu/xeon/compose_openeuler.yaml b/CodeTrans/docker_compose/intel/cpu/xeon/compose_openeuler.yaml new file mode 100644 index 0000000000..4fa6f9f5c3 --- /dev/null +++ b/CodeTrans/docker_compose/intel/cpu/xeon/compose_openeuler.yaml @@ -0,0 +1,96 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. 
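Because the CPU compose files now point at the published vLLM CPU image instead of a locally built `opea/vllm` image, the model server no longer has to be compiled as part of a deployment; the image can be pre-pulled, and the same endpoint the compose healthcheck uses can be polled once the stack is started. A small sketch, assuming the default host port 8008:

```bash
# Pre-pull the prebuilt vLLM CPU image referenced by the updated compose files
docker pull public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1

# After `docker compose up -d`, wait on the same /health endpoint the healthcheck probes
host_ip=${host_ip:-localhost}
until curl -sf "http://${host_ip}:8008/health" >/dev/null; do
  echo "waiting for vllm-service..."
  sleep 10
done
echo "vllm-service is healthy"
```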
+# SPDX-License-Identifier: Apache-2.0 + +services: + vllm-service: + image: openeuler/vllm-cpu:0.10.1-oe2403lts + container_name: codetrans-xeon-vllm-service + ports: + - "8008:80" + volumes: + - "${MODEL_CACHE:-./data}:/root/.cache/huggingface/hub" + shm_size: 1g + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + HF_TOKEN: ${HF_TOKEN} + LLM_MODEL_ID: ${LLM_MODEL_ID} + VLLM_TORCH_PROFILER_DIR: "/mnt" + healthcheck: + test: ["CMD-SHELL", "curl -f http://$host_ip:8008/health || exit 1"] + interval: 10s + timeout: 10s + retries: 100 + command: --model $LLM_MODEL_ID --host 0.0.0.0 --port 80 + llm: + image: ${REGISTRY:-opea}/llm-textgen:${TAG:-latest}-openeuler + container_name: codetrans-xeon-llm-server + depends_on: + vllm-service: + condition: service_healthy + ports: + - "9000:9000" + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + LLM_ENDPOINT: ${LLM_ENDPOINT} + LLM_MODEL_ID: ${LLM_MODEL_ID} + LLM_COMPONENT_NAME: ${LLM_COMPONENT_NAME} + HF_TOKEN: ${HF_TOKEN} + restart: unless-stopped + codetrans-xeon-backend-server: + image: ${REGISTRY:-opea}/codetrans:${TAG:-latest}-openeuler + container_name: codetrans-xeon-backend-server + depends_on: + - vllm-service + - llm + ports: + - "${BACKEND_SERVICE_PORT:-7777}:7777" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} + - LLM_SERVICE_HOST_IP=${LLM_SERVICE_HOST_IP} + ipc: host + restart: always + codetrans-xeon-ui-server: + image: ${REGISTRY:-opea}/codetrans-ui:${TAG:-latest}-openeuler + container_name: codetrans-xeon-ui-server + depends_on: + - codetrans-xeon-backend-server + ports: + - "${FRONTEND_SERVICE_PORT:-5173}:5173" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - BASE_URL=${BACKEND_SERVICE_ENDPOINT} + ipc: host + restart: always + codetrans-xeon-nginx-server: + image: ${REGISTRY:-opea}/nginx:${TAG:-latest}-openeuler + container_name: codetrans-xeon-nginx-server + depends_on: + - codetrans-xeon-backend-server + - codetrans-xeon-ui-server + ports: + - "${NGINX_PORT:-80}:80" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - FRONTEND_SERVICE_IP=${FRONTEND_SERVICE_IP} + - FRONTEND_SERVICE_PORT=${FRONTEND_SERVICE_PORT} + - BACKEND_SERVICE_NAME=${BACKEND_SERVICE_NAME} + - BACKEND_SERVICE_IP=${BACKEND_SERVICE_IP} + - BACKEND_SERVICE_PORT=${BACKEND_SERVICE_PORT} + ipc: host + restart: always + +networks: + default: + driver: bridge diff --git a/CodeTrans/docker_compose/intel/cpu/xeon/compose_tgi_openeuler.yaml b/CodeTrans/docker_compose/intel/cpu/xeon/compose_tgi_openeuler.yaml new file mode 100644 index 0000000000..2806472fc9 --- /dev/null +++ b/CodeTrans/docker_compose/intel/cpu/xeon/compose_tgi_openeuler.yaml @@ -0,0 +1,95 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. 
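The openEuler variant above keeps the service topology and environment variables of the default Xeon deployment and only swaps in `-openeuler`-suffixed images, so bringing it up follows the usual flow; the new `test_compose_openeuler_on_xeon.sh` later in this patch automates the full build-and-test cycle. A condensed manual sketch, assuming the `*-openeuler` images have already been built:

```bash
# Assumes the *-openeuler images already exist locally or in your registry.
cd CodeTrans/docker_compose/intel
export HF_TOKEN=your_huggingface_token   # placeholder
source set_env.sh

cd cpu/xeon
docker compose -f compose_openeuler.yaml up -d

# Check the same readiness marker the test script greps for
docker logs codetrans-xeon-vllm-service 2>&1 | grep -q complete && echo "model server ready"
```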
+# SPDX-License-Identifier: Apache-2.0 + +services: + tgi-service: + image: openeuler/text-generation-inference-cpu:2.4.0-oe2403lts + container_name: codetrans-xeon-tgi-service + ports: + - "8008:80" + volumes: + - "${MODEL_CACHE}:/data" + shm_size: 1g + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + HF_TOKEN: ${HF_TOKEN} + host_ip: ${host_ip} + healthcheck: + test: ["CMD-SHELL", "curl -f http://$host_ip:8008/health || exit 1"] + interval: 10s + timeout: 10s + retries: 100 + command: --model-id ${LLM_MODEL_ID} --cuda-graphs 0 + llm: + image: ${REGISTRY:-opea}/llm-textgen:${TAG:-latest}-openeuler + container_name: codetrans-xeon-llm-server + depends_on: + tgi-service: + condition: service_healthy + ports: + - "9000:9000" + ipc: host + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + LLM_ENDPOINT: ${LLM_ENDPOINT} + LLM_MODEL_ID: ${LLM_MODEL_ID} + LLM_COMPONENT_NAME: ${LLM_COMPONENT_NAME} + HF_TOKEN: ${HF_TOKEN} + restart: unless-stopped + codetrans-xeon-backend-server: + image: ${REGISTRY:-opea}/codetrans:${TAG:-latest}-openeuler + container_name: codetrans-xeon-backend-server + depends_on: + - tgi-service + - llm + ports: + - "${BACKEND_SERVICE_PORT:-7777}:7777" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} + - LLM_SERVICE_HOST_IP=${LLM_SERVICE_HOST_IP} + ipc: host + restart: always + codetrans-xeon-ui-server: + image: ${REGISTRY:-opea}/codetrans-ui:${TAG:-latest}-openeuler + container_name: codetrans-xeon-ui-server + depends_on: + - codetrans-xeon-backend-server + ports: + - "${FRONTEND_SERVICE_PORT:-5173}:5173" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - BASE_URL=${BACKEND_SERVICE_ENDPOINT} + ipc: host + restart: always + codetrans-xeon-nginx-server: + image: ${REGISTRY:-opea}/nginx:${TAG:-latest}-openeuler + container_name: codetrans-xeon-nginx-server + depends_on: + - codetrans-xeon-backend-server + - codetrans-xeon-ui-server + ports: + - "${NGINX_PORT:-80}:80" + environment: + - no_proxy=${no_proxy} + - https_proxy=${https_proxy} + - http_proxy=${http_proxy} + - FRONTEND_SERVICE_IP=${FRONTEND_SERVICE_IP} + - FRONTEND_SERVICE_PORT=${FRONTEND_SERVICE_PORT} + - BACKEND_SERVICE_NAME=${BACKEND_SERVICE_NAME} + - BACKEND_SERVICE_IP=${BACKEND_SERVICE_IP} + - BACKEND_SERVICE_PORT=${BACKEND_SERVICE_PORT} + ipc: host + restart: always + +networks: + default: + driver: bridge diff --git a/CodeTrans/docker_compose/intel/cpu/xeon/grafana/dashboards/download_opea_dashboard.sh b/CodeTrans/docker_compose/intel/cpu/xeon/grafana/dashboards/download_opea_dashboard.sh new file mode 100644 index 0000000000..47d4f84587 --- /dev/null +++ b/CodeTrans/docker_compose/intel/cpu/xeon/grafana/dashboards/download_opea_dashboard.sh @@ -0,0 +1,13 @@ +#!/bin/bash +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)" +cd "$SCRIPT_DIR" +if ls *.json 1> /dev/null 2>&1; then + rm *.json +fi + +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/vllm_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/tgi_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/codetrans_megaservice_grafana.json +wget 
https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/node_grafana.json diff --git a/CodeTrans/docker_compose/intel/cpu/xeon/grafana/provisioning/dashboards/local.yaml b/CodeTrans/docker_compose/intel/cpu/xeon/grafana/provisioning/dashboards/local.yaml new file mode 100644 index 0000000000..13922a769b --- /dev/null +++ b/CodeTrans/docker_compose/intel/cpu/xeon/grafana/provisioning/dashboards/local.yaml @@ -0,0 +1,14 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +apiVersion: 1 + +providers: +- name: 'default' + orgId: 1 + folder: '' + type: file + disableDeletion: false + updateIntervalSeconds: 10 #how often Grafana will scan for changed dashboards + options: + path: /var/lib/grafana/dashboards diff --git a/CodeTrans/docker_compose/intel/cpu/xeon/grafana/provisioning/datasources/datasource.yml b/CodeTrans/docker_compose/intel/cpu/xeon/grafana/provisioning/datasources/datasource.yml new file mode 100644 index 0000000000..a206521d67 --- /dev/null +++ b/CodeTrans/docker_compose/intel/cpu/xeon/grafana/provisioning/datasources/datasource.yml @@ -0,0 +1,54 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +# config file version +apiVersion: 1 + +# list of datasources that should be deleted from the database +deleteDatasources: + - name: Prometheus + orgId: 1 + +# list of datasources to insert/update depending +# what's available in the database +datasources: + # name of the datasource. Required +- name: Prometheus + # datasource type. Required + type: prometheus + # access mode. direct or proxy. Required + access: proxy + # org id. will default to orgId 1 if not specified + orgId: 1 + # url + url: http://$host_ip:9090 + # database password, if used + password: + # database user, if used + user: + # database name, if used + database: + # enable/disable basic auth + basicAuth: false + # basic auth username, if used + basicAuthUser: + # basic auth password, if used + basicAuthPassword: + # enable/disable with credentials headers + withCredentials: + # mark as default datasource. Max one per org + isDefault: true + # fields that will be converted to json and stored in json_data + jsonData: + httpMethod: GET + graphiteVersion: "1.1" + tlsAuth: false + tlsAuthWithCACert: false + # json object of data that will be encrypted. + secureJsonData: + tlsCACert: "..." + tlsClientCert: "..." + tlsClientKey: "..." + version: 1 + # allow users to edit datasources from the UI. 
+ editable: true diff --git a/CodeTrans/docker_compose/intel/cpu/xeon/prometheus.yaml b/CodeTrans/docker_compose/intel/cpu/xeon/prometheus.yaml new file mode 100644 index 0000000000..57bbf6e0db --- /dev/null +++ b/CodeTrans/docker_compose/intel/cpu/xeon/prometheus.yaml @@ -0,0 +1,23 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +# [IP_ADDR]:{PORT_OUTSIDE_CONTAINER} -> {PORT_INSIDE_CONTAINER} / {PROTOCOL} +global: + scrape_interval: 5s + external_labels: + monitor: "my-monitor" +scrape_configs: + - job_name: "prometheus" + static_configs: + - targets: ["opea_prometheus:9090"] + - job_name: "vllm" + metrics_path: /metrics + static_configs: + - targets: ["codetrans-xeon-vllm-service:80"] + - job_name: "codetrans-backend-server" + metrics_path: /metrics + static_configs: + - targets: ["codetrans-xeon-backend-server:7777"] + - job_name: "prometheus-node-exporter" + metrics_path: /metrics + static_configs: + - targets: ["node-exporter:9100"] diff --git a/CodeTrans/docker_compose/intel/hpu/gaudi/README.md b/CodeTrans/docker_compose/intel/hpu/gaudi/README.md index 2597e1aeb6..830e9f7a7c 100755 --- a/CodeTrans/docker_compose/intel/hpu/gaudi/README.md +++ b/CodeTrans/docker_compose/intel/hpu/gaudi/README.md @@ -54,6 +54,8 @@ Consult the section on [CodeTrans Service configuration](#codetrans-configuratio ### Deploy the Services Using Docker Compose +#### Option #1 + To deploy the CodeTrans services, execute the `docker compose up` command with the appropriate arguments. For a default deployment, execute the command below. It uses the 'compose.yaml' file. ```bash @@ -61,6 +63,19 @@ cd hpu/gaudi docker compose -f compose.yaml up -d ``` +#### Option #2 + +> NOTE : To enable monitoring, `compose.monitoring.yaml` file need to be merged along with default `compose.yaml` file. + +To deploy with monitoring: + +```bash +cd hpu/gaudi/ +# download grafana dashboard +bash grafana/dashboards/download_opea_dashboard.sh +docker compose -f compose.yaml -f compose.monitoring.yaml up -d +``` + > **Note**: developers should build docker image from source when: > > - Developing off the git main branch (as the container's ports in the repo may be different > from the published docker image). @@ -117,6 +132,15 @@ To stop the containers associated with the deployment, execute the following com docker compose -f compose.yaml down ``` +If monitoring is enabled, execute the following command: + +```bash +cd hpu/gaudi/ +# download grafana dashboard +bash grafana/dashboards/download_opea_dashboard.sh +docker compose -f compose.yaml -f compose.monitoring.yaml down +``` + ## Configuration Parameters Key parameters are configured via environment variables set before running `docker compose up`. 
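On Gaudi, the monitoring overlay shown next adds a `gaudi-metrics-exporter` on port 41611 alongside the Prometheus/Grafana/node-exporter trio, so after `docker compose -f compose.yaml -f compose.monitoring.yaml up -d` it is useful to confirm that HPU metrics are actually being scraped. A small verification sketch, assuming the default ports from the Gaudi monitoring and Prometheus configs:

```bash
#!/bin/bash
# Verify the Gaudi-specific monitoring targets (default ports assumed).
host_ip=${host_ip:-localhost}

# HPU metrics straight from the exporter
curl -sf "http://${host_ip}:41611/metrics" | head -n 5

# Ask Prometheus which scrape pools it sees and whether they are up
curl -s "http://${host_ip}:9090/api/v1/targets" \
  | tr ',' '\n' \
  | grep -E '"scrapePool"|"health"'
```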
diff --git a/CodeTrans/docker_compose/intel/hpu/gaudi/compose.monitoring.yaml b/CodeTrans/docker_compose/intel/hpu/gaudi/compose.monitoring.yaml new file mode 100644 index 0000000000..691671e656 --- /dev/null +++ b/CodeTrans/docker_compose/intel/hpu/gaudi/compose.monitoring.yaml @@ -0,0 +1,75 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +services: + prometheus: + image: prom/prometheus:v2.52.0 + container_name: opea_prometheus + user: root + volumes: + - ./prometheus.yaml:/etc/prometheus/prometheus.yaml + - ./prometheus_data:/prometheus + command: + - '--config.file=/etc/prometheus/prometheus.yaml' + ports: + - '9090:9090' + ipc: host + restart: unless-stopped + + grafana: + image: grafana/grafana:11.0.0 + container_name: grafana + volumes: + - ./grafana_data:/var/lib/grafana + - ./grafana/dashboards:/var/lib/grafana/dashboards + - ./grafana/provisioning:/etc/grafana/provisioning + user: root + environment: + GF_SECURITY_ADMIN_PASSWORD: admin + GF_RENDERING_CALLBACK_URL: http://grafana:3000/ + GF_LOG_FILTERS: rendering:debug + no_proxy: ${no_proxy} + host_ip: ${host_ip} + depends_on: + - prometheus + ports: + - '3000:3000' + ipc: host + restart: unless-stopped + + node-exporter: + image: prom/node-exporter + container_name: node-exporter + volumes: + - /proc:/host/proc:ro + - /sys:/host/sys:ro + - /:/rootfs:ro + command: + - '--path.procfs=/host/proc' + - '--path.rootfs=/rootfs' + - '--path.sysfs=/host/sys' + - '--path.udev.data=/rootfs/run/udev/data' + - --collector.filesystem.ignored-mount-points + - "^/(sys|proc|dev|host|etc|rootfs/var/lib/docker/containers|rootfs/var/lib/docker/overlay2|rootfs/run/docker/netns|rootfs/var/lib/docker/aufs)($$|/)" + environment: + no_proxy: ${no_proxy} + ports: + - 9100:9100 + restart: always + deploy: + mode: global + + gaudi-metrics-exporter: + image: vault.habana.ai/gaudi-metric-exporter/metric-exporter:latest + privileged: true + container_name: gaudi-metrics-exporter + volumes: + - /proc:/host/proc:ro + - /sys:/host/sys:ro + - /:/rootfs:ro + - /dev:/dev + deploy: + mode: global + ports: + - 41611:41611 + restart: unless-stopped diff --git a/CodeTrans/docker_compose/intel/hpu/gaudi/compose.yaml b/CodeTrans/docker_compose/intel/hpu/gaudi/compose.yaml index 60728feabf..96ea18b3b0 100644 --- a/CodeTrans/docker_compose/intel/hpu/gaudi/compose.yaml +++ b/CodeTrans/docker_compose/intel/hpu/gaudi/compose.yaml @@ -3,7 +3,7 @@ services: vllm-service: - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} + image: opea/vllm-gaudi:1.4 container_name: codetrans-gaudi-vllm-service ports: - "8008:80" diff --git a/CodeTrans/docker_compose/intel/hpu/gaudi/grafana/dashboards/download_opea_dashboard.sh b/CodeTrans/docker_compose/intel/hpu/gaudi/grafana/dashboards/download_opea_dashboard.sh new file mode 100644 index 0000000000..b601762739 --- /dev/null +++ b/CodeTrans/docker_compose/intel/hpu/gaudi/grafana/dashboards/download_opea_dashboard.sh @@ -0,0 +1,14 @@ +#!/bin/bash +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)" +cd "$SCRIPT_DIR" +if ls *.json 1> /dev/null 2>&1; then + rm *.json +fi + +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/vllm_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/tgi_grafana.json +wget 
https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/gaudi_grafana_v2.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/codetrans_megaservice_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/node_grafana.json diff --git a/CodeTrans/docker_compose/intel/hpu/gaudi/grafana/provisioning/dashboards/local.yaml b/CodeTrans/docker_compose/intel/hpu/gaudi/grafana/provisioning/dashboards/local.yaml new file mode 100644 index 0000000000..13922a769b --- /dev/null +++ b/CodeTrans/docker_compose/intel/hpu/gaudi/grafana/provisioning/dashboards/local.yaml @@ -0,0 +1,14 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +apiVersion: 1 + +providers: +- name: 'default' + orgId: 1 + folder: '' + type: file + disableDeletion: false + updateIntervalSeconds: 10 #how often Grafana will scan for changed dashboards + options: + path: /var/lib/grafana/dashboards diff --git a/CodeTrans/docker_compose/intel/hpu/gaudi/grafana/provisioning/datasources/datasource.yml b/CodeTrans/docker_compose/intel/hpu/gaudi/grafana/provisioning/datasources/datasource.yml new file mode 100644 index 0000000000..a206521d67 --- /dev/null +++ b/CodeTrans/docker_compose/intel/hpu/gaudi/grafana/provisioning/datasources/datasource.yml @@ -0,0 +1,54 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +# config file version +apiVersion: 1 + +# list of datasources that should be deleted from the database +deleteDatasources: + - name: Prometheus + orgId: 1 + +# list of datasources to insert/update depending +# what's available in the database +datasources: + # name of the datasource. Required +- name: Prometheus + # datasource type. Required + type: prometheus + # access mode. direct or proxy. Required + access: proxy + # org id. will default to orgId 1 if not specified + orgId: 1 + # url + url: http://$host_ip:9090 + # database password, if used + password: + # database user, if used + user: + # database name, if used + database: + # enable/disable basic auth + basicAuth: false + # basic auth username, if used + basicAuthUser: + # basic auth password, if used + basicAuthPassword: + # enable/disable with credentials headers + withCredentials: + # mark as default datasource. Max one per org + isDefault: true + # fields that will be converted to json and stored in json_data + jsonData: + httpMethod: GET + graphiteVersion: "1.1" + tlsAuth: false + tlsAuthWithCACert: false + # json object of data that will be encrypted. + secureJsonData: + tlsCACert: "..." + tlsClientCert: "..." + tlsClientKey: "..." + version: 1 + # allow users to edit datasources from the UI. 
+ editable: true diff --git a/CodeTrans/docker_compose/intel/hpu/gaudi/prometheus.yaml b/CodeTrans/docker_compose/intel/hpu/gaudi/prometheus.yaml new file mode 100644 index 0000000000..a9c3b5fc14 --- /dev/null +++ b/CodeTrans/docker_compose/intel/hpu/gaudi/prometheus.yaml @@ -0,0 +1,30 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +# [IP_ADDR]:{PORT_OUTSIDE_CONTAINER} -> {PORT_INSIDE_CONTAINER} / {PROTOCOL} +global: + scrape_interval: 5s + external_labels: + monitor: "my-monitor" +scrape_configs: + - job_name: "prometheus" + static_configs: + - targets: ["opea_prometheus:9090"] + - job_name: "vllm" + metrics_path: /metrics + static_configs: + - targets: ["codetrans-gaudi-vllm-service:80"] + - job_name: "codetrans-backend-server" + metrics_path: /metrics + static_configs: + - targets: ["codetrans-gaudi-backend-server:7777"] + - job_name: "prometheus-node-exporter" + scrape_interval: 30s + scrape_timeout: 25s + metrics_path: /metrics + static_configs: + - targets: ["node-exporter:9100"] + - job_name: "gaudi-metrics-exporter" + scrape_interval: 30s + metrics_path: /metrics + static_configs: + - targets: ["gaudi-metrics-exporter:41611"] diff --git a/CodeTrans/docker_compose/intel/set_env.sh b/CodeTrans/docker_compose/intel/set_env.sh index 04c4048c52..0c2d0883c5 100644 --- a/CodeTrans/docker_compose/intel/set_env.sh +++ b/CodeTrans/docker_compose/intel/set_env.sh @@ -24,3 +24,9 @@ export FRONTEND_SERVICE_PORT=5173 export BACKEND_SERVICE_NAME=codetrans export BACKEND_SERVICE_IP=${host_ip} export BACKEND_SERVICE_PORT=7777 + + +# Set network proxy settings +export no_proxy="${no_proxy},${HOST_IP},vllm-server,codetrans-xeon-backend-server,codetrans-xeon-ui-server,redis-vector-db,dataprep-redis-server,tei-embedding-serving,tei-embedding-server,retriever-redis,opea_prometheus,grafana,node-exporter,$JAEGER_IP" # Example: no_proxy="localhost, 127.0.0.1, 192.168.1.1" +export http_proxy=$http_proxy +export https_proxy=$https_proxy diff --git a/CodeTrans/docker_image_build/build.yaml b/CodeTrans/docker_image_build/build.yaml index b230d1d4ec..81cd9c9f50 100644 --- a/CodeTrans/docker_image_build/build.yaml +++ b/CodeTrans/docker_image_build/build.yaml @@ -13,36 +13,53 @@ services: context: ../ dockerfile: ./Dockerfile image: ${REGISTRY:-opea}/codetrans:${TAG:-latest} + codetrans-openeuler: + build: + args: + IMAGE_REPO: ${REGISTRY:-opea} + BASE_TAG: ${TAG:-latest} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + no_proxy: ${no_proxy} + context: ../ + dockerfile: ./Dockerfile.openEuler + image: ${REGISTRY:-opea}/codetrans:${TAG:-latest}-openeuler codetrans-ui: build: context: ../ui dockerfile: ./docker/Dockerfile extends: codetrans image: ${REGISTRY:-opea}/codetrans-ui:${TAG:-latest} + codetrans-ui-openeuler: + build: + context: ../ui + dockerfile: ./docker/Dockerfile.openEuler + extends: codetrans + image: ${REGISTRY:-opea}/codetrans-ui:${TAG:-latest}-openeuler llm-textgen: build: context: GenAIComps dockerfile: comps/llms/src/text-generation/Dockerfile extends: codetrans image: ${REGISTRY:-opea}/llm-textgen:${TAG:-latest} - vllm: - build: - context: vllm - dockerfile: docker/Dockerfile.cpu - extends: codetrans - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} - vllm-gaudi: + llm-textgen-openeuler: build: - context: vllm-fork - dockerfile: Dockerfile.hpu + context: GenAIComps + dockerfile: comps/llms/src/text-generation/Dockerfile.openEuler extends: codetrans - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} + image: 
${REGISTRY:-opea}/llm-textgen:${TAG:-latest}-openeuler nginx: build: context: GenAIComps dockerfile: comps/third_parties/nginx/src/Dockerfile extends: codetrans image: ${REGISTRY:-opea}/nginx:${TAG:-latest} + nginx-openeuler: + build: + context: GenAIComps + dockerfile: comps/third_parties/nginx/src/Dockerfile.openEuler + extends: codetrans + image: ${REGISTRY:-opea}/nginx:${TAG:-latest}-openeuler vllm-rocm: build: context: GenAIComps diff --git a/CodeTrans/tests/test_compose_on_epyc.sh b/CodeTrans/tests/test_compose_on_epyc.sh index 50a9fb68b0..28f31f675b 100644 --- a/CodeTrans/tests/test_compose_on_epyc.sh +++ b/CodeTrans/tests/test_compose_on_epyc.sh @@ -28,19 +28,8 @@ function build_docker_images() { docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &>/dev/null - VLLM_REQ_FILE="requirements/cpu.txt" - if ! grep -q "^transformers" "$VLLM_REQ_FILE"; then - echo "Adding transformers<4.54.0 to $VLLM_REQ_FILE" - echo "transformers<4.54.0" >>"$VLLM_REQ_FILE" - fi - cd ../ - echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="codetrans codetrans-ui llm-textgen vllm nginx" + service_list="codetrans codetrans-ui llm-textgen nginx" docker compose -f build.yaml build ${service_list} --no-cache >${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -49,7 +38,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/amd/cpu/epyc export HF_TOKEN=${HF_TOKEN} - + export no_proxy="localhost,127.0.0.1,$ip_address" export NGINX_PORT=80 source set_env.sh @@ -129,37 +118,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - CONDA_ROOT=$(conda info --base) - source "${CONDA_ROOT}/etc/profile.d/conda.sh" - conda activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - # npm install && npm ci && npx playwright install --with-deps - npm install && npm ci && npx playwright install - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/amd/cpu/epyc/ docker compose -f compose.yaml stop && docker compose rm -f @@ -187,10 +145,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/CodeTrans/tests/test_compose_on_gaudi.sh b/CodeTrans/tests/test_compose_on_gaudi.sh index 07af411cc1..edfca863d7 100644 --- a/CodeTrans/tests/test_compose_on_gaudi.sh +++ b/CodeTrans/tests/test_compose_on_gaudi.sh @@ -25,12 +25,8 @@ function build_docker_images() { docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork - VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0 - git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../ - echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="codetrans codetrans-ui llm-textgen vllm-gaudi nginx" + service_list="codetrans codetrans-ui llm-textgen nginx" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -40,13 +36,17 @@ function start_services() { cd $WORKPATH/docker_compose/intel export HF_TOKEN=${HF_TOKEN} export NGINX_PORT=80 + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh cd hpu/gaudi sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env + # download grafana dashboard + bash grafana/dashboards/download_opea_dashboard.sh + # Start Docker Containers - docker compose up -d > ${LOG_PATH}/start_services_with_compose.log + docker compose -f compose.yaml -f compose.monitoring.yaml up -d > ${LOG_PATH}/start_services_with_compose.log n=0 until [[ "$n" -ge 100 ]]; do @@ -118,38 +118,9 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi - -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/hpu/gaudi - docker compose -f compose.yaml stop && docker compose rm -f + docker compose -f compose.yaml -f compose.monitoring.yaml stop && docker compose rm -f } function main() { @@ -174,10 +145,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/CodeTrans/tests/test_compose_on_rocm.sh b/CodeTrans/tests/test_compose_on_rocm.sh index ecc6a4fdfc..5524c1757b 100644 --- a/CodeTrans/tests/test_compose_on_rocm.sh +++ b/CodeTrans/tests/test_compose_on_rocm.sh @@ -120,34 +120,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniconda3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/amd/gpu/rocm/ docker compose stop && docker compose rm -f @@ -175,10 +147,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/CodeTrans/tests/test_compose_on_xeon.sh b/CodeTrans/tests/test_compose_on_xeon.sh index 8418ba05d1..bbd75208e8 100644 --- a/CodeTrans/tests/test_compose_on_xeon.sh +++ b/CodeTrans/tests/test_compose_on_xeon.sh @@ -25,14 +25,8 @@ function build_docker_images() { docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &> /dev/null - cd ../ - echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
- service_list="codetrans codetrans-ui llm-textgen vllm nginx" + service_list="codetrans codetrans-ui llm-textgen nginx" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -41,15 +35,18 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel export HF_TOKEN=${HF_TOKEN} - + export no_proxy="localhost,127.0.0.1,$ip_address" export NGINX_PORT=80 source set_env.sh cd cpu/xeon/ + # download grafana dashboard + bash grafana/dashboards/download_opea_dashboard.sh + sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env # Start Docker Containers - docker compose -f compose.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + docker compose -f compose.yaml -f compose.monitoring.yaml up -d > ${LOG_PATH}/start_services_with_compose.log n=0 until [[ "$n" -ge 100 ]]; do @@ -122,37 +119,9 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/cpu/xeon/ - docker compose -f compose.yaml stop && docker compose rm -f + docker compose -f compose.yaml -f compose.monitoring.yaml down } function main() { @@ -177,10 +146,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/CodeTrans/tests/test_compose_openeuler_on_xeon.sh b/CodeTrans/tests/test_compose_openeuler_on_xeon.sh new file mode 100644 index 0000000000..3b8d2010e2 --- /dev/null +++ b/CodeTrans/tests/test_compose_openeuler_on_xeon.sh @@ -0,0 +1,154 @@ +#!/bin/bash +# Copyright (C) 2025 Huawei Technologies Co., Ltd. +# SPDX-License-Identifier: Apache-2.0 + +set -xe +IMAGE_REPO=${IMAGE_REPO:-"opea"} +IMAGE_TAG=${IMAGE_TAG:-"latest"} +echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" +echo "TAG=IMAGE_TAG=${IMAGE_TAG}" +export REGISTRY=${IMAGE_REPO} +export TAG=${IMAGE_TAG} +export MODEL_CACHE=${model_cache:-"./data"} + +WORKPATH=$(dirname "$PWD") +LOG_PATH="$WORKPATH/tests" +ip_address=$(hostname -I | awk '{print $1}') + +function build_docker_images() { + opea_branch=${opea_branch:-"main"} + + cd $WORKPATH/docker_image_build + git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git + pushd GenAIComps + echo "GenAIComps test commit is $(git rev-parse HEAD)" + docker build --no-cache -t ${REGISTRY}/comps-base:${TAG}-openeuler --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile.openEuler . + popd && sleep 1s + + echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
+ service_list="codetrans-openeuler codetrans-ui-openeuler llm-textgen-openeuler nginx-openeuler" + docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log + + docker images && sleep 1s +} + +function start_services() { + cd $WORKPATH/docker_compose/intel + export HF_TOKEN=${HF_TOKEN} + export no_proxy="localhost,127.0.0.1,$ip_address" + export NGINX_PORT=80 + source set_env.sh + cd cpu/xeon/ + + sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env + + # Start Docker Containers + docker compose -f compose_openeuler.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + + n=0 + until [[ "$n" -ge 100 ]]; do + docker logs codetrans-xeon-vllm-service > ${LOG_PATH}/vllm_service_start.log 2>&1 + if grep -q complete ${LOG_PATH}/vllm_service_start.log; then + break + fi + sleep 5s + n=$((n+1)) + done + + sleep 1m +} + +function validate_services() { + local URL="$1" + local EXPECTED_RESULT="$2" + local SERVICE_NAME="$3" + local DOCKER_NAME="$4" + local INPUT_DATA="$5" + + local HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") + if [ "$HTTP_STATUS" -eq 200 ]; then + echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." + + local CONTENT=$(curl -s -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL" | tee ${LOG_PATH}/${SERVICE_NAME}.log) + + if echo "$CONTENT" | grep -q "$EXPECTED_RESULT"; then + echo "[ $SERVICE_NAME ] Content is as expected." + else + echo "[ $SERVICE_NAME ] Content does not match the expected result: $CONTENT" + docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log + exit 1 + fi + else + echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS" + docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log + exit 1 + fi + sleep 5s +} + +function validate_microservices() { + # llm microservice + validate_services \ + "${ip_address}:9000/v1/chat/completions" \ + "data: " \ + "llm" \ + "codetrans-xeon-llm-server" \ + '{"query":" ### System: Please translate the following Golang codes into Python codes. 
### Original codes: '\'''\'''\''Golang \npackage main\n\nimport \"fmt\"\nfunc main() {\n fmt.Println(\"Hello, World!\");\n '\'''\'''\'' ### Translated codes:"}' + +} + +function validate_megaservice() { + # Curl the Mega Service + validate_services \ + "${ip_address}:${BACKEND_SERVICE_PORT}/v1/codetrans" \ + "print" \ + "mega-codetrans" \ + "codetrans-xeon-backend-server" \ + '{"language_from": "Golang","language_to": "Python","source_code": "package main\n\nimport \"fmt\"\nfunc main() {\n fmt.Println(\"Hello, World!\");\n}"}' + + # test the megaservice via nginx + validate_services \ + "${ip_address}:${NGINX_PORT}/v1/codetrans" \ + "print" \ + "mega-codetrans-nginx" \ + "codetrans-xeon-nginx-server" \ + '{"language_from": "Golang","language_to": "Python","source_code": "package main\n\nimport \"fmt\"\nfunc main() {\n fmt.Println(\"Hello, World!\");\n}"}' + +} + +function stop_service() { + cd $WORKPATH/docker_compose/intel/cpu/xeon/ + docker compose -f compose_openeuler.yaml stop && docker compose rm -f +} + +function main() { + + echo "::group::stop_service" + stop_service + echo "::endgroup::" + + echo "::group::build_docker_images" + if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi + echo "::endgroup::" + + echo "::group::start_services" + start_services + echo "::endgroup::" + + echo "::group::validate_microservices" + validate_microservices + echo "::endgroup::" + + echo "::group::validate_megaservice" + validate_megaservice + echo "::endgroup::" + + echo "::group::stop_service" + stop_service + echo "::endgroup::" + + docker system prune -f + +} + +main diff --git a/CodeTrans/tests/test_compose_tgi_on_epyc.sh b/CodeTrans/tests/test_compose_tgi_on_epyc.sh index 2eb464c485..53dcb0caa0 100644 --- a/CodeTrans/tests/test_compose_tgi_on_epyc.sh +++ b/CodeTrans/tests/test_compose_tgi_on_epyc.sh @@ -39,7 +39,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/amd/cpu/epyc/ export HF_TOKEN=${HF_TOKEN} - + export no_proxy="localhost,127.0.0.1,$ip_address" export NGINX_PORT=80 source set_env.sh @@ -127,37 +127,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - CONDA_ROOT=$(conda info --base) - source "${CONDA_ROOT}/etc/profile.d/conda.sh" - conda activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - # npm install && npm ci && npx playwright install --with-deps - npm install && npm ci && npx playwright install - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/amd/cpu/epyc/ docker compose -f compose_tgi.yaml stop && docker compose rm -f @@ -185,10 +154,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/CodeTrans/tests/test_compose_tgi_on_gaudi.sh b/CodeTrans/tests/test_compose_tgi_on_gaudi.sh index 129e677149..964f6b6f01 100644 --- a/CodeTrans/tests/test_compose_tgi_on_gaudi.sh +++ b/CodeTrans/tests/test_compose_tgi_on_gaudi.sh @@ -36,15 +36,18 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel export HF_TOKEN=${HF_TOKEN} - + export no_proxy="localhost,127.0.0.1,$ip_address" export NGINX_PORT=80 source set_env.sh cd hpu/gaudi/ sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env + # download grafana dashboard + bash grafana/dashboards/download_opea_dashboard.sh + # Start Docker Containers - docker compose -f compose_tgi.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + docker compose -f compose_tgi.yaml -f compose.monitoring.yaml up -d > ${LOG_PATH}/start_services_with_compose.log n=0 until [[ "$n" -ge 100 ]]; do @@ -125,37 +128,9 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/hpu/gaudi/ - docker compose -f compose_tgi.yaml stop && docker compose rm -f + docker compose -f compose_tgi.yaml -f compose.monitoring.yaml stop && docker compose rm -f } function main() { @@ -180,10 +155,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/CodeTrans/tests/test_compose_tgi_on_xeon.sh b/CodeTrans/tests/test_compose_tgi_on_xeon.sh index aacd5dfda5..2957093520 100644 --- a/CodeTrans/tests/test_compose_tgi_on_xeon.sh +++ b/CodeTrans/tests/test_compose_tgi_on_xeon.sh @@ -36,15 +36,18 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel export HF_TOKEN=${HF_TOKEN} - + export no_proxy="localhost,127.0.0.1,$ip_address" export NGINX_PORT=80 source set_env.sh cd cpu/xeon/ + # download grafana dashboard + bash grafana/dashboards/download_opea_dashboard.sh + sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env # Start Docker Containers - docker compose -f compose_tgi.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + docker compose -f compose_tgi.yaml -f compose.monitoring.yaml up -d > ${LOG_PATH}/start_services_with_compose.log n=0 until [[ "$n" -ge 100 ]]; do @@ -125,37 +128,9 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/cpu/xeon/ - docker compose -f compose_tgi.yaml stop && docker compose rm -f + docker compose -f compose_tgi.yaml -f compose.monitoring.yaml stop && docker compose rm -f } function main() { @@ -180,10 +155,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/CodeTrans/tests/test_compose_tgi_openeuler_on_xeon.sh b/CodeTrans/tests/test_compose_tgi_openeuler_on_xeon.sh new file mode 100644 index 0000000000..42c8cdee62 --- /dev/null +++ b/CodeTrans/tests/test_compose_tgi_openeuler_on_xeon.sh @@ -0,0 +1,163 @@ +#!/bin/bash +# Copyright (C) 2025 Huawei Technologies Co., Ltd. 
+# SPDX-License-Identifier: Apache-2.0 + +set -xe +IMAGE_REPO=${IMAGE_REPO:-"opea"} +IMAGE_TAG=${IMAGE_TAG:-"latest"} +echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" +echo "TAG=IMAGE_TAG=${IMAGE_TAG}" +export REGISTRY=${IMAGE_REPO} +export TAG=${IMAGE_TAG} +export MODEL_CACHE=${model_cache:-"./data"} + +WORKPATH=$(dirname "$PWD") +LOG_PATH="$WORKPATH/tests" +ip_address=$(hostname -I | awk '{print $1}') + +function build_docker_images() { + opea_branch=${opea_branch:-"main"} + + cd $WORKPATH/docker_image_build + git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git + pushd GenAIComps + echo "GenAIComps test commit is $(git rev-parse HEAD)" + docker build --no-cache -t ${REGISTRY}/comps-base:${TAG}-openeuler --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile.openEuler . + popd && sleep 1s + + echo "Build all the images with --no-cache, check docker_image_build.log for details..." + service_list="codetrans-openeuler codetrans-ui-openeuler llm-textgen-openeuler nginx-openeuler" + docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log + + docker pull openeuler/text-generation-inference-cpu:2.4.0-oe2403lts + docker images && sleep 1s +} + +function start_services() { + cd $WORKPATH/docker_compose/intel + export HF_TOKEN=${HF_TOKEN} + export no_proxy="localhost,127.0.0.1,$ip_address" + export NGINX_PORT=80 + source set_env.sh + cd cpu/xeon/ + + sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env + + # Start Docker Containers + docker compose -f compose_tgi_openeuler.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + + n=0 + until [[ "$n" -ge 100 ]]; do + docker logs codetrans-xeon-tgi-service > ${LOG_PATH}/tgi_service_start.log + if grep -q Connected ${LOG_PATH}/tgi_service_start.log; then + break + fi + sleep 5s + n=$((n+1)) + done + + sleep 1m +} + +function validate_services() { + local URL="$1" + local EXPECTED_RESULT="$2" + local SERVICE_NAME="$3" + local DOCKER_NAME="$4" + local INPUT_DATA="$5" + + local HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") + if [ "$HTTP_STATUS" -eq 200 ]; then + echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." + + local CONTENT=$(curl -s -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL" | tee ${LOG_PATH}/${SERVICE_NAME}.log) + + if echo "$CONTENT" | grep -q "$EXPECTED_RESULT"; then + echo "[ $SERVICE_NAME ] Content is as expected." + else + echo "[ $SERVICE_NAME ] Content does not match the expected result: $CONTENT" + docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log + exit 1 + fi + else + echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS" + docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log + exit 1 + fi + sleep 5s +} + +function validate_microservices() { + # tgi for embedding service + validate_services \ + "${ip_address}:8008/generate" \ + "generated_text" \ + "tgi" \ + "codetrans-xeon-tgi-service" \ + '{"inputs":"What is Deep Learning?","parameters":{"max_new_tokens":17, "do_sample": true}}' + + # llm microservice + validate_services \ + "${ip_address}:9000/v1/chat/completions" \ + "data: " \ + "llm" \ + "codetrans-xeon-llm-server" \ + '{"query":" ### System: Please translate the following Golang codes into Python codes. 
### Original codes: '\'''\'''\''Golang \npackage main\n\nimport \"fmt\"\nfunc main() {\n fmt.Println(\"Hello, World!\");\n '\'''\'''\'' ### Translated codes:"}' + +} + +function validate_megaservice() { + # Curl the Mega Service + validate_services \ + "${ip_address}:${BACKEND_SERVICE_PORT}/v1/codetrans" \ + "print" \ + "mega-codetrans" \ + "codetrans-xeon-backend-server" \ + '{"language_from": "Golang","language_to": "Python","source_code": "package main\n\nimport \"fmt\"\nfunc main() {\n fmt.Println(\"Hello, World!\");\n}"}' + + # test the megaservice via nginx + validate_services \ + "${ip_address}:${NGINX_PORT}/v1/codetrans" \ + "print" \ + "mega-codetrans-nginx" \ + "codetrans-xeon-nginx-server" \ + '{"language_from": "Golang","language_to": "Python","source_code": "package main\n\nimport \"fmt\"\nfunc main() {\n fmt.Println(\"Hello, World!\");\n}"}' + +} + +function stop_service() { + cd $WORKPATH/docker_compose/intel/cpu/xeon/ + docker compose -f compose_tgi_openeuler.yaml stop && docker compose rm -f +} + +function main() { + + echo "::group::stop_service" + stop_service + echo "::endgroup::" + + echo "::group::build_docker_images" + if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi + echo "::endgroup::" + + echo "::group::start_services" + start_services + echo "::endgroup::" + + echo "::group::validate_microservices" + validate_microservices + echo "::endgroup::" + + echo "::group::validate_megaservice" + validate_megaservice + echo "::endgroup::" + + echo "::group::stop_service" + stop_service + echo "::endgroup::" + + docker system prune -f + +} + +main diff --git a/CodeTrans/tests/test_compose_vllm_on_rocm.sh b/CodeTrans/tests/test_compose_vllm_on_rocm.sh index 2ef8709607..6023b59467 100644 --- a/CodeTrans/tests/test_compose_vllm_on_rocm.sh +++ b/CodeTrans/tests/test_compose_vllm_on_rocm.sh @@ -119,34 +119,6 @@ function validate_megaservice() { } -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniconda3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/amd/gpu/rocm/ docker compose -f compose_vllm.yaml stop && docker compose -f compose_vllm.yaml rm -f @@ -174,10 +146,6 @@ function main() { validate_megaservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/CodeTrans/tests/test_ui_on_xeon.sh b/CodeTrans/tests/test_ui_on_xeon.sh new file mode 100644 index 0000000000..4ee17bad47 --- /dev/null +++ b/CodeTrans/tests/test_ui_on_xeon.sh @@ -0,0 +1,120 @@ +#!/bin/bash +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +set -xe +IMAGE_REPO=${IMAGE_REPO:-"opea"} +IMAGE_TAG=${IMAGE_TAG:-"latest"} +echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" +echo "TAG=IMAGE_TAG=${IMAGE_TAG}" +export REGISTRY=${IMAGE_REPO} +export TAG=${IMAGE_TAG} +export MODEL_CACHE=${model_cache:-"./data"} + +WORKPATH=$(dirname "$PWD") +LOG_PATH="$WORKPATH/tests" +ip_address=$(hostname -I | awk '{print $1}') + +function build_docker_images() { + opea_branch=${opea_branch:-"main"} + + cd $WORKPATH/docker_image_build + git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git + pushd GenAIComps + echo "GenAIComps test commit is $(git rev-parse HEAD)" + docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . + popd && sleep 1s + + echo "Build all the images with --no-cache, check docker_image_build.log for details..." + service_list="codetrans codetrans-ui llm-textgen nginx" + docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log + + docker images && sleep 1s +} + +function start_services() { + cd $WORKPATH/docker_compose/intel + export HF_TOKEN=${HF_TOKEN} + export no_proxy="localhost,127.0.0.1,$ip_address" + export NGINX_PORT=80 + source set_env.sh + cd cpu/xeon/ + + sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env + + # Start Docker Containers + docker compose -f compose.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + + n=0 + until [[ "$n" -ge 100 ]]; do + docker logs codetrans-xeon-vllm-service > ${LOG_PATH}/vllm_service_start.log 2>&1 + if grep -q complete ${LOG_PATH}/vllm_service_start.log; then + break + fi + sleep 5s + n=$((n+1)) + done + + sleep 1m +} + +function validate_frontend() { + cd $WORKPATH/ui/svelte + local conda_env_name="OPEA_e2e" + export PATH=${HOME}/miniforge3/bin/:$PATH + if conda info --envs | grep -q "$conda_env_name"; then + echo "$conda_env_name exist!" + else + conda create -n ${conda_env_name} python=3.12 -y + fi + source activate ${conda_env_name} + + sed -i "s/localhost/$ip_address/g" playwright.config.ts + + conda install -c conda-forge nodejs=22.6.0 -y + npm install && npm ci && npx playwright install --with-deps + node -v && npm -v && pip list + + exit_status=0 + npx playwright test || exit_status=$? 
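+  # Capture the Playwright exit code ('|| exit_status=$?') so 'set -xe' does not abort before the result is reported below.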
+ + if [ $exit_status -ne 0 ]; then + echo "[TEST INFO]: ---------frontend test failed---------" + exit $exit_status + else + echo "[TEST INFO]: ---------frontend test passed---------" + fi +} + +function stop_docker() { + cd $WORKPATH/docker_compose/intel/cpu/xeon/ + docker compose -f compose.yaml stop && docker compose rm -f +} + +function main() { + + echo "::group::stop_docker" + stop_docker + echo "::endgroup::" + + echo "::group::build_docker_images" + if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi + echo "::endgroup::" + + echo "::group::start_services" + start_services + echo "::endgroup::" + + echo "::group::validate_frontend" + validate_frontend + echo "::endgroup::" + + echo "::group::stop_docker" + stop_docker + echo "::endgroup::" + + docker system prune -f + +} + +main diff --git a/CodeTrans/ui/docker/Dockerfile b/CodeTrans/ui/docker/Dockerfile index 1d5115f4b5..3a6ca7f7c9 100644 --- a/CodeTrans/ui/docker/Dockerfile +++ b/CodeTrans/ui/docker/Dockerfile @@ -1,8 +1,8 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 -# Use node 20.11.1 as the base image -FROM node:20.11.1 +# Use node 20.19.0 as the base image (required for chokidar@5.0.0 compatibility) +FROM node:20.19.0 # Update package manager and install Git RUN apt-get update -y && apt-get install -y git diff --git a/CodeTrans/ui/docker/Dockerfile.openEuler b/CodeTrans/ui/docker/Dockerfile.openEuler new file mode 100644 index 0000000000..08d34fea47 --- /dev/null +++ b/CodeTrans/ui/docker/Dockerfile.openEuler @@ -0,0 +1,30 @@ +# Copyright (C) 2025 Huawei Technologies Co., Ltd. +# SPDX-License-Identifier: Apache-2.0 + +# Use node 20.19.0 as the base image +FROM openeuler/node:20.19.0-oe2403lts + +# Update package manager and install Git +RUN yum update -y && \ + yum install -y \ + git && \ + yum clean all && \ + rm -rf /var/cache/yum + +# Copy the front-end code repository +COPY svelte /home/user/svelte + +# Set the working directory +WORKDIR /home/user/svelte + +# Install front-end dependencies +RUN npm install + +# Build the front-end application +RUN npm run build + +# Expose the port of the front-end application +EXPOSE 5173 + +# Run the front-end application in preview mode +CMD ["npm", "run", "preview", "--", "--port", "5173", "--host", "0.0.0.0"] diff --git a/CodeTrans/ui/svelte/package.json b/CodeTrans/ui/svelte/package.json index ed45ce245f..855f74265c 100644 --- a/CodeTrans/ui/svelte/package.json +++ b/CodeTrans/ui/svelte/package.json @@ -16,7 +16,7 @@ "devDependencies": { "@playwright/test": "^1.44.1", "@sveltejs/adapter-auto": "^3.0.0", - "@sveltejs/kit": "2.0.0", + "@sveltejs/kit": "2.20.6", "@sveltejs/package": "^2.0.0", "@sveltejs/vite-plugin-svelte": "^3.0.0", "@types/prismjs": "^1.26.3", diff --git a/CodeTrans/ui/svelte/src/routes/+page.svelte b/CodeTrans/ui/svelte/src/routes/+page.svelte index fd6be39310..af19e26d31 100644 --- a/CodeTrans/ui/svelte/src/routes/+page.svelte +++ b/CodeTrans/ui/svelte/src/routes/+page.svelte @@ -83,12 +83,37 @@ let deleteFlag: boolean = false; let inputClick: boolean = true; - function handelCopy() { - navigator.clipboard.writeText(output); - copyText = "copied!"; + async function handelCopy() { + try { + if (navigator.clipboard && navigator.clipboard.writeText) { + await navigator.clipboard.writeText(output); + copyText = "copied!"; + } else { + const textArea = document.createElement('textarea'); + textArea.value = output; + textArea.style.position = 'fixed'; + textArea.style.left = '-999999px'; + textArea.style.top = '-999999px'; 
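+ // The textarea is kept off-screen so the execCommand('copy') fallback never flashes visible UI.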
+ document.body.appendChild(textArea); + textArea.focus(); + textArea.select(); + + if (document.execCommand('copy')) { + copyText = "copied!"; + } else { + copyText = "copy failed"; + } + + document.body.removeChild(textArea); + } + } catch (err) { + console.error('Copy failed:', err); + copyText = "copy failed"; + } + setTimeout(() => { copyText = "copy"; - }, 1000); + }, 2000); } function handelInputClick() { diff --git a/DBQnA/docker_compose/amd/gpu/rocm/README.md b/DBQnA/docker_compose/amd/gpu/rocm/README.md index f15b5db2b4..a0eda0c9bf 100644 --- a/DBQnA/docker_compose/amd/gpu/rocm/README.md +++ b/DBQnA/docker_compose/amd/gpu/rocm/README.md @@ -9,13 +9,17 @@ This document outlines the deployment process for DBQnA application which helps This section describes how to quickly deploy and test the DBQnA service manually on AMD GPU (ROCm). The basic steps are: -1. [Access the Code](#access-the-code) -2. [Generate a HuggingFace Access Token](#generate-a-huggingface-access-token) -3. [Configure the Deployment Environment](#configure-the-deployment-environment) -4. [Deploy the Service Using Docker Compose](#deploy-the-service-using-docker-compose) -5. [Check the Deployment Status](#check-the-deployment-status) -6. [Test the Pipeline](#test-the-pipeline) -7. [Cleanup the Deployment](#cleanup-the-deployment) +- [Example DBQnA Deployment on AMD GPU (ROCm)](#example-dbqna-deployment-on-amd-gpu-rocm) + - [DBQnA Quick Start Deployment](#dbqna-quick-start-deployment) + - [Access the Code](#access-the-code) + - [Generate a HuggingFace Access Token](#generate-a-huggingface-access-token) + - [Configure the Deployment Environment](#configure-the-deployment-environment) + - [Deploy the Service Using Docker Compose](#deploy-the-service-using-docker-compose) + - [Check the Deployment Status](#check-the-deployment-status) + - [Test the Pipeline](#test-the-pipeline) + - [Cleanup the Deployment](#cleanup-the-deployment) + - [DBQnA Docker Compose Files](#dbqna-docker-compose-files) + - [DBQnA Service Configuration for AMD GPUs](#dbqna-service-configuration-for-amd-gpus) ### Access the Code @@ -73,10 +77,11 @@ For the default deployment, the following 4 containers should be running. 
Once the DBQnA service are running, test the pipeline using the following command: ```bash -curl http://${host_ip}:${DBQNA_TEXT_TO_SQL_PORT}/v1/texttosql \ +url="postgresql://${POSTGRES_USER}:${POSTGRES_PASSWORD}@${host_ip}:5442/${POSTGRES_DB}" +curl --connect-timeout 5 --max-time 120000 http://${host_ip}:9090/v1/text2query\ -X POST \ - -d '{"input_text": "Find the total number of Albums.","conn_str": {"user": "'${POSTGRES_USER}'","password": "'${POSTGRES_PASSWORD}'","host": "'${host_ip}'", "port": "5442", "database": "'${POSTGRES_DB}'"}}' \ - -H 'Content-Type: application/json' + -d '{"query": "Find the total number of Albums.","conn_type": "sql", "conn_url": "'${url}'", "conn_user": "'${POSTGRES_USER}'","conn_password": "'${POSTGRES_PASSWORD}'","conn_dialect": "postgresql" }' \ + -H 'Content-Type: application/json' ``` ### Cleanup the Deployment @@ -97,7 +102,7 @@ The compose.yaml is default compose file using tgi as serving framework | ----------------- | -------------------------------------------------------- | | dbqna-tgi-service | ghcr.io/huggingface/text-generation-inference:2.4.1-rocm | | postgres | postgres:latest | -| text2sql | opea/text2sql:latest | +| text2sql | opea/text2query-sql:latest | | text2sql-react-ui | opea/text2sql-react-ui:latest | ## DBQnA Service Configuration for AMD GPUs @@ -108,5 +113,5 @@ The table provides a comprehensive overview of the DBQnA service utilized across | ----------------- | -------------------------------------------------------- | -------- | --------------------------------------------------------------------------------------------------- | | dbqna-tgi-service | ghcr.io/huggingface/text-generation-inference:2.4.1-rocm | No | Specific to the TGI deployment, focuses on text generation inference using AMD GPU (ROCm) hardware. | | postgres | postgres:latest | No | Provides the relational database backend for storing and querying data used by the DBQnA pipeline. | -| text2sql | opea/text2sql:latest | No | Handles text-to-SQL conversion tasks. | +| text2sql | opea/text2query-sql:latest | No | Handles text-to-SQL conversion tasks. | | text2sql-react-ui | opea/text2sql-react-ui:latest | No | Provides the user interface for the DBQnA service. | diff --git a/DBQnA/docker_compose/amd/gpu/rocm/compose.yaml b/DBQnA/docker_compose/amd/gpu/rocm/compose.yaml index f9585acf00..deaf099774 100644 --- a/DBQnA/docker_compose/amd/gpu/rocm/compose.yaml +++ b/DBQnA/docker_compose/amd/gpu/rocm/compose.yaml @@ -47,12 +47,16 @@ services: - ./chinook.sql:/docker-entrypoint-initdb.d/chinook.sql text2sql: - image: opea/text2sql:latest + image: opea/text2query-sql:latest container_name: text2sql ports: - - "${DBQNA_TEXT_TO_SQL_PORT:-9090}:8080" + - "${DBQNA_TEXT_TO_SQL_PORT:-9090}:9097" environment: TGI_LLM_ENDPOINT: ${DBQNA_TGI_LLM_ENDPOINT} + TEXT2QUERY_COMPONENT_NAME: OPEA_TEXT2QUERY_SQL + depends_on: + - dbqna-tgi-service + - postgres text2sql-react-ui: image: opea/text2sql-react-ui:latest diff --git a/DBQnA/docker_compose/intel/cpu/xeon/README.md b/DBQnA/docker_compose/intel/cpu/xeon/README.md index 1e816fed2a..08b57c4341 100644 --- a/DBQnA/docker_compose/intel/cpu/xeon/README.md +++ b/DBQnA/docker_compose/intel/cpu/xeon/README.md @@ -9,13 +9,17 @@ This document outlines the deployment process for DBQnA application which helps This section describes how to quickly deploy and test the DBQnA service manually on Intel® Xeon® platform. The basic steps are: -1. [Access the Code](#access-the-code) -2. 
[Generate a HuggingFace Access Token](#generate-a-huggingface-access-token) -3. [Configure the Deployment Environment](#configure-the-deployment-environment) -4. [Deploy the Service Using Docker Compose](#deploy-the-service-using-docker-compose) -5. [Check the Deployment Status](#check-the-deployment-status) -6. [Test the Pipeline](#test-the-pipeline) -7. [Cleanup the Deployment](#cleanup-the-deployment) +- [Example DBQnA Deployment on Intel® Xeon® Platform](#example-dbqna-deployment-on-intel-xeon-platform) + - [DBQnA Quick Start Deployment](#dbqna-quick-start-deployment) + - [Access the Code](#access-the-code) + - [Generate a HuggingFace Access Token](#generate-a-huggingface-access-token) + - [Configure the Deployment Environment](#configure-the-deployment-environment) + - [Deploy the Service Using Docker Compose](#deploy-the-service-using-docker-compose) + - [Check the Deployment Status](#check-the-deployment-status) + - [Test the Pipeline](#test-the-pipeline) + - [Cleanup the Deployment](#cleanup-the-deployment) + - [DBQnA Docker Compose Files](#dbqna-docker-compose-files) + - [DBQnA Service Configuration](#dbqna-service-configuration) ### Access the Code @@ -80,7 +84,7 @@ CONTAINER ID IMAGE 2728db31368b opea/text2sql-react-ui:latest "nginx -g 'daemon of…" 9 minutes ago Up 9 minutes 0.0.0.0:5174->80/tcp, :::5174->80/tcp dbqna-xeon-react-ui-server 0ab75b92c300 postgres:latest "docker-entrypoint.s…" 9 minutes ago Up 9 minutes 0.0.0.0:5442->5432/tcp, :::5442->5432/tcp postgres-container 2662a69b515b ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu "text-generation-lau…" 9 minutes ago Up 9 minutes 0.0.0.0:8008->80/tcp, :::8008->80/tcp tgi-service -bb44512be80e opea/text2sql:latest "python opea_text2sq…" 9 minutes ago Up 9 minutes 0.0.0.0:9090->8080/tcp, :::9090->8080/tcp text2sql-service +bb44512be80e opea/text2query-sql:latest "python opea_text2sq…" 9 minutes ago Up 9 minutes 0.0.0.0:9090->8080/tcp, :::9090->8080/tcp text2sql-service ``` ### Test the Pipeline @@ -88,10 +92,11 @@ bb44512be80e opea/text2sql:latest Once the DBQnA service are running, test the pipeline using the following command: ```bash -curl http://${host_ip}:9090/v1/text2sql\ +url="postgresql://${POSTGRES_USER}:${POSTGRES_PASSWORD}@${host_ip}:5442/${POSTGRES_DB}" +curl --connect-timeout 5 --max-time 120000 http://${host_ip}:9090/v1/text2query\ -X POST \ - -d '{"input_text": "Find the total number of Albums.","conn_str": {"user": "'${POSTGRES_USER}'","password": "'${POSTGRES_PASSWORD}'","host": "'${host_ip}'", "port": "5442", "database": "'${POSTGRES_DB}'"}}' \ - -H 'Content-Type: application/json' + -d '{"query": "Find the total number of Albums.","conn_type": "sql", "conn_url": "'${url}'", "conn_user": "'${POSTGRES_USER}'","conn_password": "'${POSTGRES_PASSWORD}'","conn_dialect": "postgresql" }' \ + -H 'Content-Type: application/json' ``` ### Cleanup the Deployment @@ -121,7 +126,7 @@ The compose.yaml is default compose file using tgi as serving framework | -------------------------- | ------------------------------------------------------------- | | tgi-service | ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu | | postgres | postgres:latest | -| text2sql | opea/text2sql:latest | +| text2sql | opea/text2query-sql:latest | | dbqna-xeon-react-ui-server | opea/text2sql-react-ui:latest | ## DBQnA Service Configuration @@ -132,5 +137,5 @@ The table provides a comprehensive overview of the DBQnA service utilized across | -------------------------- | 
------------------------------------------------------------- | -------- | --------------------------------------------------------------------------------------------------- | | tgi-service | ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu | No | Specific to the TGI deployment, focuses on text generation inference using AMD GPU (ROCm) hardware. | | postgres | postgres:latest | No | Provides the relational database backend for storing and querying data used by the DBQnA pipeline. | -| text2sql | opea/text2sql:latest | No | Handles text-to-SQL conversion tasks. | +| text2sql | opea/text2query-sql:latest | No | Handles text-to-SQL conversion tasks. | | dbqna-xeon-react-ui-server | opea/text2sql-react-ui:latest | No | Provides the user interface for the DBQnA service. | diff --git a/DBQnA/docker_compose/intel/cpu/xeon/compose.yaml b/DBQnA/docker_compose/intel/cpu/xeon/compose.yaml index cb9339b834..b12eb32f3f 100644 --- a/DBQnA/docker_compose/intel/cpu/xeon/compose.yaml +++ b/DBQnA/docker_compose/intel/cpu/xeon/compose.yaml @@ -31,12 +31,16 @@ services: - ./chinook.sql:/docker-entrypoint-initdb.d/chinook.sql text2sql-service: - image: ${REGISTRY:-opea}/text2sql:${TAG:-latest} + image: ${REGISTRY:-opea}/text2query-sql:${TAG:-latest} container_name: text2sql-service ports: - - "${TEXT2SQL_PORT}:8080" + - "${TEXT2SQL_PORT}:9097" environment: - TGI_LLM_ENDPOINT=${TGI_LLM_ENDPOINT} + - TEXT2QUERY_COMPONENT_NAME=OPEA_TEXT2QUERY_SQL + depends_on: + - tgi-service + - postgres dbqna-xeon-react-ui-server: image: ${REGISTRY:-opea}/text2sql-react-ui:${TAG:-latest} diff --git a/DBQnA/docker_image_build/build.yaml b/DBQnA/docker_image_build/build.yaml index 11d7f518b6..39d00f5916 100644 --- a/DBQnA/docker_image_build/build.yaml +++ b/DBQnA/docker_image_build/build.yaml @@ -2,22 +2,22 @@ # SPDX-License-Identifier: Apache-2.0 services: - text2sql: + text2query-sql: build: context: GenAIComps - dockerfile: comps/text2sql/src/Dockerfile + dockerfile: comps/text2query/src/Dockerfile args: IMAGE_REPO: ${REGISTRY:-opea} BASE_TAG: ${TAG:-latest} http_proxy: ${http_proxy} https_proxy: ${https_proxy} no_proxy: ${no_proxy} - image: ${REGISTRY:-opea}/text2sql:${TAG:-latest} + image: ${REGISTRY:-opea}/text2query-sql:${TAG:-latest} text2sql-react-ui: build: context: ../ui dockerfile: ./docker/Dockerfile.react args: texttosql_url: ${build_texttosql_url} - extends: text2sql + extends: text2query-sql image: ${REGISTRY:-opea}/text2sql-react-ui:${TAG:-latest} diff --git a/DBQnA/tests/test_compose_on_rocm.sh b/DBQnA/tests/test_compose_on_rocm.sh index e2dc0b81d6..f162c073c4 100644 --- a/DBQnA/tests/test_compose_on_rocm.sh +++ b/DBQnA/tests/test_compose_on_rocm.sh @@ -48,9 +48,10 @@ function start_services() { } function validate_microservice() { - result=$(http_proxy="" curl --connect-timeout 5 --max-time 120000 http://${ip_address}:${DBQNA_TEXT_TO_SQL_PORT}/v1/text2sql \ + url="postgresql://${POSTGRES_USER}:${POSTGRES_PASSWORD}@${ip_address}:5442/${POSTGRES_DB}" + result=$(http_proxy="" curl --connect-timeout 5 --max-time 120000 http://${ip_address}:$TEXT2SQL_PORT/v1/text2query\ -X POST \ - -d '{"input_text": "Find the total number of Albums.","conn_str": {"user": "'${POSTGRES_USER}'","password": "'${POSTGRES_PASSWORD}'","host": "'${ip_address}'", "port": "5442", "database": "'${POSTGRES_DB}'" }}' \ + -d '{"query": "Find the total number of Albums.","conn_type": "sql", "conn_url": "'${url}'", "conn_user": "'${POSTGRES_USER}'","conn_password": "'${POSTGRES_PASSWORD}'","conn_dialect": "postgresql" }' \ -H 
'Content-Type: application/json') if echo "$result" | jq -e '.result.output' > /dev/null 2>&1; then @@ -66,35 +67,6 @@ function validate_microservice() { } -function validate_frontend() { - echo "[ TEST INFO ]: --------- frontend test started ---------" - cd $WORKPATH/ui/react - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniconda3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - - source activate ${conda_env_name} - echo "[ TEST INFO ]: --------- conda env activated ---------" - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci - node -v && npm -v && pip list - - exit_status=0 - npm run test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/amd/gpu/rocm/ docker compose stop && docker compose rm -f @@ -118,10 +90,6 @@ function main() { validate_microservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/DBQnA/tests/test_compose_on_xeon.sh b/DBQnA/tests/test_compose_on_xeon.sh index c410cc48f8..09eef4494f 100755 --- a/DBQnA/tests/test_compose_on_xeon.sh +++ b/DBQnA/tests/test_compose_on_xeon.sh @@ -29,6 +29,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/cpu/xeon + export no_proxy="localhost,127.0.0.1,$ip_address" source ./set_env.sh # Start Docker Containers @@ -47,9 +48,10 @@ function start_services() { } function validate_microservice() { - result=$(http_proxy="" curl --connect-timeout 5 --max-time 120000 http://${ip_address}:$TEXT2SQL_PORT/v1/text2sql\ + url="postgresql://${POSTGRES_USER}:${POSTGRES_PASSWORD}@${ip_address}:5442/${POSTGRES_DB}" + result=$(http_proxy="" curl --connect-timeout 5 --max-time 120000 http://${ip_address}:$TEXT2SQL_PORT/v1/text2query\ -X POST \ - -d '{"input_text": "Find the total number of Albums.","conn_str": {"user": "'${POSTGRES_USER}'","password": "'${POSTGRES_PASSWORD}'","host": "'${ip_address}'", "port": "5442", "database": "'${POSTGRES_DB}'" }}' \ + -d '{"query": "Find the total number of Albums.","conn_type": "sql", "conn_url": "'${url}'", "conn_user": "'${POSTGRES_USER}'","conn_password": "'${POSTGRES_PASSWORD}'","conn_dialect": "postgresql" }' \ -H 'Content-Type: application/json') if echo "$result" | jq -e '.result.output' > /dev/null 2>&1; then @@ -65,35 +67,6 @@ function validate_microservice() { } -function validate_frontend() { - echo "[ TEST INFO ]: --------- frontend test started ---------" - cd $WORKPATH/ui/react - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - - source activate ${conda_env_name} - echo "[ TEST INFO ]: --------- conda env activated ---------" - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci - node -v && npm -v && pip list - - exit_status=0 - npm run test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - function stop_docker() { cd $WORKPATH/docker_compose/intel/cpu/xeon docker compose stop && docker compose rm -f @@ -117,10 +90,6 @@ function main() { validate_microservice echo "::endgroup::" - echo "::group::validate_frontend" - validate_frontend - echo "::endgroup::" - echo "::group::stop_docker" stop_docker echo "::endgroup::" diff --git a/DBQnA/tests/test_ui_on_xeon.sh b/DBQnA/tests/test_ui_on_xeon.sh new file mode 100755 index 0000000000..650157e9ce --- /dev/null +++ b/DBQnA/tests/test_ui_on_xeon.sh @@ -0,0 +1,110 @@ +#!/bin/bash +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +set -xe + +IMAGE_REPO=${IMAGE_REPO:-"opea"} +IMAGE_TAG=${IMAGE_TAG:-"latest"} +echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" +echo "TAG=IMAGE_TAG=${IMAGE_TAG}" +export REGISTRY=${IMAGE_REPO} +export TAG=${IMAGE_TAG} +export MODEL_CACHE=${model_cache:-"./data"} + +WORKPATH=$(dirname "$PWD") +LOG_PATH="$WORKPATH/tests" +ip_address=$(hostname -I | awk '{print $1}') + +function build_docker_images() { + cd $WORKPATH/docker_image_build + git clone --single-branch --branch "${opea_branch:-"main"}" https://github.com/opea-project/GenAIComps.git + + echo "Build all the images with --no-cache, check docker_image_build.log for details..." + docker compose -f build.yaml build --no-cache > ${LOG_PATH}/docker_image_build.log + + docker pull ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu + docker images && sleep 1s +} + +function start_services() { + cd $WORKPATH/docker_compose/intel/cpu/xeon + export no_proxy="localhost,127.0.0.1,$ip_address" + source ./set_env.sh + + # Start Docker Containers + docker compose -f compose.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + + # check whether tgi is fully ready. + n=0 + until [[ "$n" -ge 100 ]] || [[ $ready == true ]]; do + docker logs tgi-service > ${LOG_PATH}/tgi.log + n=$((n+1)) + if grep -q Connected ${LOG_PATH}/tgi.log; then + break + fi + sleep 5s + done +} + +function validate_frontend() { + echo "[ TEST INFO ]: --------- frontend test started ---------" + cd $WORKPATH/ui/react + local conda_env_name="OPEA_e2e" + export PATH=${HOME}/miniforge3/bin/:$PATH + if conda info --envs | grep -q "$conda_env_name"; then + echo "$conda_env_name exist!" + else + conda create -n ${conda_env_name} python=3.12 -y + fi + + source activate ${conda_env_name} + echo "[ TEST INFO ]: --------- conda env activated ---------" + + conda install -c conda-forge nodejs=22.6.0 -y + npm install && npm ci + node -v && npm -v && pip list + + exit_status=0 + npm run test || exit_status=$? 
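+  # Record the npm test exit code instead of letting 'set -xe' abort, so pass/fail can be logged before exiting.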
+ + if [ $exit_status -ne 0 ]; then + echo "[TEST INFO]: ---------frontend test failed---------" + exit $exit_status + else + echo "[TEST INFO]: ---------frontend test passed---------" + fi +} + +function stop_docker() { + cd $WORKPATH/docker_compose/intel/cpu/xeon + docker compose stop && docker compose rm -f +} + +function main() { + + echo "::group::stop_docker" + stop_docker + echo "::endgroup::" + + echo "::group::build_docker_images" + if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi + echo "::endgroup::" + + echo "::group::start_services" + start_services + echo "::endgroup::" + + echo "::group::validate_frontend" + validate_frontend + echo "::endgroup::" + + echo "::group::stop_docker" + stop_docker + echo "::endgroup::" + + docker system prune -f + +} + +main diff --git a/DBQnA/ui/react/src/App.test.tsx b/DBQnA/ui/react/src/App.test.tsx index 5b346e8cb1..db16928d3a 100644 --- a/DBQnA/ui/react/src/App.test.tsx +++ b/DBQnA/ui/react/src/App.test.tsx @@ -21,21 +21,17 @@ const getHostIP = () => { test('testing api with dynamic host', async () => { // Get the dynamic host IP const host = await getHostIP(); - const endpointUrl = `http://${host}:9090/v1/text2sql`; - - const formData = { - user: 'postgres', - database: 'chinook', - host: host, - password: 'testpwd', - port: '5442', - }; - + const endpointUrl = `http://${host}:9090/v1/text2query`; + const connUrl = `postgresql://postgres:testpwd@${host}:5442/chinook`; const question = "Find the total number of invoices."; const payload = { - input_text: question, - conn_str: formData, + query: question, + conn_type: "sql", + conn_url: connUrl, + conn_user: "postgres", + conn_password: "testpwd", + conn_dialect: "postgresql", }; const response = await axios.post(endpointUrl, payload); @@ -47,6 +43,6 @@ test('testing api with dynamic host', async () => { expect(result.hasOwnProperty('sql')).toBe(true); expect(result.hasOwnProperty('output')).toBe(true); expect(result.hasOwnProperty('input')).toBe(true); - expect(result.input.input_text).toBe(question); + expect(result.input.query).toBe(question); }, apiTimeOutInSeconds * 1000); diff --git a/DBQnA/ui/react/src/components/DbConnect/DBConnect.tsx b/DBQnA/ui/react/src/components/DbConnect/DBConnect.tsx index bd41665e73..41e1a5b114 100644 --- a/DBQnA/ui/react/src/components/DbConnect/DBConnect.tsx +++ b/DBQnA/ui/react/src/components/DbConnect/DBConnect.tsx @@ -42,8 +42,15 @@ const DBConnect: React.FC = () => { e.preventDefault(); try { let api_response: Record; - let unifiedConnData = {"conn_str":formData}; - api_response = await axios.post(`${TEXT_TO_SQL_URL}/postgres/health`, unifiedConnData); + let connUrl = `postgresql://${formData.user}:${formData.password}@${formData.host}:${formData.port}/${formData.database}`; + let unifiedConnData = { + conn_type: "sql", + conn_url: connUrl, + conn_user: formData.user, + conn_password: formData.password, + conn_dialect: "postgresql", + }; + api_response = await axios.post(`${TEXT_TO_SQL_URL}/db/health`, unifiedConnData); setSqlStatus(null); setSqlError(null); @@ -74,13 +81,18 @@ const DBConnect: React.FC = () => { e.preventDefault(); setIsLoading(true); try { + const connUrl = `postgresql://${formData.user}:${formData.password}@${formData.host}:${formData.port}/${formData.database}`; const payload = { - input_text: question, - conn_str: formData, + query: question, + conn_type: "sql", + conn_url: connUrl, + conn_user: formData.user, + conn_password: formData.password, + conn_dialect: "postgresql", }; let api_response: Record; - api_response 
= await axios.post(`${TEXT_TO_SQL_URL}/text2sql`, payload); + api_response = await axios.post(`${TEXT_TO_SQL_URL}/text2query`, payload); setSqlQuery(api_response.data.result.sql); // Assuming the API returns an SQL query setQueryOutput(api_response.data.result.output); diff --git a/DeepResearchAgent/Dockerfile b/DeepResearchAgent/Dockerfile index d35d3ea7ea..e84b5e34ae 100644 --- a/DeepResearchAgent/Dockerfile +++ b/DeepResearchAgent/Dockerfile @@ -3,7 +3,7 @@ ARG IMAGE_REPO=opea ARG BASE_TAG=latest -FROM $IMAGE_REPO/comps-base:$BASE_TAG +FROM opea/comps-base:$BASE_TAG COPY ./deep_researcher.yaml $HOME/deep_researcher.yaml COPY ./utils.py $HOME/utils.py @@ -17,4 +17,4 @@ RUN pip install --no-cache-dir --upgrade pip setuptools uv && \ USER user -ENTRYPOINT ["python", "research_agent.py"] +ENTRYPOINT ["python", "research_agent.py"] \ No newline at end of file diff --git a/DeepResearchAgent/docker_compose/intel/hpu/gaudi/compose.yaml b/DeepResearchAgent/docker_compose/intel/hpu/gaudi/compose.yaml index dc7a05c270..d49af13a94 100644 --- a/DeepResearchAgent/docker_compose/intel/hpu/gaudi/compose.yaml +++ b/DeepResearchAgent/docker_compose/intel/hpu/gaudi/compose.yaml @@ -20,7 +20,7 @@ x-common-agent-environment: services: vllm-service: - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} + image: opea/vllm-gaudi:1.22.0 container_name: vllm-gaudi-server ports: - "8000:8000" diff --git a/DeepResearchAgent/docker_compose/intel/hpu/gaudi/set_env.sh b/DeepResearchAgent/docker_compose/intel/hpu/gaudi/set_env.sh index e38d0ef378..9df0330f46 100644 --- a/DeepResearchAgent/docker_compose/intel/hpu/gaudi/set_env.sh +++ b/DeepResearchAgent/docker_compose/intel/hpu/gaudi/set_env.sh @@ -4,7 +4,7 @@ # SPDX-License-Identifier: Apache-2.0 # Navigate to the parent directory and source the environment -SCRIPT_DIR=$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" &> /dev/null && pwd) +SCRIPT_DIR="$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" &> /dev/null && pwd)" pushd "$SCRIPT_DIR/../../../../../" > /dev/null source .set_env.sh diff --git a/DeepResearchAgent/docker_image_build/build.yaml b/DeepResearchAgent/docker_image_build/build.yaml index 5ac2e17a90..09ef66da26 100644 --- a/DeepResearchAgent/docker_image_build/build.yaml +++ b/DeepResearchAgent/docker_image_build/build.yaml @@ -13,9 +13,3 @@ services: context: ../ dockerfile: ./Dockerfile image: ${REGISTRY:-opea}/deep-research-agent:${TAG:-latest} - vllm-gaudi: - build: - context: vllm-fork - dockerfile: Dockerfile.hpu - extends: deep-research-agent - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} diff --git a/DeepResearchAgent/tests/test_compose_on_gaudi.sh b/DeepResearchAgent/tests/test_compose_on_gaudi.sh index c180640201..e76a66b9cc 100644 --- a/DeepResearchAgent/tests/test_compose_on_gaudi.sh +++ b/DeepResearchAgent/tests/test_compose_on_gaudi.sh @@ -25,9 +25,6 @@ function build_docker_images() { echo "GenAIComps test commit is $(git rev-parse HEAD)" docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork - VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0 - git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../ echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
docker compose -f build.yaml build --no-cache > ${LOG_PATH}/docker_image_build.log @@ -37,6 +34,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/hpu/gaudi + export no_proxy="localhost,127.0.0.1,$ip_address" source set_env.sh # Start Docker Containers diff --git a/DocIndexRetriever/tests/test_compose_milvus_on_gaudi.sh b/DocIndexRetriever/tests/test_compose_milvus_on_gaudi.sh index 46c5f22f0e..5f3f90842b 100644 --- a/DocIndexRetriever/tests/test_compose_milvus_on_gaudi.sh +++ b/DocIndexRetriever/tests/test_compose_milvus_on_gaudi.sh @@ -35,6 +35,7 @@ function build_docker_images() { function start_services() { echo "Starting Docker Services...." cd $WORKPATH/docker_compose/intel/hpu/gaudi + export no_proxy="localhost,127.0.0.1,$ip_address" source ./set_env.sh # Start Docker Containers diff --git a/DocIndexRetriever/tests/test_compose_milvus_on_xeon.sh b/DocIndexRetriever/tests/test_compose_milvus_on_xeon.sh index 37bf681dcf..80f18fa515 100755 --- a/DocIndexRetriever/tests/test_compose_milvus_on_xeon.sh +++ b/DocIndexRetriever/tests/test_compose_milvus_on_xeon.sh @@ -35,6 +35,7 @@ function build_docker_images() { function start_services() { echo "Starting Docker Services...." cd $WORKPATH/docker_compose/intel/cpu/xeon + export no_proxy="localhost,127.0.0.1,$ip_address" source ./set_env.sh # Start Docker Containers diff --git a/DocIndexRetriever/tests/test_compose_on_gaudi.sh b/DocIndexRetriever/tests/test_compose_on_gaudi.sh index 11541eca1e..e65dbb8a15 100644 --- a/DocIndexRetriever/tests/test_compose_on_gaudi.sh +++ b/DocIndexRetriever/tests/test_compose_on_gaudi.sh @@ -35,6 +35,7 @@ function build_docker_images() { function start_services() { echo "Starting Docker Services...." cd $WORKPATH/docker_compose/intel/hpu/gaudi + export no_proxy="localhost,127.0.0.1,$ip_address" source ./set_env.sh # Start Docker Containers diff --git a/DocIndexRetriever/tests/test_compose_on_xeon.sh b/DocIndexRetriever/tests/test_compose_on_xeon.sh index 229e47efea..92289e8bf5 100644 --- a/DocIndexRetriever/tests/test_compose_on_xeon.sh +++ b/DocIndexRetriever/tests/test_compose_on_xeon.sh @@ -35,6 +35,7 @@ function build_docker_images() { function start_services() { echo "Starting Docker Services...." cd $WORKPATH/docker_compose/intel/cpu/xeon + export no_proxy="localhost,127.0.0.1,$ip_address" source ./set_env.sh # Start Docker Containers diff --git a/DocIndexRetriever/tests/test_compose_without_rerank_on_xeon.sh b/DocIndexRetriever/tests/test_compose_without_rerank_on_xeon.sh index 37c477b2ad..96a8da8f6d 100644 --- a/DocIndexRetriever/tests/test_compose_without_rerank_on_xeon.sh +++ b/DocIndexRetriever/tests/test_compose_without_rerank_on_xeon.sh @@ -39,6 +39,7 @@ function build_docker_images() { function start_services() { echo "Starting Docker Services...." 
cd $WORKPATH/docker_compose/intel/cpu/xeon + export no_proxy="localhost,127.0.0.1,$ip_address" source ./set_env.sh # Start Docker Containers diff --git a/DocSum/docker_compose/amd/cpu/epyc/compose.yaml b/DocSum/docker_compose/amd/cpu/epyc/compose.yaml index ba0c4c0178..3a687b9b9c 100644 --- a/DocSum/docker_compose/amd/cpu/epyc/compose.yaml +++ b/DocSum/docker_compose/amd/cpu/epyc/compose.yaml @@ -4,7 +4,7 @@ services: vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: docsum-epyc-vllm-service ports: - "8008:80" diff --git a/DocSum/docker_compose/intel/cpu/xeon/README.md b/DocSum/docker_compose/intel/cpu/xeon/README.md index e0b2ab26c0..acd64b9eca 100644 --- a/DocSum/docker_compose/intel/cpu/xeon/README.md +++ b/DocSum/docker_compose/intel/cpu/xeon/README.md @@ -13,13 +13,26 @@ This example includes the following sections: This section describes how to quickly deploy and test the DocSum service manually on an Intel Xeon platform. The basic steps are: -1. [Access the Code](#access-the-code) -2. [Generate a HuggingFace Access Token](#generate-a-huggingface-access-token) -3. [Configure the Deployment Environment](#configure-the-deployment-environment) -4. [Deploy the Services Using Docker Compose](#deploy-the-services-using-docker-compose) -5. [Check the Deployment Status](#check-the-deployment-status) -6. [Test the Pipeline](#test-the-pipeline) -7. [Cleanup the Deployment](#cleanup-the-deployment) +- [Example DocSum deployments on Intel Xeon Processor](#example-docsum-deployments-on-intel-xeon-processor) + - [DocSum Quick Start Deployment](#docsum-quick-start-deployment) + - [Access the Code and Set Up Environment](#access-the-code-and-set-up-environment) + - [Generate a HuggingFace Access Token](#generate-a-huggingface-access-token) + - [Deploy the Services Using Docker Compose](#deploy-the-services-using-docker-compose) + - [Option #1](#option-1) + - [Option #2](#option-2) + - [Check the Deployment Status](#check-the-deployment-status) + - [Test the Pipeline](#test-the-pipeline) + - [Cleanup the Deployment](#cleanup-the-deployment) + - [DocSum Docker Compose Files](#docsum-docker-compose-files) + - [Running LLM models with remote endpoints](#running-llm-models-with-remote-endpoints) + - [DocSum Detailed Usage](#docsum-detailed-usage) + - [Query with text](#query-with-text) + - [Query with audio and video](#query-with-audio-and-video) + - [Query with long context](#query-with-long-context) + - [Launch the UI](#launch-the-ui) + - [Gradio UI](#gradio-ui) + - [Launch the Svelte UI](#launch-the-svelte-ui) + - [Launch the React UI (Optional)](#launch-the-react-ui-optional) ### Access the Code and Set Up Environment @@ -28,7 +41,7 @@ Clone the GenAIExample repository and access the ChatQnA Intel Xeon platform Doc ```bash git clone https://github.com/opea-project/GenAIExamples.git cd GenAIExamples/DocSum/docker_compose -source intel/set_env.sh +source intel/cpu/xeon/set_env.sh ``` > NOTE: by default vLLM does "warmup" at start, to optimize its performance for the specified model and the underlying platform, which can take long time. For development (and e.g. autoscaling) it can be skipped with `export VLLM_SKIP_WARMUP=true`. @@ -47,6 +60,8 @@ Some HuggingFace resources, such as some models, are only accessible if you have ### Deploy the Services Using Docker Compose +#### Option #1 + To deploy the DocSum services, execute the `docker compose up` command with the appropriate arguments. 
For a default deployment, execute: ```bash @@ -54,6 +69,17 @@ cd intel/cpu/xeon/ docker compose up -d ``` +#### Option #2 + +> NOTE: To enable monitoring, the `compose.monitoring.yaml` file needs to be merged with the default `compose.yaml` file. + +To deploy with monitoring: + +```bash +cd intel/cpu/xeon/ +docker compose -f compose.yaml -f compose.monitoring.yaml up -d +``` + **Note**: developers should build docker image from source when: - Developing off the git main branch (as the container's ports in the repo may be different from the published docker image). @@ -109,17 +135,25 @@ To stop the containers associated with the deployment, execute the following command: docker compose -f compose.yaml down ``` +If monitoring is enabled, execute the following command: + +```bash +cd intel/cpu/xeon/ +docker compose -f compose.yaml -f compose.monitoring.yaml down +``` + All the DocSum containers will be stopped and then removed on completion of the "down" command. ## DocSum Docker Compose Files In the context of deploying a DocSum pipeline on an Intel® Xeon® platform, we can pick and choose different large language model serving frameworks. The table below outlines the various configurations that are available as part of the application. -| File | Description | | -------------------------------------------- | -------------------------------------------------------------------------------------- | | [compose.yaml](./compose.yaml) | Default compose file using vllm as serving framework | | [compose_tgi.yaml](./compose_tgi.yaml) | The LLM serving framework is TGI. All other configurations remain the same as default | | [compose_remote.yaml](./compose_remote.yaml) | Uses remote inference endpoints for LLMs. All other configurations are same as default | +| File | Description | | ---------------------------------------------------- | -------------------------------------------------------------------------------------- | | [compose.yaml](./compose.yaml) | Default compose file using vllm as serving framework | | [compose_tgi.yaml](./compose_tgi.yaml) | The LLM serving framework is TGI. All other configurations remain the same as default | | [compose_remote.yaml](./compose_remote.yaml) | Uses remote inference endpoints for LLMs. All other configurations are same as default | +| [compose.monitoring.yaml](./compose.monitoring.yaml) | Helper file for monitoring features.
Can be used along with any compose files | ### Running LLM models with remote endpoints diff --git a/DocSum/docker_compose/intel/cpu/xeon/compose.monitoring.yaml b/DocSum/docker_compose/intel/cpu/xeon/compose.monitoring.yaml new file mode 100644 index 0000000000..187427d348 --- /dev/null +++ b/DocSum/docker_compose/intel/cpu/xeon/compose.monitoring.yaml @@ -0,0 +1,59 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +services: + prometheus: + image: prom/prometheus:v2.52.0 + container_name: opea_prometheus + user: root + volumes: + - ./prometheus.yaml:/etc/prometheus/prometheus.yaml + - ./prometheus_data:/prometheus + command: + - '--config.file=/etc/prometheus/prometheus.yaml' + ports: + - '9090:9090' + ipc: host + restart: unless-stopped + + grafana: + image: grafana/grafana:11.0.0 + container_name: grafana + volumes: + - ./grafana_data:/var/lib/grafana + - ./grafana/dashboards:/var/lib/grafana/dashboards + - ./grafana/provisioning:/etc/grafana/provisioning + user: root + environment: + GF_SECURITY_ADMIN_PASSWORD: admin + GF_RENDERING_CALLBACK_URL: http://grafana:3000/ + GF_LOG_FILTERS: rendering:debug + no_proxy: ${no_proxy} + host_ip: ${host_ip} + depends_on: + - prometheus + ports: + - '3000:3000' + ipc: host + restart: unless-stopped + + node-exporter: + image: prom/node-exporter + container_name: node-exporter + volumes: + - /proc:/host/proc:ro + - /sys:/host/sys:ro + - /:/rootfs:ro + command: + - '--path.procfs=/host/proc' + - '--path.sysfs=/host/sys' + - --collector.filesystem.ignored-mount-points + - "^/(sys|proc|dev|host|etc|rootfs/var/lib/docker/containers|rootfs/var/lib/docker/overlay2|rootfs/run/docker/netns|rootfs/var/lib/docker/aufs)($$|/)" + environment: + no_proxy: ${no_proxy} + ports: + - 9100:9100 + ipc: host + restart: always + deploy: + mode: global diff --git a/DocSum/docker_compose/intel/cpu/xeon/compose.yaml b/DocSum/docker_compose/intel/cpu/xeon/compose.yaml index 917bfc1140..163129ce95 100644 --- a/DocSum/docker_compose/intel/cpu/xeon/compose.yaml +++ b/DocSum/docker_compose/intel/cpu/xeon/compose.yaml @@ -3,7 +3,7 @@ services: vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + image: public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.10.1 container_name: docsum-xeon-vllm-service ports: - ${LLM_ENDPOINT_PORT:-8008}:80 diff --git a/DocSum/docker_compose/intel/cpu/xeon/grafana/dashboards/download_opea_dashboard.sh b/DocSum/docker_compose/intel/cpu/xeon/grafana/dashboards/download_opea_dashboard.sh new file mode 100644 index 0000000000..5b59b3cd34 --- /dev/null +++ b/DocSum/docker_compose/intel/cpu/xeon/grafana/dashboards/download_opea_dashboard.sh @@ -0,0 +1,11 @@ +#!/bin/bash +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +if ls *.json 1> /dev/null 2>&1; then + rm *.json +fi + +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/vllm_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/tgi_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/docsum_megaservice_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/node_grafana.json diff --git a/DocSum/docker_compose/intel/cpu/xeon/grafana/provisioning/dashboards/local.yaml b/DocSum/docker_compose/intel/cpu/xeon/grafana/provisioning/dashboards/local.yaml new file mode 100644 index 0000000000..13922a769b --- 
/dev/null +++ b/DocSum/docker_compose/intel/cpu/xeon/grafana/provisioning/dashboards/local.yaml @@ -0,0 +1,14 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +apiVersion: 1 + +providers: +- name: 'default' + orgId: 1 + folder: '' + type: file + disableDeletion: false + updateIntervalSeconds: 10 #how often Grafana will scan for changed dashboards + options: + path: /var/lib/grafana/dashboards diff --git a/DocSum/docker_compose/intel/cpu/xeon/grafana/provisioning/datasources/datasource.yml b/DocSum/docker_compose/intel/cpu/xeon/grafana/provisioning/datasources/datasource.yml new file mode 100644 index 0000000000..a206521d67 --- /dev/null +++ b/DocSum/docker_compose/intel/cpu/xeon/grafana/provisioning/datasources/datasource.yml @@ -0,0 +1,54 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +# config file version +apiVersion: 1 + +# list of datasources that should be deleted from the database +deleteDatasources: + - name: Prometheus + orgId: 1 + +# list of datasources to insert/update depending +# what's available in the database +datasources: + # name of the datasource. Required +- name: Prometheus + # datasource type. Required + type: prometheus + # access mode. direct or proxy. Required + access: proxy + # org id. will default to orgId 1 if not specified + orgId: 1 + # url + url: http://$host_ip:9090 + # database password, if used + password: + # database user, if used + user: + # database name, if used + database: + # enable/disable basic auth + basicAuth: false + # basic auth username, if used + basicAuthUser: + # basic auth password, if used + basicAuthPassword: + # enable/disable with credentials headers + withCredentials: + # mark as default datasource. Max one per org + isDefault: true + # fields that will be converted to json and stored in json_data + jsonData: + httpMethod: GET + graphiteVersion: "1.1" + tlsAuth: false + tlsAuthWithCACert: false + # json object of data that will be encrypted. + secureJsonData: + tlsCACert: "..." + tlsClientCert: "..." + tlsClientKey: "..." + version: 1 + # allow users to edit datasources from the UI. 
+ editable: true diff --git a/DocSum/docker_compose/intel/cpu/xeon/prometheus.yaml b/DocSum/docker_compose/intel/cpu/xeon/prometheus.yaml new file mode 100644 index 0000000000..758627c077 --- /dev/null +++ b/DocSum/docker_compose/intel/cpu/xeon/prometheus.yaml @@ -0,0 +1,27 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +# [IP_ADDR]:{PORT_OUTSIDE_CONTAINER} -> {PORT_INSIDE_CONTAINER} / {PROTOCOL} +global: + scrape_interval: 5s + external_labels: + monitor: "my-monitor" +scrape_configs: + - job_name: "prometheus" + static_configs: + - targets: ["opea_prometheus:9090"] + - job_name: "vllm" + metrics_path: /metrics + static_configs: + - targets: ["docsum-xeon-vllm-service:80"] + - job_name: "tgi" + metrics_path: /metrics + static_configs: + - targets: ["docsum-xeon-tgi-server:80"] + - job_name: "docsum-backend-server" + metrics_path: /metrics + static_configs: + - targets: ["docsum-xeon-backend-server:8888"] + - job_name: "prometheus-node-exporter" + metrics_path: /metrics + static_configs: + - targets: ["node-exporter:9100"] diff --git a/DocSum/docker_compose/intel/set_env.sh b/DocSum/docker_compose/intel/cpu/xeon/set_env.sh similarity index 68% rename from DocSum/docker_compose/intel/set_env.sh rename to DocSum/docker_compose/intel/cpu/xeon/set_env.sh index 0411335847..07f734f36e 100644 --- a/DocSum/docker_compose/intel/set_env.sh +++ b/DocSum/docker_compose/intel/cpu/xeon/set_env.sh @@ -2,15 +2,14 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 -SCRIPT_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) -pushd "${SCRIPT_DIR}/../../.." > /dev/null + +SCRIPT_DIR=$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" &> /dev/null && pwd) + +pushd "$SCRIPT_DIR/../../../../../" > /dev/null source .set_env.sh popd > /dev/null export host_ip=$(hostname -I | awk '{print $1}') # Example: host_ip="192.168.1.1" -export no_proxy="${no_proxy},${host_ip}" # Example: no_proxy="localhost, 127.0.0.1, 192.168.1.1" -export http_proxy=$http_proxy -export https_proxy=$https_proxy export HF_TOKEN=${HF_TOKEN} export LLM_ENDPOINT_PORT=8008 @@ -41,3 +40,13 @@ export NUM_CARDS=1 export BLOCK_SIZE=128 export MAX_NUM_SEQS=256 export MAX_SEQ_LEN_TO_CAPTURE=2048 + +# Download Grafana configurations +pushd "${SCRIPT_DIR}/grafana/dashboards" > /dev/null +source download_opea_dashboard.sh +popd > /dev/null + +# Set network proxy settings +export no_proxy="${no_proxy},${host_ip},docsum-xeon-vllm-service,docsum-xeon-tgi-server,docsum-xeon-backend-server,opea_prometheus,grafana,node-exporter,$JAEGER_IP" # Example: no_proxy="localhost, 127.0.0.1, 192.168.1.1" +export http_proxy=$http_proxy +export https_proxy=$https_proxy diff --git a/DocSum/docker_compose/intel/hpu/gaudi/README.md b/DocSum/docker_compose/intel/hpu/gaudi/README.md index 03e53101e1..70e251e869 100644 --- a/DocSum/docker_compose/intel/hpu/gaudi/README.md +++ b/DocSum/docker_compose/intel/hpu/gaudi/README.md @@ -15,13 +15,25 @@ This example includes the following sections: This section describes how to quickly deploy and test the DocSum service manually on an Intel® Gaudi® platform. The basic steps are: -1. [Access the Code](#access-the-code) -2. [Generate a HuggingFace Access Token](#generate-a-huggingface-access-token) -3. [Configure the Deployment Environment](#configure-the-deployment-environment) -4. [Deploy the Services Using Docker Compose](#deploy-the-services-using-docker-compose) -5. [Check the Deployment Status](#check-the-deployment-status) -6. [Test the Pipeline](#test-the-pipeline) -7. 
[Cleanup the Deployment](#cleanup-the-deployment) +- [Example DocSum deployments on Intel® Gaudi® Platform](#example-docsum-deployments-on-intel-gaudi-platform) + - [DocSum Quick Start Deployment](#docsum-quick-start-deployment) + - [Access the Code and Set Up Environment](#access-the-code-and-set-up-environment) + - [Generate a HuggingFace Access Token](#generate-a-huggingface-access-token) + - [Deploy the Services Using Docker Compose](#deploy-the-services-using-docker-compose) + - [Option #1](#option-1) + - [Option #2](#option-2) + - [Check the Deployment Status](#check-the-deployment-status) + - [Test the Pipeline](#test-the-pipeline) + - [Cleanup the Deployment](#cleanup-the-deployment) + - [DocSum Docker Compose Files](#docsum-docker-compose-files) + - [DocSum Detailed Usage](#docsum-detailed-usage) + - [Query with text](#query-with-text) + - [Query with audio and video](#query-with-audio-and-video) + - [Query with long context](#query-with-long-context) + - [Launch the UI](#launch-the-ui) + - [Gradio UI](#gradio-ui) + - [Launch the Svelte UI](#launch-the-svelte-ui) + - [Launch the React UI (Optional)](#launch-the-react-ui-optional) ### Access the Code and Set Up Environment @@ -30,7 +42,7 @@ Clone the GenAIExample repository and access the DocSum Intel® Gaudi® platform ```bash git clone https://github.com/opea-project/GenAIExamples.git cd GenAIExamples/DocSum/docker_compose -source intel/set_env.sh +source intel/hpu/gaudi/set_env.sh ``` > NOTE: by default vLLM does "warmup" at start, to optimize its performance for the specified model and the underlying platform, which can take long time. For development (and e.g. autoscaling) it can be skipped with `export VLLM_SKIP_WARMUP=true`. @@ -49,6 +61,8 @@ Some HuggingFace resources, such as some models, are only accessible if you have ### Deploy the Services Using Docker Compose +#### Option #1 + To deploy the DocSum services, execute the `docker compose up` command with the appropriate arguments. For a default deployment, execute: ```bash @@ -56,6 +70,17 @@ cd intel/hpu/gaudi/ docker compose up -d ``` +#### Option #2 + +> NOTE: To enable monitoring, the `compose.monitoring.yaml` file needs to be merged with the default `compose.yaml` file. + +To deploy with monitoring: + +```bash +cd intel/hpu/gaudi/ +docker compose -f compose.yaml -f compose.monitoring.yaml up -d +``` + **Note**: developers should build docker image from source when: - Developing off the git main branch (as the container's ports in the repo may be different from the published docker image). @@ -117,10 +142,11 @@ All the DocSum containers will be stopped and then removed on completion of the In the context of deploying a DocSum pipeline on an Intel® Gaudi® platform, the allocation and utilization of Gaudi devices across different services are important considerations for optimizing performance and resource efficiency. Each of the example deployments, defined by the example Docker compose yaml files, demonstrates a unique approach to leveraging Gaudi hardware, reflecting different priorities and operational strategies. -| File | Description | | -------------------------------------- | ----------------------------------------------------------------------------------------- | | [compose.yaml](./compose.yaml) | Default compose file using vllm as serving framework | | [compose_tgi.yaml](./compose_tgi.yaml) | The LLM serving framework is TGI.
All other configurations remain the same as the default | +| File | Description | +| ---------------------------------------------------- | ----------------------------------------------------------------------------------------- | +| [compose.yaml](./compose.yaml) | Default compose file using vllm as serving framework | +| [compose_tgi.yaml](./compose_tgi.yaml) | The LLM serving framework is TGI. All other configurations remain the same as the default | +| [compose.monitoring.yaml](./compose.monitoring.yaml) | Helper file for monitoring features. Can be used along with any compose files | ## DocSum Detailed Usage diff --git a/DocSum/docker_compose/intel/hpu/gaudi/compose.monitoring.yaml b/DocSum/docker_compose/intel/hpu/gaudi/compose.monitoring.yaml new file mode 100644 index 0000000000..691671e656 --- /dev/null +++ b/DocSum/docker_compose/intel/hpu/gaudi/compose.monitoring.yaml @@ -0,0 +1,75 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +services: + prometheus: + image: prom/prometheus:v2.52.0 + container_name: opea_prometheus + user: root + volumes: + - ./prometheus.yaml:/etc/prometheus/prometheus.yaml + - ./prometheus_data:/prometheus + command: + - '--config.file=/etc/prometheus/prometheus.yaml' + ports: + - '9090:9090' + ipc: host + restart: unless-stopped + + grafana: + image: grafana/grafana:11.0.0 + container_name: grafana + volumes: + - ./grafana_data:/var/lib/grafana + - ./grafana/dashboards:/var/lib/grafana/dashboards + - ./grafana/provisioning:/etc/grafana/provisioning + user: root + environment: + GF_SECURITY_ADMIN_PASSWORD: admin + GF_RENDERING_CALLBACK_URL: http://grafana:3000/ + GF_LOG_FILTERS: rendering:debug + no_proxy: ${no_proxy} + host_ip: ${host_ip} + depends_on: + - prometheus + ports: + - '3000:3000' + ipc: host + restart: unless-stopped + + node-exporter: + image: prom/node-exporter + container_name: node-exporter + volumes: + - /proc:/host/proc:ro + - /sys:/host/sys:ro + - /:/rootfs:ro + command: + - '--path.procfs=/host/proc' + - '--path.rootfs=/rootfs' + - '--path.sysfs=/host/sys' + - '--path.udev.data=/rootfs/run/udev/data' + - --collector.filesystem.ignored-mount-points + - "^/(sys|proc|dev|host|etc|rootfs/var/lib/docker/containers|rootfs/var/lib/docker/overlay2|rootfs/run/docker/netns|rootfs/var/lib/docker/aufs)($$|/)" + environment: + no_proxy: ${no_proxy} + ports: + - 9100:9100 + restart: always + deploy: + mode: global + + gaudi-metrics-exporter: + image: vault.habana.ai/gaudi-metric-exporter/metric-exporter:latest + privileged: true + container_name: gaudi-metrics-exporter + volumes: + - /proc:/host/proc:ro + - /sys:/host/sys:ro + - /:/rootfs:ro + - /dev:/dev + deploy: + mode: global + ports: + - 41611:41611 + restart: unless-stopped diff --git a/DocSum/docker_compose/intel/hpu/gaudi/compose.yaml b/DocSum/docker_compose/intel/hpu/gaudi/compose.yaml index 9311817f32..fbc10c06ca 100644 --- a/DocSum/docker_compose/intel/hpu/gaudi/compose.yaml +++ b/DocSum/docker_compose/intel/hpu/gaudi/compose.yaml @@ -3,7 +3,7 @@ services: vllm-service: - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} + image: opea/vllm-gaudi:1.4 container_name: docsum-gaudi-vllm-service ports: - ${LLM_ENDPOINT_PORT:-8008}:80 diff --git a/DocSum/docker_compose/intel/hpu/gaudi/grafana/dashboards/download_opea_dashboard.sh b/DocSum/docker_compose/intel/hpu/gaudi/grafana/dashboards/download_opea_dashboard.sh new file mode 100644 index 0000000000..b02827a300 --- /dev/null +++ 
b/DocSum/docker_compose/intel/hpu/gaudi/grafana/dashboards/download_opea_dashboard.sh @@ -0,0 +1,13 @@ +#!/bin/bash +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +if ls *.json 1> /dev/null 2>&1; then + rm *.json +fi + +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/vllm_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/tgi_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/gaudi_grafana_v2.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/docsum_megaservice_grafana.json +wget https://raw.githubusercontent.com/opea-project/GenAIEval/refs/heads/main/evals/benchmark/grafana/node_grafana.json diff --git a/DocSum/docker_compose/intel/hpu/gaudi/grafana/provisioning/dashboards/local.yaml b/DocSum/docker_compose/intel/hpu/gaudi/grafana/provisioning/dashboards/local.yaml new file mode 100644 index 0000000000..13922a769b --- /dev/null +++ b/DocSum/docker_compose/intel/hpu/gaudi/grafana/provisioning/dashboards/local.yaml @@ -0,0 +1,14 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +apiVersion: 1 + +providers: +- name: 'default' + orgId: 1 + folder: '' + type: file + disableDeletion: false + updateIntervalSeconds: 10 #how often Grafana will scan for changed dashboards + options: + path: /var/lib/grafana/dashboards diff --git a/DocSum/docker_compose/intel/hpu/gaudi/grafana/provisioning/datasources/datasource.yml b/DocSum/docker_compose/intel/hpu/gaudi/grafana/provisioning/datasources/datasource.yml new file mode 100644 index 0000000000..a206521d67 --- /dev/null +++ b/DocSum/docker_compose/intel/hpu/gaudi/grafana/provisioning/datasources/datasource.yml @@ -0,0 +1,54 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +# config file version +apiVersion: 1 + +# list of datasources that should be deleted from the database +deleteDatasources: + - name: Prometheus + orgId: 1 + +# list of datasources to insert/update depending +# what's available in the database +datasources: + # name of the datasource. Required +- name: Prometheus + # datasource type. Required + type: prometheus + # access mode. direct or proxy. Required + access: proxy + # org id. will default to orgId 1 if not specified + orgId: 1 + # url + url: http://$host_ip:9090 + # database password, if used + password: + # database user, if used + user: + # database name, if used + database: + # enable/disable basic auth + basicAuth: false + # basic auth username, if used + basicAuthUser: + # basic auth password, if used + basicAuthPassword: + # enable/disable with credentials headers + withCredentials: + # mark as default datasource. Max one per org + isDefault: true + # fields that will be converted to json and stored in json_data + jsonData: + httpMethod: GET + graphiteVersion: "1.1" + tlsAuth: false + tlsAuthWithCACert: false + # json object of data that will be encrypted. + secureJsonData: + tlsCACert: "..." + tlsClientCert: "..." + tlsClientKey: "..." + version: 1 + # allow users to edit datasources from the UI. 
+ editable: true diff --git a/DocSum/docker_compose/intel/hpu/gaudi/prometheus.yaml b/DocSum/docker_compose/intel/hpu/gaudi/prometheus.yaml new file mode 100644 index 0000000000..16693ae112 --- /dev/null +++ b/DocSum/docker_compose/intel/hpu/gaudi/prometheus.yaml @@ -0,0 +1,34 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +# [IP_ADDR]:{PORT_OUTSIDE_CONTAINER} -> {PORT_INSIDE_CONTAINER} / {PROTOCOL} +global: + scrape_interval: 5s + external_labels: + monitor: "my-monitor" +scrape_configs: + - job_name: "prometheus" + static_configs: + - targets: ["opea_prometheus:9090"] + - job_name: "vllm" + metrics_path: /metrics + static_configs: + - targets: ["docsum-gaudi-vllm-service:80"] + - job_name: "tgi" + metrics_path: /metrics + static_configs: + - targets: ["docsum-gaudi-tgi-server:80"] + - job_name: "docsum-backend-server" + metrics_path: /metrics + static_configs: + - targets: ["docsum-gaudi-backend-server:8888"] + - job_name: "prometheus-node-exporter" + scrape_interval: 30s + scrape_timeout: 25s + metrics_path: /metrics + static_configs: + - targets: ["node-exporter:9100"] + - job_name: "gaudi-metrics-exporter" + scrape_interval: 30s + metrics_path: /metrics + static_configs: + - targets: ["gaudi-metrics-exporter:41611"] diff --git a/DocSum/docker_compose/intel/hpu/gaudi/set_env.sh b/DocSum/docker_compose/intel/hpu/gaudi/set_env.sh new file mode 100644 index 0000000000..e571ad82ab --- /dev/null +++ b/DocSum/docker_compose/intel/hpu/gaudi/set_env.sh @@ -0,0 +1,52 @@ +#!/usr/bin/env bash + +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +SCRIPT_DIR=$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" &> /dev/null && pwd) + +pushd "$SCRIPT_DIR/../../../../../" > /dev/null +source .set_env.sh +popd > /dev/null + +export host_ip=$(hostname -I | awk '{print $1}') # Example: host_ip="192.168.1.1" +export HF_TOKEN=${HF_TOKEN} + +export LLM_ENDPOINT_PORT=8008 +export LLM_MODEL_ID="meta-llama/Meta-Llama-3-8B-Instruct" + +export BLOCK_SIZE=128 +export MAX_NUM_SEQS=256 +export MAX_SEQ_LEN_TO_CAPTURE=2048 +export NUM_CARDS=1 +export MAX_INPUT_TOKENS=1024 +export MAX_TOTAL_TOKENS=2048 + +export LLM_PORT=9000 +export LLM_ENDPOINT="http://${host_ip}:${LLM_ENDPOINT_PORT}" +export ASR_SERVICE_PORT=7066 +export DocSum_COMPONENT_NAME="OpeaDocSumvLLM" # OpeaDocSumTgi +export FRONTEND_SERVICE_PORT=5173 +export MEGA_SERVICE_HOST_IP=${host_ip} +export LLM_SERVICE_HOST_IP=${host_ip} +export ASR_SERVICE_HOST_IP=${host_ip} + +export BACKEND_SERVICE_PORT=8888 +export BACKEND_SERVICE_ENDPOINT="http://${host_ip}:${BACKEND_SERVICE_PORT}/v1/docsum" + +export LOGFLAG=True + +export NUM_CARDS=1 +export BLOCK_SIZE=128 +export MAX_NUM_SEQS=256 +export MAX_SEQ_LEN_TO_CAPTURE=2048 + +# Download Grafana configurations +pushd "${SCRIPT_DIR}/grafana/dashboards" > /dev/null +source download_opea_dashboard.sh +popd > /dev/null + +# Set network proxy settings +export no_proxy="${no_proxy},${host_ip},docsum-gaudi-vllm-service,docsum-gaudi-tgi-server,docsum-gaudi-backend-server,gaudi-metrics-exporter,opea_prometheus,grafana,node-exporter,$JAEGER_IP" # Example: no_proxy="localhost, 127.0.0.1, 192.168.1.1" +export http_proxy=$http_proxy +export https_proxy=$https_proxy diff --git a/DocSum/docker_image_build/build.yaml b/DocSum/docker_image_build/build.yaml index b4a2eb9c54..dcd4433ad0 100644 --- a/DocSum/docker_image_build/build.yaml +++ b/DocSum/docker_image_build/build.yaml @@ -54,15 +54,3 @@ services: context: GenAIComps dockerfile: 
comps/third_parties/vllm/src/Dockerfile.amd_gpu image: ${REGISTRY:-opea}/vllm-rocm:${TAG:-latest} - vllm: - build: - context: vllm - dockerfile: docker/Dockerfile.cpu - extends: docsum - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} - vllm-gaudi: - build: - context: vllm-fork - dockerfile: Dockerfile.hpu - extends: docsum - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} diff --git a/DocSum/tests/test_compose_on_epyc.sh b/DocSum/tests/test_compose_on_epyc.sh index 1a4959366a..a67e05c681 100644 --- a/DocSum/tests/test_compose_on_epyc.sh +++ b/DocSum/tests/test_compose_on_epyc.sh @@ -38,19 +38,8 @@ function build_docker_images() { docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &>/dev/null - VLLM_REQ_FILE="requirements/cpu.txt" - if ! grep -q "^transformers" "$VLLM_REQ_FILE"; then - echo "Adding transformers<4.54.0 to $VLLM_REQ_FILE" - echo "transformers<4.54.0" >>"$VLLM_REQ_FILE" - fi - cd ../ - echo "Build all the images with --no-cache, check docker_image_build.log for details..." - service_list="docsum docsum-gradio-ui whisper llm-docsum vllm" + service_list="docsum docsum-gradio-ui whisper llm-docsum" docker compose -f build.yaml build ${service_list} --no-cache >${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -58,6 +47,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/amd/cpu/epyc/ + export no_proxy="localhost,127.0.0.1,$ip_address" docker compose -f compose.yaml up -d >${LOG_PATH}/start_services_with_compose.log sleep 1m } diff --git a/DocSum/tests/test_compose_on_gaudi.sh b/DocSum/tests/test_compose_on_gaudi.sh index 2e13e41c9d..654ad01282 100644 --- a/DocSum/tests/test_compose_on_gaudi.sh +++ b/DocSum/tests/test_compose_on_gaudi.sh @@ -16,7 +16,7 @@ echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" echo "TAG=IMAGE_TAG=${IMAGE_TAG}" export REGISTRY=${IMAGE_REPO} export TAG=${IMAGE_TAG} -source $WORKPATH/docker_compose/intel/set_env.sh +source $WORKPATH/docker_compose/intel/hpu/gaudi/set_env.sh export MODEL_CACHE=${model_cache:-"./data"} @@ -27,12 +27,6 @@ export MAX_SEQ_LEN_TO_CAPTURE=2048 export MAX_INPUT_TOKENS=2048 export MAX_TOTAL_TOKENS=4096 -# set service host and no_proxy -export LLM_ENDPOINT="http://vllm-service:80" -export LLM_SERVICE_HOST_IP="llm-docsum-vllm" -export ASR_SERVICE_HOST_IP="whisper" -export no_proxy=$no_proxy,$LLM_SERVICE_HOST_IP,$ASR_SERVICE_HOST_IP,"vllm-service" - # Get the root folder of the current script ROOT_FOLDER=$(dirname "$(readlink -f "$0")") @@ -46,12 +40,8 @@ function build_docker_images() { docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork - VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0 - git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../ - echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
- service_list="docsum docsum-gradio-ui whisper llm-docsum vllm-gaudi" + service_list="docsum docsum-gradio-ui whisper llm-docsum" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log 2>&1 docker images && sleep 1s @@ -59,7 +49,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/hpu/gaudi - docker compose -f compose.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + docker compose -f compose.yaml -f compose.monitoring.yaml up -d > ${LOG_PATH}/start_services_with_compose.log sleep 2m } @@ -359,7 +349,7 @@ function validate_megaservice_long_text() { function stop_docker() { cd $WORKPATH/docker_compose/intel/hpu/gaudi - docker compose -f compose.yaml stop && docker compose rm -f + docker compose -f compose.yaml -f compose.monitoring.yaml stop && docker compose -f compose.yaml -f compose.monitoring.yaml rm -f } function main() { diff --git a/DocSum/tests/test_compose_on_xeon.sh b/DocSum/tests/test_compose_on_xeon.sh index 5ceed1ec03..0b7d678db2 100644 --- a/DocSum/tests/test_compose_on_xeon.sh +++ b/DocSum/tests/test_compose_on_xeon.sh @@ -17,7 +17,7 @@ echo "TAG=IMAGE_TAG=${IMAGE_TAG}" export REGISTRY=${IMAGE_REPO} export TAG=${IMAGE_TAG} -source $WORKPATH/docker_compose/intel/set_env.sh +source $WORKPATH/docker_compose/intel/cpu/xeon/set_env.sh export MODEL_CACHE=${model_cache:-"./data"} export MAX_INPUT_TOKENS=2048 @@ -36,14 +36,8 @@ function build_docker_images() { docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . popd && sleep 1s - git clone https://github.com/vllm-project/vllm.git && cd vllm - VLLM_VER=v0.10.0 - echo "Check out vLLM tag ${VLLM_VER}" - git checkout ${VLLM_VER} &> /dev/null - cd ../ - echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
- service_list="docsum docsum-gradio-ui whisper llm-docsum vllm" + service_list="docsum docsum-gradio-ui whisper llm-docsum" docker compose -f build.yaml build ${service_list} --no-cache > ${LOG_PATH}/docker_image_build.log docker images && sleep 1s @@ -51,7 +45,8 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/cpu/xeon/ - docker compose -f compose.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + export no_proxy="localhost,127.0.0.1,$ip_address" + docker compose -f compose.yaml -f compose.monitoring.yaml up -d > ${LOG_PATH}/start_services_with_compose.log sleep 1m } @@ -351,7 +346,7 @@ function validate_megaservice_long_text() { function stop_docker() { cd $WORKPATH/docker_compose/intel/cpu/xeon/ - docker compose stop && docker compose rm -f + docker compose -f compose.yaml -f compose.monitoring.yaml down } function main() { diff --git a/DocSum/tests/test_compose_tgi_on_epyc.sh b/DocSum/tests/test_compose_tgi_on_epyc.sh index b1caf7685c..33442bb270 100644 --- a/DocSum/tests/test_compose_tgi_on_epyc.sh +++ b/DocSum/tests/test_compose_tgi_on_epyc.sh @@ -47,6 +47,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/amd/cpu/epyc/ + export no_proxy="localhost,127.0.0.1,$ip_address" docker compose -f compose_tgi.yaml up -d > ${LOG_PATH}/start_services_with_compose.log sleep 1m } diff --git a/DocSum/tests/test_compose_tgi_on_gaudi.sh b/DocSum/tests/test_compose_tgi_on_gaudi.sh index c6133515cf..19111a3ded 100644 --- a/DocSum/tests/test_compose_tgi_on_gaudi.sh +++ b/DocSum/tests/test_compose_tgi_on_gaudi.sh @@ -16,7 +16,7 @@ echo "TAG=IMAGE_TAG=${IMAGE_TAG}" export REGISTRY=${IMAGE_REPO} export TAG=${IMAGE_TAG} -source $WORKPATH/docker_compose/intel/set_env.sh +source $WORKPATH/docker_compose/intel/hpu/gaudi/set_env.sh export MODEL_CACHE=${model_cache:-"./data"} export MAX_INPUT_TOKENS=2048 @@ -45,7 +45,7 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/hpu/gaudi - docker compose -f compose_tgi.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + docker compose -f compose_tgi.yaml -f compose.monitoring.yaml up -d > ${LOG_PATH}/start_services_with_compose.log sleep 1m } @@ -88,36 +88,51 @@ function validate_service() { local FORM_DATA5="${11}" local FORM_DATA6="${12}" - if [[ $VALIDATE_TYPE == *"json"* ]]; then - HTTP_RESPONSE=$(curl --silent --write-out "HTTPSTATUS:%{http_code}" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") - else - CURL_CMD=(curl --silent --write-out "HTTPSTATUS:%{http_code}" -X POST -F "$FORM_DATA1" -F "$FORM_DATA2" -F "$FORM_DATA3" -F "$FORM_DATA4" -F "$FORM_DATA5" -H 'Content-Type: multipart/form-data' "$URL") - if [[ -n "$FORM_DATA6" ]]; then - CURL_CMD+=(-F "$FORM_DATA6") + local MAX_RETRIES=${13:-3} + local RETRY_DELAY=${14:-2} + + local retry_count=0 + local success=false + + while [ $retry_count -lt $MAX_RETRIES ] && [ "$success" = false ]; do + retry_count=$((retry_count + 1)) + + echo "[ $SERVICE_NAME ] Attempt $retry_count/$MAX_RETRIES..."
+ if [[ $VALIDATE_TYPE == *"json"* ]]; then + HTTP_RESPONSE=$(curl --silent --write-out "HTTPSTATUS:%{http_code}" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") + else + CURL_CMD=(curl --silent --write-out "HTTPSTATUS:%{http_code}" -X POST -F "$FORM_DATA1" -F "$FORM_DATA2" -F "$FORM_DATA3" -F "$FORM_DATA4" -F "$FORM_DATA5" -H 'Content-Type: multipart/form-data' "$URL") + if [[ -n "$FORM_DATA6" ]]; then + CURL_CMD+=(-F "$FORM_DATA6") + fi + HTTP_RESPONSE=$("${CURL_CMD[@]}") + fi + HTTP_STATUS=$(echo $HTTP_RESPONSE | tr -d '\n' | sed -e 's/.*HTTPSTATUS://') + RESPONSE_BODY=$(echo $HTTP_RESPONSE | sed -e 's/HTTPSTATUS\:.*//g') + + docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log + + # check response status + if [ "$HTTP_STATUS" -ne "200" ]; then + echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS" + exit 1 + else + echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." + fi + # check response body + if [[ "$RESPONSE_BODY" != *"$EXPECTED_RESULT"* ]]; then + echo "EXPECTED_RESULT==> $EXPECTED_RESULT" + echo "RESPONSE_BODY==> $RESPONSE_BODY" + echo "[ $SERVICE_NAME ] Content does not match the expected result: $RESPONSE_BODY" + if [ $retry_count -lt $MAX_RETRIES ]; then + echo "[ $SERVICE_NAME ] will retry after $RETRY_DELAY seconds ..." + sleep ${RETRY_DELAY}s + fi + else + success=true + echo "[ $SERVICE_NAME ] Content is as expected." fi - HTTP_RESPONSE=$("${CURL_CMD[@]}") - fi - HTTP_STATUS=$(echo $HTTP_RESPONSE | tr -d '\n' | sed -e 's/.*HTTPSTATUS://') - RESPONSE_BODY=$(echo $HTTP_RESPONSE | sed -e 's/HTTPSTATUS\:.*//g') - - docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log - - # check response status - if [ "$HTTP_STATUS" -ne "200" ]; then - echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS" - exit 1 - else - echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." - fi - # check response body - if [[ "$RESPONSE_BODY" != *"$EXPECTED_RESULT"* ]]; then - echo "EXPECTED_RESULT==> $EXPECTED_RESULT" - echo "RESPONSE_BODY==> $RESPONSE_BODY" - echo "[ $SERVICE_NAME ] Content does not match the expected result: $RESPONSE_BODY" - exit 1 - else - echo "[ $SERVICE_NAME ] Content is as expected."
- fi + done sleep 1s } @@ -354,7 +369,7 @@ function validate_megaservice_long_text() { function stop_docker() { cd $WORKPATH/docker_compose/intel/hpu/gaudi - docker compose -f compose_tgi.yaml stop && docker compose rm -f + docker compose -f compose_tgi.yaml -f compose.monitoring.yaml stop && docker compose -f compose_tgi.yaml -f compose.monitoring.yaml rm -f } function main() { diff --git a/DocSum/tests/test_compose_tgi_on_xeon.sh b/DocSum/tests/test_compose_tgi_on_xeon.sh index e107bfca63..1fbaa4d357 100644 --- a/DocSum/tests/test_compose_tgi_on_xeon.sh +++ b/DocSum/tests/test_compose_tgi_on_xeon.sh @@ -16,7 +16,7 @@ echo "TAG=IMAGE_TAG=${IMAGE_TAG}" export REGISTRY=${IMAGE_REPO} export TAG=${IMAGE_TAG} -source $WORKPATH/docker_compose/intel/set_env.sh +source $WORKPATH/docker_compose/intel/cpu/xeon/set_env.sh export MODEL_CACHE=${model_cache:-"./data"} export MAX_INPUT_TOKENS=2048 @@ -45,7 +45,8 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/cpu/xeon/ - docker compose -f compose_tgi.yaml up -d > ${LOG_PATH}/start_services_with_compose.log + export no_proxy="localhost,127.0.0.1,$ip_address" + docker compose -f compose_tgi.yaml -f compose.monitoring.yaml up -d > ${LOG_PATH}/start_services_with_compose.log sleep 1m } @@ -354,7 +355,7 @@ function validate_megaservice_long_text() { function stop_docker() { cd $WORKPATH/docker_compose/intel/cpu/xeon/ - docker compose -f compose_tgi.yaml stop && docker compose rm -f + docker compose -f compose_tgi.yaml -f compose.monitoring.yaml stop && docker compose -f compose_tgi.yaml -f compose.monitoring.yaml rm -f } function main() { diff --git a/DocSum/ui/docker/Dockerfile b/DocSum/ui/docker/Dockerfile index 1d5115f4b5..3a6ca7f7c9 100644 --- a/DocSum/ui/docker/Dockerfile +++ b/DocSum/ui/docker/Dockerfile @@ -1,8 +1,8 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 -# Use node 20.11.1 as the base image -FROM node:20.11.1 +# Use node 20.19.0 as the base image (required for chokidar@5.0.0 compatibility) +FROM node:20.19.0 # Update package manager and install Git RUN apt-get update -y && apt-get install -y git diff --git a/DocSum/ui/gradio/requirements.txt b/DocSum/ui/gradio/requirements.txt index 5824f07218..27687edf4e 100644 --- a/DocSum/ui/gradio/requirements.txt +++ b/DocSum/ui/gradio/requirements.txt @@ -1,5 +1,5 @@ docx2txt -gradio==5.11.0 +gradio>5.22.0,<=5.34.0 langchain_community moviepy==1.0.3 numpy==1.26.4 diff --git a/DocSum/ui/svelte/package.json b/DocSum/ui/svelte/package.json index d5efc343c0..f6054bc229 100644 --- a/DocSum/ui/svelte/package.json +++ b/DocSum/ui/svelte/package.json @@ -27,7 +27,7 @@ "devDependencies": { "@playwright/test": "^1.44.1", "@sveltejs/adapter-auto": "^3.0.0", - "@sveltejs/kit": "2.0.0", + "@sveltejs/kit": "2.20.6", "@sveltejs/package": "^2.0.0", "@sveltejs/vite-plugin-svelte": "^3.0.0", "autoprefixer": "^10.4.16", diff --git a/EdgeCraftRAG/Dockerfile.server b/EdgeCraftRAG/Dockerfile.server old mode 100755 new mode 100644 index 4ac52700a8..f910252616 --- a/EdgeCraftRAG/Dockerfile.server +++ b/EdgeCraftRAG/Dockerfile.server @@ -1,30 +1,17 @@ FROM python:3.11-slim SHELL ["/bin/bash", "-o", "pipefail", "-c"] - -RUN apt-get update -y && apt-get install -y --no-install-recommends --fix-missing \ - libjemalloc-dev \ - libmagic1 \ - libglib2.0-0 \ - poppler-utils \ - tesseract-ocr - -RUN apt-get update && apt-get install -y gnupg wget git -RUN wget -qO - https://repositories.intel.com/gpu/intel-graphics.key | \ - gpg --yes --dearmor --output 
/usr/share/keyrings/intel-graphics.gpg -RUN echo "deb [arch=amd64,i386 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy client" | \ - tee /etc/apt/sources.list.d/intel-gpu-jammy.list -RUN apt-get update && apt-get install -y \ - intel-opencl-icd intel-level-zero-gpu \ - intel-level-zero-gpu-raytracing \ - intel-media-va-driver-non-free libmfx1 libmfxgen1 libvpl2 \ - libegl-mesa0 libegl1-mesa libegl1-mesa-dev libgbm1 libgl1-mesa-dev libgl1-mesa-dri \ - libglapi-mesa libgles2-mesa-dev libglx-mesa0 libigdgmm12 libxatracker2 mesa-va-drivers \ - mesa-vdpau-drivers mesa-vulkan-drivers va-driver-all vainfo hwinfo clinfo +RUN apt-get update && apt-get install -y gnupg2 wget git +RUN apt-get remove -y libze-intel-gpu1 libigc1 libigdfcl1 libze-dev || true; \ + apt-get update; \ + apt-get install -y curl +RUN curl -sL 'https://keyserver.ubuntu.com/pks/lookup?fingerprint=on&op=get&search=0x0C0E6AF955CE463C03FC51574D098D70AFBE5E1F' | tee /etc/apt/trusted.gpg.d/driver.asc +RUN echo -e "Types: deb\nURIs: https://ppa.launchpadcontent.net/kobuk-team/intel-graphics/ubuntu/\nSuites: plucky\nComponents: main\nSigned-By: /etc/apt/trusted.gpg.d/driver.asc" > /etc/apt/sources.list.d/driver.sources +RUN apt-get update && apt-get install -y libze-intel-gpu1 libze1 intel-metrics-discovery intel-opencl-icd clinfo intel-gsc && apt-get install -y libze-intel-gpu1 libze1 intel-metrics-discovery intel-opencl-icd clinfo intel-gsc && apt-get install -y libze-dev intel-ocloc libze-intel-gpu-raytracing RUN useradd -m -s /bin/bash user && \ mkdir -p /home/user && \ - chown -R user /home/user/ + chown -R user /home/user/ RUN mkdir /templates && \ chown -R user /templates @@ -33,17 +20,21 @@ RUN chown -R user /templates/default_prompt.txt COPY ./edgecraftrag /home/user/edgecraftrag -RUN mkdir -p /home/user/ui_cache +RUN mkdir -p /home/user/ui_cache ENV UI_UPLOAD_PATH=/home/user/ui_cache USER user WORKDIR /home/user/edgecraftrag -RUN pip install --no-cache-dir --upgrade pip setuptools==70.0.0 && \ - pip install --no-cache-dir --extra-index-url https://download.pytorch.org/whl/cpu -r requirements.txt +RUN pip3 install --no-cache-dir --upgrade setuptools==70.0.0 --break-system-packages && \ + pip3 install --no-cache-dir --extra-index-url https://download.pytorch.org/whl/cpu -r requirements.txt --break-system-packages + +RUN pip3 install --no-cache-dir docarray==0.40.0 --break-system-packages WORKDIR /home/user/ RUN git clone https://github.com/openvinotoolkit/openvino.genai.git genai ENV PYTHONPATH="$PYTHONPATH:/home/user/genai/tools/llm_bench" -ENTRYPOINT ["python", "-m", "edgecraftrag.server"] \ No newline at end of file +RUN python3 -m nltk.downloader -d /home/user/nltk_data punkt_tab averaged_perceptron_tagger_eng + +ENTRYPOINT ["python3", "-m", "edgecraftrag.server"] diff --git a/EdgeCraftRAG/README.md b/EdgeCraftRAG/README.md old mode 100755 new mode 100644 index 314feb3480..0f225c9b91 --- a/EdgeCraftRAG/README.md +++ b/EdgeCraftRAG/README.md @@ -5,6 +5,13 @@ Retrieval-Augmented Generation system for edge solutions. It is designed to curate the RAG pipeline to meet hardware requirements at edge with guaranteed quality and performance. +## What's New + +1. Support Agent component and enable deep_search agent +2. Optimize pipeline execution performance with asynchronous api +3. Support session list display in UI +4. Support vllm-based embedding service + ## Table of contents 1. 
[Architecture](#architecture) diff --git a/EdgeCraftRAG/assets/img/kbadmin_index.png b/EdgeCraftRAG/assets/img/kbadmin_index.png new file mode 100644 index 0000000000..7383a01c79 Binary files /dev/null and b/EdgeCraftRAG/assets/img/kbadmin_index.png differ diff --git a/EdgeCraftRAG/assets/img/kbadmin_kb.png b/EdgeCraftRAG/assets/img/kbadmin_kb.png new file mode 100644 index 0000000000..40f6909a9b Binary files /dev/null and b/EdgeCraftRAG/assets/img/kbadmin_kb.png differ diff --git a/EdgeCraftRAG/assets/img/kbadmin_type.png b/EdgeCraftRAG/assets/img/kbadmin_type.png new file mode 100644 index 0000000000..012ebb0bd8 Binary files /dev/null and b/EdgeCraftRAG/assets/img/kbadmin_type.png differ diff --git a/EdgeCraftRAG/chatqna.py b/EdgeCraftRAG/chatqna.py old mode 100755 new mode 100644 index 1073a66eb4..48b7359cb4 --- a/EdgeCraftRAG/chatqna.py +++ b/EdgeCraftRAG/chatqna.py @@ -44,7 +44,7 @@ async def handle_request(self, request: Request): input = await request.json() stream_opt = input.get("stream", False) input["user"] = request.headers.get("sessionid", None) - chat_request = ChatCompletionRequest.parse_obj(input) + chat_request = ChatCompletionRequest.construct(**input) parameters = LLMParams( max_tokens=chat_request.max_tokens if chat_request.max_tokens else 1024, top_k=chat_request.top_k if chat_request.top_k else 10, diff --git a/EdgeCraftRAG/docker_compose/intel/gpu/arc/README.md b/EdgeCraftRAG/docker_compose/intel/gpu/arc/README.md index d4d283d8f1..9a5663ddb2 100755 --- a/EdgeCraftRAG/docker_compose/intel/gpu/arc/README.md +++ b/EdgeCraftRAG/docker_compose/intel/gpu/arc/README.md @@ -10,25 +10,27 @@ This document outlines the deployment process for Edge Craft Retrieval-Augmented This section describes how to quickly deploy and test the EdgeCraftRAG service manually on Intel® Arc® platform. The basic steps are: -1. [Prerequisites](#prerequisites) -2. [Access the Code](#access-the-code) -3. [Prepare models](#prepare-models) -4. [Prepare env variables and configurations](#prepare-env-variables-and-configurations) -5. [Configure the Deployment Environment](#configure-the-deployment-environment) -6. [Deploy the Service Using Docker Compose](#deploy-the-service-using-docker-compose) -7. [Access UI](#access-ui) -8. [Cleanup the Deployment](#cleanup-the-deployment) +1. [Prerequisites](#1-prerequisites) +2. [Access the Code](#2-access-the-code) +3. [Prepare models](#3-prepare-models) +4. [Prepare env variables and configurations](#4-prepare-env-variables-and-configurations) +5. [Deploy the Service on Arc GPU Using Docker Compose](#5-deploy-the-service-on-intel-gpu-using-docker-compose) +6. [Access UI](#6-access-ui) +7. [Cleanup the Deployment](#7-cleanup-the-deployment) -### Prerequisites +### 1. Prerequisites EC-RAG supports vLLM deployment(default method) and local OpenVINO deployment for Intel Arc GPU. Prerequisites are shown as below: Hardware: Intel Arc A770 OS: Ubuntu Server 22.04.1 or newer (at least 6.2 LTS kernel) Driver & libraries: please to [Installing GPUs Drivers](https://dgpu-docs.intel.com/driver/installation-rolling.html#installing-gpu-drivers) for detailed driver & libraries setup +Hardware: Intel Arc B60 +please refer to [Install Native Environment](https://github.com/intel/llm-scaler/tree/main/vllm#11-install-native-environment) for detailed setup + Below steps are based on **vLLM** as inference engine, if you want to choose **OpenVINO**, please refer to [OpenVINO Local Inference](../../../../docs/Advanced_Setup.md#openvino-local-inference) -### Access the Code +### 2.
Access the Code Clone the GenAIExample repository and access the EdgeCraftRAG Intel® Arc® platform Docker Compose files and supporting scripts: @@ -43,7 +45,7 @@ Checkout a released version, such as v1.3: git checkout v1.3 ``` -### Prepare models +### 3. Prepare models ```bash # Prepare models for embedding, reranking: @@ -62,9 +64,7 @@ modelscope download --model $LLM_MODEL --local_dir "${MODEL_PATH}/${LLM_MODEL}" # huggingface-cli download $LLM_MODEL --local-dir "${MODEL_PATH}/${LLM_MODEL}" ``` -### Prepare env variables and configurations - -Below steps are for single Intel Arc GPU inference, if you want to setup multi Intel Arc GPUs inference, please refer to [Multi-ARC Setup](../../../../docs/Advanced_Setup.md#multi-arc-setup) +### 4. Prepare env variables and configurations #### Prepare env variables for vLLM deployment @@ -77,32 +77,25 @@ export HOST_IP=$ip_address # Your host ip export VIDEOGROUPID=$(getent group video | cut -d: -f3) export RENDERGROUPID=$(getent group render | cut -d: -f3) -# If you have a proxy configured, uncomment below line -# export no_proxy=${no_proxy},${HOST_IP},edgecraftrag,edgecraftrag-server -# export NO_PROXY=${NO_PROXY},${HOST_IP},edgecraftrag,edgecraftrag-server +# If you have a proxy configured, execute below line +export no_proxy=${no_proxy},${HOST_IP},edgecraftrag,edgecraftrag-server +export NO_PROXY=${NO_PROXY},${HOST_IP},edgecraftrag,edgecraftrag-server # If you have a HF mirror configured, it will be imported to the container # export HF_ENDPOINT=https://hf-mirror.com # your HF mirror endpoint" # Make sure all 3 folders have 1000:1000 permission, otherwise -# chown 1000:1000 ${MODEL_PATH} ${PWD} # the default value of DOC_PATH and TMPFILE_PATH is PWD ,so here we give permission to ${PWD} +export DOC_PATH=${PWD}/tests +export TMPFILE_PATH=${PWD}/tests +chown 1000:1000 ${MODEL_PATH} ${DOC_PATH} ${TMPFILE_PATH} # In addition, also make sure the .cache folder has 1000:1000 permission, otherwise -# chown 1000:1000 -R $HOME/.cache +chown 1000:1000 -R $HOME/.cache ``` For more advanced env variables and configurations, please refer to [Prepare env variables for vLLM deployment](../../../../docs/Advanced_Setup.md#prepare-env-variables-for-vllm-deployment) -#### Generate nginx config file +### 5. Deploy the Service on Intel GPU Using Docker Compose -```bash -export VLLM_SERVICE_PORT_0=8100 # You can set your own port for vllm service -# Generate your nginx config file -# nginx-conf-generator.sh requires 2 parameters: DP_NUM and output filepath -bash nginx/nginx-conf-generator.sh 1 nginx/nginx.conf -# set NGINX_CONFIG_PATH -export NGINX_CONFIG_PATH="${PWD}/nginx/nginx.conf" -``` - -### Deploy the Service Using Docker Compose +set Milvus DB and chat history round for inference: ```bash # EC-RAG support Milvus as persistent database, by default milvus is disabled, you can choose to set MILVUS_ENABLED=1 to enable it @@ -112,12 +105,40 @@ export MILVUS_ENABLED=0 # EC-RAG support chat history round setting, by default chat history is disabled, you can set CHAT_HISTORY_ROUND to control it # export CHAT_HISTORY_ROUND= # change to your preference +``` + +#### option a. Deploy the Service on Arc A770 Using Docker Compose + +```bash +export VLLM_SERVICE_PORT_A770=8086 # You can set your own port for vllm service # Launch EC-RAG service with compose -docker compose -f docker_compose/intel/gpu/arc/compose_vllm.yaml up -d +docker compose --profile a770 -f docker_compose/intel/gpu/arc/compose.yaml up -d +``` + +#### option b. 
Deploy the Service on Arc B60 Using Docker Compose + +```bash +# Besides MILVUS_ENABLED and CHAT_HISTORY_ROUND, below environments are exposed for vLLM config, you can change them to your preference: +# export VLLM_SERVICE_PORT_B60=8086 +# export DTYPE=float16 +# export TP=1 # for multi GPU, you can change TP value +# export DP=1 +# export ZE_AFFINITY_MASK=0 # for multi GPU, you can export ZE_AFFINITY_MASK=0,1,2... +# export ENFORCE_EAGER=1 +# export TRUST_REMOTE_CODE=1 +# export DISABLE_SLIDING_WINDOW=1 +# export GPU_MEMORY_UTIL=0.8 +# export NO_ENABLE_PREFIX_CACHING=1 +# export MAX_NUM_BATCHED_TOKENS=8192 +# export DISABLE_LOG_REQUESTS=1 +# export MAX_MODEL_LEN=49152 +# export BLOCK_SIZE=64 +# export QUANTIZATION=fp8 +docker compose --profile b60 -f docker_compose/intel/gpu/arc/compose.yaml up -d ``` -### Access UI +### 6. Access UI Open your browser, access http://${HOST_IP}:8082 @@ -126,12 +147,12 @@ Open your browser, access http://${HOST_IP}:8082 Below is the UI front page, for detailed operations on UI and EC-RAG settings, please refer to [Explore_Edge_Craft_RAG](../../../../docs/Explore_Edge_Craft_RAG.md) ![front_page](../../../../assets/img/front_page.png) -### Cleanup the Deployment +### 7. Cleanup the Deployment To stop the containers associated with the deployment, execute the following command: ``` -docker compose -f docker_compose/intel/gpu/arc/compose_vllm.yaml down +docker compose -f docker_compose/intel/gpu/arc/compose.yaml down ``` All the EdgeCraftRAG containers will be stopped and then removed on completion of the "down" command. diff --git a/EdgeCraftRAG/docker_compose/intel/gpu/arc/compose.yaml b/EdgeCraftRAG/docker_compose/intel/gpu/arc/compose.yaml old mode 100755 new mode 100644 index 488bccdf7a..707be2328c --- a/EdgeCraftRAG/docker_compose/intel/gpu/arc/compose.yaml +++ b/EdgeCraftRAG/docker_compose/intel/gpu/arc/compose.yaml @@ -1,9 +1,11 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 + services: etcd: container_name: milvus-etcd image: quay.io/coreos/etcd:v3.5.5 + restart: always environment: - ETCD_AUTO_COMPACTION_MODE=revision - ETCD_AUTO_COMPACTION_RETENTION=1000 @@ -22,6 +24,7 @@ services: minio: container_name: milvus-minio image: minio/minio:RELEASE.2023-03-20T20-16-18Z + restart: always environment: MINIO_ACCESS_KEY: minioadmin MINIO_SECRET_KEY: minioadmin @@ -41,6 +44,7 @@ services: milvus-standalone: container_name: milvus-standalone image: milvusdb/milvus:v2.4.6 + restart: always command: ["milvus", "run", "standalone"] security_opt: - seccomp:unconfined @@ -48,7 +52,7 @@ services: ETCD_ENDPOINTS: etcd:2379 MINIO_ADDRESS: minio:9000 volumes: - - ./milvus.yaml:/milvus/configs/milvus.yaml + - ./milvus-config.yaml:/milvus/configs/milvus.yaml - ${DOCKER_VOLUME_DIRECTORY:-${PWD}}/volumes/milvus:/var/lib/milvus healthcheck: test: ["CMD", "curl", "-f", "http://localhost:9091/healthz"] @@ -71,16 +75,16 @@ services: no_proxy: ${no_proxy} http_proxy: ${http_proxy} https_proxy: ${https_proxy} - HF_ENDPOINT: ${HF_ENDPOINT} - vLLM_ENDPOINT: ${vLLM_ENDPOINT:-http://${HOST_IP}:${NGINX_PORT:-8086}} + vLLM_ENDPOINT: ${vLLM_ENDPOINT:-http://${HOST_IP}:${VLLM_SERVICE_PORT_B60:-8086}} + LLM_MODEL: ${LLM_MODEL} ENABLE_BENCHMARK: ${ENABLE_BENCHMARK:-false} - MAX_MODEL_LEN: ${MAX_MODEL_LEN:-5000} + MAX_MODEL_LEN: ${MAX_MODEL_LEN:-49152} CHAT_HISTORY_ROUND: ${CHAT_HISTORY_ROUND:-0} + METADATA_DATABASE_URL: ${METADATA_DATABASE_URL:-""} volumes: - ${MODEL_PATH:-${PWD}}:/home/user/models - ${DOC_PATH:-${PWD}}:/home/user/docs - 
${TMPFILE_PATH:-${PWD}}:/home/user/ui_cache - - ${HF_CACHE:-${HOME}/.cache}:/home/user/.cache - ${PROMPT_PATH:-${PWD}}:/templates/custom restart: always ports: @@ -127,6 +131,96 @@ services: depends_on: - edgecraftrag-server - ecrag + llm-serving-xpu-b60: + container_name: ipex-serving-xpu-container + image: intel/llm-scaler-vllm:1.1-preview + privileged: true + restart: always + ports: + - ${VLLM_SERVICE_PORT_B60:-8086}:${VLLM_SERVICE_PORT_B60:-8086} + volumes: + - ${MODEL_PATH}:/workspace/vllm/models + devices: + - /dev/dri:/dev/dri + environment: + DTYPE: ${DTYPE:-float16} + VLLM_SERVICE_PORT_B60: ${VLLM_SERVICE_PORT_B60:-8086} + ZE_AFFINITY_MASK: ${ZE_AFFINITY_MASK:-0} + ENFORCE_EAGER: ${ENFORCE_EAGER:-1} + TRUST_REMOTE_CODE: ${TRUST_REMOTE_CODE:-1} + DISABLE_SLIDING_WINDOW: ${DISABLE_SLIDING_WINDOW:-1} + GPU_MEMORY_UTIL: ${GPU_MEMORY_UTIL:-0.8} + NO_ENABLE_PREFIX_CACHING: ${NO_ENABLE_PREFIX_CACHING:-1} + MAX_NUM_BATCHED_TOKENS: ${MAX_NUM_BATCHED_TOKENS:-8192} + DISABLE_LOG_REQUESTS: ${DISABLE_LOG_REQUESTS:-1} + MAX_MODEL_LEN: ${MAX_MODEL_LEN:-49152} + BLOCK_SIZE: ${BLOCK_SIZE:-64} + QUANTIZATION: ${QUANTIZATION:-fp8} + LLM_MODEL: ${LLM_MODEL} + TP: ${TP:-1} + DP: ${DP:-1} + entrypoint: + /bin/bash -c " + cd /workspace/vllm/models && source /opt/intel/oneapi/setvars.sh --force && + VLLM_OFFLOAD_WEIGHTS_BEFORE_QUANT=1 \ + TORCH_LLM_ALLREDUCE=1 \ + VLLM_USE_V1=1 \ + CCL_ZE_IPC_EXCHANGE=pidfd \ + VLLM_ALLOW_LONG_MAX_MODEL_LEN=1 \ + VLLM_WORKER_MULTIPROC_METHOD=spawn \ + python3 -m vllm.entrypoints.openai.api_server \ + --model $${LLM_MODEL} \ + --dtype $${DTYPE} \ + --enforce-eager \ + --port $${VLLM_SERVICE_PORT_B60} \ + --trust-remote-code \ + --disable-sliding-window \ + --gpu-memory-util $${GPU_MEMORY_UTIL} \ + --no-enable-prefix-caching \ + --max-num-batched-tokens $${MAX_NUM_BATCHED_TOKENS} \ + --disable-log-requests \ + --max-model-len $${MAX_MODEL_LEN} \ + --block-size $${BLOCK_SIZE} \ + --quantization $${QUANTIZATION} \ + -tp=$${TP} \ + -dp=$${DP}" + profiles: + - b60 + llm-serving-xpu-770: + container_name: ipex-llm-serving-xpu-770 + image: intelanalytics/ipex-llm-serving-xpu:0.8.3-b20 + privileged: true + restart: always + ports: + - ${VLLM_SERVICE_PORT_A770:-8086}:${VLLM_SERVICE_PORT_A770:-8086} + group_add: + - video + - ${VIDEOGROUPID:-44} + - ${RENDERGROUPID:-109} + volumes: + - ${LLM_MODEL_PATH:-${MODEL_PATH}/${LLM_MODEL}}:/llm/models + devices: + - /dev/dri + environment: + no_proxy: ${no_proxy} + http_proxy: ${http_proxy} + https_proxy: ${https_proxy} + MODEL_PATH: "/llm/models" + SERVED_MODEL_NAME: ${LLM_MODEL} + TENSOR_PARALLEL_SIZE: ${TENSOR_PARALLEL_SIZE:-1} + MAX_NUM_SEQS: ${MAX_NUM_SEQS:-64} + MAX_NUM_BATCHED_TOKENS: ${MAX_NUM_BATCHED_TOKENS:-10240} + MAX_MODEL_LEN: ${MAX_MODEL_LEN:-10240} + LOAD_IN_LOW_BIT: ${LOAD_IN_LOW_BIT:-fp8} + CCL_DG2_USM: ${CCL_DG2_USM:-""} + PORT: ${VLLM_SERVICE_PORT_A770:-8086} + ZE_AFFINITY_MASK: ${SELECTED_XPU_0:-0} + shm_size: '32g' + entrypoint: /bin/bash -c "\ + cd /llm && \ + bash start-vllm-service.sh" + profiles: + - a770 networks: default: driver: bridge diff --git a/EdgeCraftRAG/docker_compose/intel/gpu/arc/compose_vllm.yaml b/EdgeCraftRAG/docker_compose/intel/gpu/arc/compose_vllm.yaml deleted file mode 100644 index a1afa20eb9..0000000000 --- a/EdgeCraftRAG/docker_compose/intel/gpu/arc/compose_vllm.yaml +++ /dev/null @@ -1,177 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -services: - etcd: - container_name: milvus-etcd - image: quay.io/coreos/etcd:v3.5.5 - environment: - - 
ETCD_AUTO_COMPACTION_MODE=revision - - ETCD_AUTO_COMPACTION_RETENTION=1000 - - ETCD_QUOTA_BACKEND_BYTES=4294967296 - - ETCD_SNAPSHOT_COUNT=50000 - volumes: - - ${DOCKER_VOLUME_DIRECTORY:-${PWD}}/volumes/etcd:/etcd - command: etcd -advertise-client-urls=http://127.0.0.1:2379 -listen-client-urls http://0.0.0.0:2379 --data-dir /etcd - healthcheck: - test: ["CMD", "etcdctl", "endpoint", "health"] - interval: 30s - timeout: 20s - retries: 3 - deploy: - replicas: ${MILVUS_ENABLED:-0} - minio: - container_name: milvus-minio - image: minio/minio:RELEASE.2023-03-20T20-16-18Z - environment: - MINIO_ACCESS_KEY: minioadmin - MINIO_SECRET_KEY: minioadmin - ports: - - "${MINIO_PORT1:-5044}:9001" - - "${MINIO_PORT2:-5043}:9000" - volumes: - - ${DOCKER_VOLUME_DIRECTORY:-${PWD}}/volumes/minio:/minio_data - command: minio server /minio_data --console-address ":9001" - healthcheck: - test: ["CMD", "curl", "-f", "http://localhost:9000/minio/health/live"] - interval: 30s - timeout: 20s - retries: 3 - deploy: - replicas: ${MILVUS_ENABLED:-0} - milvus-standalone: - container_name: milvus-standalone - image: milvusdb/milvus:v2.4.6 - command: ["milvus", "run", "standalone"] - security_opt: - - seccomp:unconfined - environment: - ETCD_ENDPOINTS: etcd:2379 - MINIO_ADDRESS: minio:9000 - volumes: - - ./milvus.yaml:/milvus/configs/milvus.yaml - - ${DOCKER_VOLUME_DIRECTORY:-${PWD}}/volumes/milvus:/var/lib/milvus - healthcheck: - test: ["CMD", "curl", "-f", "http://localhost:9091/healthz"] - interval: 30s - start_period: 90s - timeout: 20s - retries: 3 - ports: - - "19530:19530" - - "${MILVUS_STANDALONE_PORT:-9091}:9091" - depends_on: - - "etcd" - - "minio" - deploy: - replicas: ${MILVUS_ENABLED:-0} - edgecraftrag-server: - image: ${REGISTRY:-opea}/edgecraftrag-server:${TAG:-latest} - container_name: edgecraftrag-server - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - HF_ENDPOINT: ${HF_ENDPOINT} - vLLM_ENDPOINT: ${vLLM_ENDPOINT:-http://${HOST_IP}:${NGINX_PORT:-8086}} - LLM_MODEL: ${LLM_MODEL} - ENABLE_BENCHMARK: ${ENABLE_BENCHMARK:-false} - MAX_MODEL_LEN: ${MAX_MODEL_LEN:-5000} - CHAT_HISTORY_ROUND: ${CHAT_HISTORY_ROUND:-0} - volumes: - - ${MODEL_PATH:-${PWD}}:/home/user/models - - ${DOC_PATH:-${PWD}}:/home/user/docs - - ${TMPFILE_PATH:-${PWD}}:/home/user/ui_cache - - ${HF_CACHE:-${HOME}/.cache}:/home/user/.cache - - ${PROMPT_PATH:-${PWD}}:/templates/custom - restart: always - ports: - - ${PIPELINE_SERVICE_PORT:-16010}:${PIPELINE_SERVICE_PORT:-16010} - devices: - - /dev/dri:/dev/dri - group_add: - - ${VIDEOGROUPID:-44} - - ${RENDERGROUPID:-109} - ecrag: - image: ${REGISTRY:-opea}/edgecraftrag:${TAG:-latest} - container_name: edgecraftrag - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - MEGA_SERVICE_PORT: ${MEGA_SERVICE_PORT:-16011} - MEGA_SERVICE_HOST_IP: ${MEGA_SERVICE_HOST_IP:-${HOST_IP}} - PIPELINE_SERVICE_PORT: ${PIPELINE_SERVICE_PORT:-16010} - PIPELINE_SERVICE_HOST_IP: ${PIPELINE_SERVICE_HOST_IP:-${HOST_IP}} - restart: always - ports: - - ${MEGA_SERVICE_PORT:-16011}:${MEGA_SERVICE_PORT:-16011} - depends_on: - - edgecraftrag-server - nginx: - image: nginx:latest - restart: always - ports: - - ${NGINX_PORT:-8086}:8086 - volumes: - - ${NGINX_CONFIG_PATH:-${PWD}}:/etc/nginx/nginx.conf - depends_on: - - edgecraftrag-server - edgecraftrag-ui: - image: ${REGISTRY:-opea}/edgecraftrag-ui:${TAG:-latest} - container_name: edgecraftrag-ui - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: 
${https_proxy} - MEGA_SERVICE_PORT: ${MEGA_SERVICE_PORT:-16011} - MEGA_SERVICE_HOST_IP: ${MEGA_SERVICE_HOST_IP:-${HOST_IP}} - PIPELINE_SERVICE_PORT: ${PIPELINE_SERVICE_PORT:-16010} - PIPELINE_SERVICE_HOST_IP: ${PIPELINE_SERVICE_HOST_IP:-${HOST_IP}} - UI_SERVICE_PORT: ${UI_SERVICE_PORT:-8082} - UI_SERVICE_HOST_IP: ${UI_SERVICE_HOST_IP:-0.0.0.0} - volumes: - - ${TMPFILE_PATH:-${PWD}}:/home/user/ui_cache - restart: always - ports: - - ${UI_SERVICE_PORT:-8082}:${UI_SERVICE_PORT:-8082} - depends_on: - - edgecraftrag-server - - ecrag - llm-serving-xpu-0: - container_name: ipex-llm-serving-xpu-container-0 - image: intelanalytics/ipex-llm-serving-xpu:0.8.3-b20 - privileged: true - restart: always - ports: - - ${VLLM_SERVICE_PORT_0:-8100}:${VLLM_SERVICE_PORT_0:-8100} - group_add: - - video - - ${VIDEOGROUPID:-44} - - ${RENDERGROUPID:-109} - volumes: - - ${LLM_MODEL_PATH:-${MODEL_PATH}/${LLM_MODEL}}:/llm/models - devices: - - /dev/dri - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - HF_ENDPOINT: ${HF_ENDPOINT} - MODEL_PATH: "/llm/models" - SERVED_MODEL_NAME: ${LLM_MODEL} - TENSOR_PARALLEL_SIZE: ${TENSOR_PARALLEL_SIZE:-1} - MAX_NUM_SEQS: ${MAX_NUM_SEQS:-64} - MAX_NUM_BATCHED_TOKENS: ${MAX_NUM_BATCHED_TOKENS:-10240} - MAX_MODEL_LEN: ${MAX_MODEL_LEN:-10240} - LOAD_IN_LOW_BIT: ${LOAD_IN_LOW_BIT:-fp8} - CCL_DG2_USM: ${CCL_DG2_USM:-""} - PORT: ${VLLM_SERVICE_PORT_0:-8100} - ZE_AFFINITY_MASK: ${SELECTED_XPU_0:-0} - shm_size: '32g' - entrypoint: /bin/bash -c "\ - cd /llm && \ - bash start-vllm-service.sh" -networks: - default: - driver: bridge diff --git a/EdgeCraftRAG/docker_compose/intel/gpu/arc/milvus.yaml b/EdgeCraftRAG/docker_compose/intel/gpu/arc/milvus-config.yaml similarity index 100% rename from EdgeCraftRAG/docker_compose/intel/gpu/arc/milvus.yaml rename to EdgeCraftRAG/docker_compose/intel/gpu/arc/milvus-config.yaml diff --git a/EdgeCraftRAG/docker_compose/intel/gpu/arc/multi-arc-yaml-generator.sh b/EdgeCraftRAG/docker_compose/intel/gpu/arc/multi-arc-yaml-generator.sh deleted file mode 100644 index 2a819eb552..0000000000 --- a/EdgeCraftRAG/docker_compose/intel/gpu/arc/multi-arc-yaml-generator.sh +++ /dev/null @@ -1,202 +0,0 @@ -#!/bin/bash -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -# Check if the correct number of arguments is provided -if [ "$#" -ne 2 ]; then - echo "Usage: $0 DP_NUM output-file-path" - exit 1 -fi - -# Get the port number from the command line argument -PORT_NUM=$1 - -# Start generating the Nginx configuration -cat < $2 -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -services: - etcd: - container_name: milvus-etcd - image: quay.io/coreos/etcd:v3.5.5 - environment: - - ETCD_AUTO_COMPACTION_MODE=revision - - ETCD_AUTO_COMPACTION_RETENTION=1000 - - ETCD_QUOTA_BACKEND_BYTES=4294967296 - - ETCD_SNAPSHOT_COUNT=50000 - volumes: - - \${DOCKER_VOLUME_DIRECTORY:-\${PWD}}/volumes/etcd:/etcd - command: etcd -advertise-client-urls=http://127.0.0.1:2379 -listen-client-urls http://0.0.0.0:2379 --data-dir /etcd - healthcheck: - test: ["CMD", "etcdctl", "endpoint", "health"] - interval: 30s - timeout: 20s - retries: 3 - deploy: - replicas: \${MILVUS_ENABLED:-0} - minio: - container_name: milvus-minio - image: minio/minio:RELEASE.2023-03-20T20-16-18Z - environment: - MINIO_ACCESS_KEY: minioadmin - MINIO_SECRET_KEY: minioadmin - ports: - - "\${MINIO_PORT1:-5044}:9001" - - "\${MINIO_PORT2:-5043}:9000" - volumes: - - \${DOCKER_VOLUME_DIRECTORY:-\${PWD}}/volumes/minio:/minio_data 
- command: minio server /minio_data --console-address ":9001" - healthcheck: - test: ["CMD", "curl", "-f", "http://localhost:9000/minio/health/live"] - interval: 30s - timeout: 20s - retries: 3 - deploy: - replicas: \${MILVUS_ENABLED:-0} - milvus-standalone: - container_name: milvus-standalone - image: milvusdb/milvus:v2.4.6 - command: ["milvus", "run", "standalone"] - security_opt: - - seccomp:unconfined - environment: - ETCD_ENDPOINTS: etcd:2379 - MINIO_ADDRESS: minio:9000 - volumes: - - ./milvus.yaml:/milvus/configs/milvus.yaml - - \${DOCKER_VOLUME_DIRECTORY:-\${PWD}}/volumes/milvus:/var/lib/milvus - healthcheck: - test: ["CMD", "curl", "-f", "http://localhost:9091/healthz"] - interval: 30s - start_period: 90s - timeout: 20s - retries: 3 - ports: - - "19530:19530" - - "\${MILVUS_STANDALONE_PORT:-9091}:9091" - depends_on: - - "etcd" - - "minio" - deploy: - replicas: \${MILVUS_ENABLED:-0} - edgecraftrag-server: - image: \${REGISTRY:-opea}/edgecraftrag-server:\${TAG:-latest} - container_name: edgecraftrag-server - environment: - no_proxy: \${no_proxy} - http_proxy: \${http_proxy} - https_proxy: \${https_proxy} - HF_ENDPOINT: \${HF_ENDPOINT} - vLLM_ENDPOINT: \${vLLM_ENDPOINT:-http://\${HOST_IP}:\${NGINX_PORT:-8086}} - LLM_MODEL: \${LLM_MODEL} - ENABLE_BENCHMARK: \${ENABLE_BENCHMARK:-false} - MAX_MODEL_LEN: \${MAX_MODEL_LEN:-5000} - CHAT_HISTORY_ROUND: \${CHAT_HISTORY_ROUND:-0} - volumes: - - \${MODEL_PATH:-\${PWD}}:/home/user/models - - \${DOC_PATH:-\${PWD}}:/home/user/docs - - \${TMPFILE_PATH:-\${PWD}}:/home/user/ui_cache - - \${HF_CACHE:-\${HOME}/.cache}:/home/user/.cache - - \${PROMPT_PATH:-\${PWD}}:/templates/custom - restart: always - ports: - - \${PIPELINE_SERVICE_PORT:-16010}:\${PIPELINE_SERVICE_PORT:-16010} - devices: - - /dev/dri:/dev/dri - group_add: - - \${VIDEOGROUPID:-44} - - \${RENDERGROUPID:-109} - ecrag: - image: \${REGISTRY:-opea}/edgecraftrag:\${TAG:-latest} - container_name: edgecraftrag - environment: - no_proxy: \${no_proxy} - http_proxy: \${http_proxy} - https_proxy: \${https_proxy} - MEGA_SERVICE_PORT: \${MEGA_SERVICE_PORT:-16011} - MEGA_SERVICE_HOST_IP: \${MEGA_SERVICE_HOST_IP:-\${HOST_IP}} - PIPELINE_SERVICE_PORT: \${PIPELINE_SERVICE_PORT:-16010} - PIPELINE_SERVICE_HOST_IP: \${PIPELINE_SERVICE_HOST_IP:-\${HOST_IP}} - restart: always - ports: - - \${MEGA_SERVICE_PORT:-16011}:\${MEGA_SERVICE_PORT:-16011} - depends_on: - - edgecraftrag-server - nginx: - image: nginx:latest - restart: always - ports: - - \${NGINX_PORT:-8086}:8086 - volumes: - - \${NGINX_CONFIG_PATH:-\${PWD}}:/etc/nginx/nginx.conf - depends_on: - - edgecraftrag-server - edgecraftrag-ui: - image: \${REGISTRY:-opea}/edgecraftrag-ui:\${TAG:-latest} - container_name: edgecraftrag-ui - environment: - no_proxy: \${no_proxy} - http_proxy: \${http_proxy} - https_proxy: \${https_proxy} - MEGA_SERVICE_PORT: \${MEGA_SERVICE_PORT:-16011} - MEGA_SERVICE_HOST_IP: \${MEGA_SERVICE_HOST_IP:-\${HOST_IP}} - PIPELINE_SERVICE_PORT: \${PIPELINE_SERVICE_PORT:-16010} - PIPELINE_SERVICE_HOST_IP: \${PIPELINE_SERVICE_HOST_IP:-\${HOST_IP}} - UI_SERVICE_PORT: \${UI_SERVICE_PORT:-8082} - UI_SERVICE_HOST_IP: \${UI_SERVICE_HOST_IP:-0.0.0.0} - volumes: - - \${TMPFILE_PATH:-\${PWD}}:/home/user/ui_cache - restart: always - ports: - - \${UI_SERVICE_PORT:-8082}:\${UI_SERVICE_PORT:-8082} - depends_on: - - edgecraftrag-server - - ecrag -EOL - -for ((i = 0; i < PORT_NUM; i++)); do - cat <> $2 - llm-serving-xpu-$i: - container_name: ipex-llm-serving-xpu-container-$i - image: intelanalytics/ipex-llm-serving-xpu:0.8.3-b20 - privileged: true - 
restart: always - ports: - - \${VLLM_SERVICE_PORT_$i:-8$((i+1))00}:\${VLLM_SERVICE_PORT_$i:-8$((i+1))00} - group_add: - - video - - \${VIDEOGROUPID:-44} - - \${RENDERGROUPID:-109} - volumes: - - \${LLM_MODEL_PATH:-\${MODEL_PATH}/\${LLM_MODEL}}:/llm/models - devices: - - /dev/dri - environment: - no_proxy: \${no_proxy} - http_proxy: \${http_proxy} - https_proxy: \${https_proxy} - HF_ENDPOINT: \${HF_ENDPOINT} - MODEL_PATH: "/llm/models" - SERVED_MODEL_NAME: \${LLM_MODEL} - TENSOR_PARALLEL_SIZE: \${TENSOR_PARALLEL_SIZE:-1} - MAX_NUM_SEQS: \${MAX_NUM_SEQS:-64} - MAX_NUM_BATCHED_TOKENS: \${MAX_NUM_BATCHED_TOKENS:-10240} - MAX_MODEL_LEN: \${MAX_MODEL_LEN:-10240} - LOAD_IN_LOW_BIT: \${LOAD_IN_LOW_BIT:-fp8} - CCL_DG2_USM: \${CCL_DG2_USM:-""} - PORT: \${VLLM_SERVICE_PORT_$i:-8$((i+1))00} - ZE_AFFINITY_MASK: \${SELECTED_XPU_$i:-$i} - shm_size: '32g' - entrypoint: /bin/bash -c "\\ - cd /llm && \\ - bash start-vllm-service.sh" -EOL -done -cat <> $2 -networks: - default: - driver: bridge -EOL - -echo "compose_vllm.yaml generated" diff --git a/EdgeCraftRAG/docker_compose/intel/gpu/arc/set_env.sh b/EdgeCraftRAG/docker_compose/intel/gpu/arc/set_env.sh index b587c32426..3247f3ce91 100755 --- a/EdgeCraftRAG/docker_compose/intel/gpu/arc/set_env.sh +++ b/EdgeCraftRAG/docker_compose/intel/gpu/arc/set_env.sh @@ -17,20 +17,15 @@ export HF_TOKEN=${HF_TOKEN} export no_proxy="localhost, 127.0.0.1, 192.168.1.1" export UI_UPLOAD_PATH=${UI_UPLOAD_PATH} export LLM_MODEL_PATH=${LLM_MODEL_PATH} -export NGINX_PORT_0=${NGINX_PORT_0} -export NGINX_PORT_1=${NGINX_PORT_1} -export NGINX_PORT_2=${NGINX_PORT_2} -export VLLM_SERVICE_PORT_0=${VLLM_SERVICE_PORT_0} -export VLLM_SERVICE_PORT_1=${VLLM_SERVICE_PORT_1} -export VLLM_SERVICE_PORT_2=${VLLM_SERVICE_PORT_2} + +export VLLM_SERVICE_PORT_B60=${VLLM_SERVICE_PORT_B60} +export VLLM_SERVICE_PORT_A770=${VLLM_SERVICE_PORT_A770} export TENSOR_PARALLEL_SIZE=${TENSOR_PARALLEL_SIZE} -export NGINX_CONFIG_PATH=${NGINX_CONFIG_PATH} -export SELECTED_XPU_0=${SELECTED_XPU_0} -export SELECTED_XPU_1=${SELECTED_XPU_1} -export SELECTED_XPU_2=${SELECTED_XPU_2} + export vLLM_ENDPOINT=${vLLM_ENDPOINT} export MAX_NUM_SEQS=${MAX_NUM_SEQS} export MAX_NUM_BATCHED_TOKENS=${MAX_NUM_BATCHED_TOKENS} export MAX_MODEL_LEN=${MAX_MODEL_LEN} export LOAD_IN_LOW_BIT=${LOAD_IN_LOW_BIT} export CCL_DG2_USM=${CCL_DG2_USM} +export ZE_AFFINITY_MASK=${ZE_AFFINITY_MASK} diff --git a/EdgeCraftRAG/docs/API_Guide.md b/EdgeCraftRAG/docs/API_Guide.md index 804fa45397..c13753596c 100644 --- a/EdgeCraftRAG/docs/API_Guide.md +++ b/EdgeCraftRAG/docs/API_Guide.md @@ -205,3 +205,18 @@ curl -X POST http://${HOST_IP}:16010/v1/chatqna/prompt/reset -H "Content-Type: a ```bash curl -X POST http://${HOST_IP}:16010/v1/chatqna/prompt-file -H "Content-Type: multipart/form-data" -F "file=@your_prompt_file.txt" ``` + +## ChatQnA + +### Retrieval API + +```bash +curl -X POST http://${HOST_IP}:16010/v1/retrieval -H "Content-Type: application/json" -d '{"messages":"#Please enter the question you need to retrieve here#", "top_n":5, "max_tokens":512}' | jq '.' + +``` + +### ChatQnA API + +```bash +curl -X POST http://${HOST_IP}:16011/v1/chatqna -H "Content-Type: application/json" -d '{"messages":"#REPLACE WITH YOUR QUESTION HERE#", "top_n":5, "max_tokens":512}' | jq '.' 
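+# Note: 16011 is the default MEGA_SERVICE_PORT of the EC-RAG megaservice, while the
+# retrieval endpoint above uses the pipeline server on PIPELINE_SERVICE_PORT (16010).
+# "top_n" and "max_tokens" are illustrative per-request values; tune them as needed.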
+``` diff --git a/EdgeCraftRAG/docs/Advanced_Setup.md b/EdgeCraftRAG/docs/Advanced_Setup.md index ef864fc1f4..af1cce8522 100644 --- a/EdgeCraftRAG/docs/Advanced_Setup.md +++ b/EdgeCraftRAG/docs/Advanced_Setup.md @@ -1,49 +1,5 @@ # Edge Craft Retrieval-Augmented Generation Advanced Setup -## Query Search - -Query Search features allow EC-RAG to do query pre-process before retrieval and reranking. To enable query search, vllm inference is required. Chinese version is available in [Query Search Zh](Query_Search_Zh.md) - -### 1. Sub-question file(s) example - -Sub-question files need to end with `.json` and follow json file format: main question as json key, sub-questions as json value. See below example: - -```json -{ - "Issue1": "Sub-question1.1? Sub-question1.2?", - "Issue2": "Sub-question2.1? Sub-question2.2? Sub-question2.3?" -} -``` - -> Note: 1. At lease one sub-question file is required. 2. Increasing main question amount would increase query time for EC-RAG. - -### 2. Sub-question file(s) location - -All sub-question files need to be placed under `${TMPFILE_PATH}/configs/search_dir`. - -### 3. Config file example - -Configure file includes variables such as prompts, temperature, etc. - -`instruction`, `input_template`, `output_template` would affect final prompt for query search. -`json_key` and `json_levels` are related to each other. For example, if `json_key` is set to "similarity", `json_levels` need list options for "similarity", such as "Low, Medium, High". - -One example for DeesSeep-R1-Distill-Qwen-32B configs is listed below: - -```yaml -query_matcher: - instructions: "Decide similarity of two queries. For exactly the same, mark as High, for totally different, mark as Low.\n" - input_template: " {} \n {} \n" - output_template: "output from {json_levels}.\n" - json_key: "similarity" - json_levels: ["Low", "Medium", "High"] - temperature: 3.7 -``` - -### 4. Config file location - -Config file needs to be placed under `${TMPFILE_PATH}/configs` and named as `search_config.yaml`, which gives final path as `${TMPFILE_PATH}/configs/search_config.yaml`. - ## OpenVINO Local Inference EC-RAG support using local OpenVINO models to do inference, please follow below steps to run local inference: @@ -55,9 +11,9 @@ EC-RAG support using local OpenVINO models to do inference, please follow below ```bash git clone https://github.com/opea-project/GenAIExamples.git cd GenAIExamples/EdgeCraftRAG -docker build --build-arg http_proxy=$http_proxy --build-arg https_proxy=$https_proxy --build-arg no_proxy="$no_proxy" -t opea/edgecraftrag:latest -f Dockerfile . -docker build --build-arg http_proxy=$http_proxy --build-arg https_proxy=$https_proxy --build-arg no_proxy="$no_proxy" -t opea/edgecraftrag-server:latest -f Dockerfile.server . -docker build --build-arg http_proxy=$http_proxy --build-arg https_proxy=$https_proxy --build-arg no_proxy="$no_proxy" -t opea/edgecraftrag-ui:latest -f ui/docker/Dockerfile.ui . +docker build --no-cache --pull --build-arg http_proxy=$http_proxy --build-arg https_proxy=$https_proxy --build-arg no_proxy="$no_proxy" -t opea/edgecraftrag:latest -f Dockerfile . +docker build --no-cache --pull --build-arg http_proxy=$http_proxy --build-arg https_proxy=$https_proxy --build-arg no_proxy="$no_proxy" -t opea/edgecraftrag-server:latest -f Dockerfile.server . +docker build --no-cache --pull --build-arg http_proxy=$http_proxy --build-arg https_proxy=$https_proxy --build-arg no_proxy="$no_proxy" -t opea/edgecraftrag-ui:latest -f ui/docker/Dockerfile.ui . ``` ### 2. 
Prepare models @@ -79,28 +35,22 @@ ip_address=$(hostname -I | awk '{print $1}') # Use `ip a` to check your active ip export HOST_IP=$ip_address # Your host ip -export DOC_PATH=${PWD} # Your doc path for uploading a dir of files -export TMPFILE_PATH=${PWD} # Your UI cache path for transferring files - # Check group id of video and render export VIDEOGROUPID=$(getent group video | cut -d: -f3) export RENDERGROUPID=$(getent group render | cut -d: -f3) -# If you have a proxy configured, uncomment below line -# export no_proxy=${no_proxy},${HOST_IP},edgecraftrag,edgecraftrag-server -# export NO_PROXY=${NO_PROXY},${HOST_IP},edgecraftrag,edgecraftrag-server +# If you have a proxy configured, execute below line +export no_proxy=${no_proxy},${HOST_IP},edgecraftrag,edgecraftrag-server +export NO_PROXY=${NO_PROXY},${HOST_IP},edgecraftrag,edgecraftrag-server # If you have a HF mirror configured, it will be imported to the container # export HF_ENDPOINT=https://hf-mirror.com # your HF mirror endpoint" -# By default, the ports of the containers are set, uncomment if you want to change -# export MEGA_SERVICE_PORT=16011 -# export PIPELINE_SERVICE_PORT=16010 -# export UI_SERVICE_PORT="8082" - # Make sure all 3 folders have 1000:1000 permission, otherwise -# chown 1000:1000 ${MODEL_PATH} ${DOC_PATH} ${TMPFILE_PATH} +export DOC_PATH=${PWD}/tests +export TMPFILE_PATH=${PWD}/tests +chown 1000:1000 -R ${MODEL_PATH} ${DOC_PATH} ${TMPFILE_PATH} # In addition, also make sure the .cache folder has 1000:1000 permission, otherwise -# chown 1000:1000 -R $HOME/.cache +chown 1000:1000 -R $HOME/.cache ``` ### 4. Start Edge Craft RAG Services with Docker Compose @@ -117,82 +67,22 @@ export MILVUS_ENABLED=0 # EC-RAG support pipeline performance benchmark, use ENABLE_BENCHMARK=true/false to turn on/off benchmark # export ENABLE_BENCHMARK= # change to your preference +export MAX_MODEL_LEN=5000 # Launch EC-RAG service with compose docker compose -f docker_compose/intel/gpu/arc/compose.yaml up -d ``` -## Multi-ARC Setup +## EC-RAG with Kbadmin -EC-RAG support run inference with multi-ARC in multiple isolated containers -Docker Images preparation is the same as local inference section, please refer to [Build Docker Images](#1-optional-build-docker-images-for-mega-service-server-and-ui-by-your-own) +EC-RAG support kbadmin as a knowledge base manager +Please make sure all the kbadmin services have been launched +EC-RAG Docker Images preparation is the same as local inference section, please refer to [Build Docker Images](#1-optional-build-docker-images-for-mega-service-server-and-ui-by-your-own) Model preparation is the same as vLLM inference section, please refer to [Prepare models](../docker_compose/intel/gpu/arc/README.md#2-prepare-models) -After docker images preparation and model preparation, please follow below steps to run multi-ARC Setup(Below steps show 2 vLLM container(2 DP) with multi Intel Arc GPUs): -### 1. Prepare env variables and configurations +### 1. 
Start Edge Craft RAG Services with Docker Compose -#### Prepare env variables for vLLM deployment - -```bash -ip_address=$(hostname -I | awk '{print $1}') -# Use `ip a` to check your active ip -export HOST_IP=$ip_address # Your host ip - -# The default LLM_MODEL_PATH is "${MODEL_PATH}/${LLM_MODEL}", you can change to your model path -# export LLM_MODEL_PATH= # change to your model path -export DOC_PATH=${PWD} # Your doc path for uploading a dir of files -export TMPFILE_PATH=${PWD} # Your UI cache path for transferring files - -# Check group id of video and render -export VIDEOGROUPID=$(getent group video | cut -d: -f3) -export RENDERGROUPID=$(getent group render | cut -d: -f3) - -# If you have a proxy configured, uncomment below line -# export no_proxy=${no_proxy},${HOST_IP},edgecraftrag,edgecraftrag-server -# export NO_PROXY=${NO_PROXY},${HOST_IP},edgecraftrag,edgecraftrag-server -# If you have a HF mirror configured, it will be imported to the container -# export HF_ENDPOINT=https://hf-mirror.com # your HF mirror endpoint" - -# By default, the ports of the containers are set, uncomment if you want to change -# export MEGA_SERVICE_PORT=16011 -# export PIPELINE_SERVICE_PORT=16010 -# export UI_SERVICE_PORT="8082" - -# Make sure all 3 folders have 1000:1000 permission, otherwise -# chown 1000:1000 ${MODEL_PATH} ${DOC_PATH} ${TMPFILE_PATH} -# In addition, also make sure the .cache folder has 1000:1000 permission, otherwise -# chown 1000:1000 -R $HOME/.cache - -export NGINX_PORT=8086 # Set port for nginx -export vLLM_ENDPOINT="http://${HOST_IP}:${NGINX_PORT}" -export DP_NUM=2 # How many containers you want to start to run inference -export VLLM_SERVICE_PORT_0=8100 # You can set your own vllm service port -export VLLM_SERVICE_PORT_1=8200 # You can set your own vllm service port -export TENSOR_PARALLEL_SIZE=1 # Your Intel Arc GPU number to do TP inference -export SELECTED_XPU_0=0 # Which GPU to select to run for container 0 -export SELECTED_XPU_1=1 # Which GPU to select to run for container 1 - -# Below are the extra env you can set for vllm -export MAX_NUM_SEQS=64 # MAX_NUM_SEQS value -export MAX_NUM_BATCHED_TOKENS=5000 # MAX_NUM_BATCHED_TOKENS value -export MAX_MODEL_LEN=5000 # MAX_MODEL_LEN value -export LOAD_IN_LOW_BIT=fp8 # the weight type value, expected: sym_int4, asym_int4, sym_int5, asym_int5 or sym_int8 -export CCL_DG2_USM="" # Need to set to 1 on Core to enable USM (Shared Memory GPUDirect). Xeon supports P2P and doesn't need this. -``` - -### 2. Generate nginx config file and compose yaml file - -```bash -# Generate your nginx config file -# nginx-conf-generator.sh requires 2 parameters: DP_NUM and output filepath -bash nginx/nginx-conf-generator.sh $DP_NUM nginx/nginx.conf # You can change TEMP_FILE_PATH to your reference -# set NGINX_CONFIG_PATH -export NGINX_CONFIG_PATH="${PWD}/nginx/nginx.conf" - -# Generate compose_vllm.yaml file -# multi-arc-yaml-generator.sh requires 2 parameters: DP_NUM and output filepath -bash docker_compose/intel/gpu/arc/multi-arc-yaml-generator.sh $DP_NUM docker_compose/intel/gpu/arc/compose_vllm.yaml -``` +This section is the same as default vLLM inference section, please refer to [Prepare env variables and configurations](../docker_compose/intel/gpu/arc/README.md#prepare-env-variables-and-configurations) and [Start Edge Craft RAG Services with Docker Compose](../docker_compose/intel/gpu/arc/README.md#deploy-the-service-on-arc-a770-using-docker-compose) -### 3. Start Edge Craft RAG Services with Docker Compose +### 2. 
Access Kbadmin UI -This section is the same as default vLLM inference section, please refer to [Start Edge Craft RAG Services with Docker Compose](../docker_compose/intel/gpu/arc/README.md#deploy-the-service-using-docker-compose) +please refer to [ChatQnA with Kbadmin in UI](./Explore_Edge_Craft_RAG.md#chatqna-with-kbadmin-in-ui) diff --git a/EdgeCraftRAG/docs/Explore_Edge_Craft_RAG.md b/EdgeCraftRAG/docs/Explore_Edge_Craft_RAG.md index a63b3a9f0e..0a5a91ba5e 100644 --- a/EdgeCraftRAG/docs/Explore_Edge_Craft_RAG.md +++ b/EdgeCraftRAG/docs/Explore_Edge_Craft_RAG.md @@ -33,3 +33,23 @@ After knowledge base creation, you can upload the documents for retrieval. Then, you can submit messages in the chat box in `Chat` page. ![chat_with_rag](../assets/img/chatqna.png) + +## ChatQnA with Kbadmin in UI + +### Kbadmin Pipeline + +In the `Node Parser` page, select 'kbadmin' as node parser. +![kbadmin_node_parser](../assets/img/kbadmin_type.png) + +In the `Indexer` page, input embedding and vector DB information, please note the embedding service port is 13020; the vector DB port is 29530. +![kbadmin_indexer](../assets/img/kbadmin_index.png) + +### Upload files & ChatQnA + +After the pipeline creation, you can go to `Knowledge Base` page and click `Create Knowledge Base` button to create your knowledge base. +Please select 'kbadmin' in `Type`and select kb name from the kbs you created in kbadmin UI page. + +![upload_data](../assets/img/kbadmin_kb.png) + +Then, you can submit messages in the chat box in `Chat` page. +![chat_with_rag](../assets/img/chatqna.png) diff --git a/EdgeCraftRAG/edgecraftrag/VERSION b/EdgeCraftRAG/edgecraftrag/VERSION old mode 100755 new mode 100644 index 40766d6bb4..0198c14133 --- a/EdgeCraftRAG/edgecraftrag/VERSION +++ b/EdgeCraftRAG/edgecraftrag/VERSION @@ -1 +1 @@ -25.05-Release +25.11-Dev diff --git a/EdgeCraftRAG/edgecraftrag/api/v1/agent.py b/EdgeCraftRAG/edgecraftrag/api/v1/agent.py new file mode 100644 index 0000000000..00a1b5db09 --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/api/v1/agent.py @@ -0,0 +1,148 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +import json +import os +import time + +from edgecraftrag.api_schema import AgentCreateIn +from edgecraftrag.base import AgentType +from edgecraftrag.config_repository import MilvusConfigRepository, save_agent_configurations +from edgecraftrag.context import ctx +from edgecraftrag.env import AGENT_FILE +from fastapi import FastAPI, HTTPException, status + +agent_app = FastAPI() + + +# GET Agents +@agent_app.get(path="/v1/settings/agents") +async def get_all_agents(): + out = [] + agents = ctx.get_agent_mgr().get_agents() + active_id = ctx.get_agent_mgr().get_active_agent_id() + for k, agent in agents.items(): + out.append( + AgentCreateIn( + idx=agent.idx, + name=agent.name, + type=agent.comp_subtype, + pipeline_idx=agent.pipeline_idx, + configs=agent.configs, + active=True if agent.idx == active_id else False, + ) + ) + return out + + +# GET Agent +@agent_app.get(path="/v1/settings/agents/{name}") +async def get_agent(name): + agent = ctx.get_agent_mgr().get_agent_by_name(name) + if agent: + isactive = True if agent.idx == ctx.get_agent_mgr().get_active_agent_id() else False + return AgentCreateIn( + idx=agent.idx, + name=agent.name, + type=agent.comp_subtype, + pipeline_idx=agent.pipeline_idx, + configs=agent.configs, + active=isactive, + ) + else: + raise HTTPException(status_code=status.HTTP_404_NOT_FOUND) + + +# POST Agent +@agent_app.post(path="/v1/settings/agents") +async def 
create_agent(request: AgentCreateIn, status_code=status.HTTP_201_CREATED): + try: + agent = ctx.get_agent_mgr().create_agent(request) + if agent: + await save_agent_configurations("add", ctx.get_agent_mgr().get_agents()) + return agent + except (ValueError, Exception) as e: + raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) + + +# PATCH Agent +@agent_app.patch(path="/v1/settings/agents/{name}") +async def update_agent(name, request: AgentCreateIn): + try: + agentmgr = ctx.get_agent_mgr() + if agentmgr.get_agent_by_name(name): + ret = agentmgr.update_agent(name, request) + if ret: + await save_agent_configurations("update", ctx.get_agent_mgr().get_agents()) + return ret + else: + raise HTTPException(status_code=status.HTTP_404_NOT_FOUND) + except (ValueError, Exception) as e: + raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) + + +# DELETE Agent +@agent_app.delete(path="/v1/settings/agents/{name}", status_code=status.HTTP_204_NO_CONTENT) +async def delete_agent(name): + try: + agentmgr = ctx.get_agent_mgr() + if agentmgr.get_agent_by_name(name): + if agentmgr.remove_agent(name): + await save_agent_configurations("delete", ctx.get_agent_mgr().get_agents()) + return + else: + raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR) + else: + raise HTTPException(status_code=status.HTTP_404_NOT_FOUND) + except (ValueError, Exception) as e: + raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) + + +# GET Agent Type default configs +@agent_app.get(path="/v1/settings/agents/configs/{agent_type}") +async def get_agent_default_configs(agent_type): + try: + if agent_type in [e.value for e in AgentType]: + return ctx.get_agent_mgr().get_agent_default_configs(agent_type) + else: + raise HTTPException(status_code=status.HTTP_404_NOT_FOUND) + except (ValueError, Exception) as e: + raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) + + +# Restore agent configurations +async def restore_agent_configurations(): + milvus_repo = MilvusConfigRepository.create_connection("agent_config", 1) + all_agents = [] + if milvus_repo: + time.sleep(10) + all_agents_repo = milvus_repo.get_configs() + for agent in all_agents_repo: + all_agents.append(agent.get("config_json")) + else: + if os.path.exists(AGENT_FILE): + with open(AGENT_FILE, "r", encoding="utf-8") as f: + all_agents = f.read() + if all_agents: + all_agents = json.loads(all_agents) + try: + for agent_data in all_agents: + agent_req = AgentCreateIn(**agent_data) + await load_agent(agent_req) + except Exception as e: + raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) + + +async def load_agent(request: AgentCreateIn): + agentmgr = ctx.get_agent_mgr() + agent = agentmgr.get_agent_by_name(request.name) + if agent is None: + # TODO: Restore idx back + # TODO: Update agent by import a json + agent = agentmgr.create_agent(request) + try: + await save_agent_configurations("add", ctx.get_agent_mgr().get_agents()) + except (ValueError, Exception) as e: + agentmgr.remove_agent_by_name(request.name) + raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) + return agent diff --git a/EdgeCraftRAG/edgecraftrag/api/v1/chatqna.py b/EdgeCraftRAG/edgecraftrag/api/v1/chatqna.py old mode 100755 new mode 100644 index c3facef41b..cb3fcdb409 --- a/EdgeCraftRAG/edgecraftrag/api/v1/chatqna.py +++ b/EdgeCraftRAG/edgecraftrag/api/v1/chatqna.py @@ -1,23 +1,36 @@ # 
Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 +import asyncio +import json +from concurrent.futures import ThreadPoolExecutor +from typing import List + import requests -from comps import GeneratedDoc from comps.cores.proto.api_protocol import ChatCompletionRequest from edgecraftrag.api_schema import RagOut from edgecraftrag.context import ctx -from edgecraftrag.utils import serialize_contexts, set_current_session -from fastapi import Body, FastAPI, File, HTTPException, UploadFile, status +from edgecraftrag.utils import chain_async_generators, serialize_contexts, stream_generator +from fastapi import Body, FastAPI, HTTPException, status from fastapi.responses import StreamingResponse chatqna_app = FastAPI() +thread_pool = ThreadPoolExecutor(max_workers=16) # Retrieval @chatqna_app.post(path="/v1/retrieval") async def retrieval(request: ChatCompletionRequest): try: - contexts = ctx.get_pipeline_mgr().run_retrieve(chat_request=request) + active_kb = ctx.knowledgemgr.get_active_knowledge_base() + if active_kb: + request.user = active_kb + else: + raise HTTPException( + status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, + detail="Retrieval needs to have an active knowledgebase", + ) + contexts = await ctx.get_pipeline_mgr().run_retrieve_postprocess(chat_request=request) serialized_contexts = serialize_contexts(contexts) ragout = RagOut(query=request.messages, contexts=serialized_contexts, response="") @@ -30,38 +43,81 @@ async def retrieval(request: ChatCompletionRequest): @chatqna_app.post(path="/v1/chatqna") async def chatqna(request: ChatCompletionRequest): try: + active_pl = ctx.get_pipeline_mgr().get_active_pipeline() sessionid = request.user - set_current_session(sessionid) - generator = ctx.get_pipeline_mgr().get_active_pipeline().generator - if generator: - request.model = generator.model_id + ctx.get_session_mgr().set_current_session(sessionid) + experience_kb = ctx.knowledgemgr.get_active_experience() + active_kb = ctx.knowledgemgr.get_active_knowledge_base() + request.user = active_kb if active_kb else None + if experience_kb: + request.tool_choice = "auto" if experience_kb.experience_active else "none" + + request.input = ctx.get_session_mgr().concat_history( + sessionid, active_pl.generator.inference_type, request.messages + ) + + # Run agent if activated, otherwise, run pipeline + if ctx.get_agent_mgr().get_active_agent(): + run_agent_gen = await ctx.get_agent_mgr().run_agent(chat_request=request) + return StreamingResponse(save_session(sessionid, run_agent_gen), media_type="text/plain") + + else: + generator = active_pl.generator + if generator: + request.model = generator.model_id + if request.stream: - ret, contexts = ctx.get_pipeline_mgr().run_pipeline(chat_request=request) - return ret + run_pipeline_gen, contexts = await ctx.get_pipeline_mgr().run_pipeline(chat_request=request) + return StreamingResponse(save_session(sessionid, run_pipeline_gen), media_type="text/plain") else: - ret, contexts = ctx.get_pipeline_mgr().run_pipeline(chat_request=request) + ret, contexts = await ctx.get_pipeline_mgr().run_pipeline(chat_request=request) + ctx.get_session_mgr().save_current_message(sessionid, "assistant", str(ret)) return str(ret) + except Exception as e: - raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) + raise HTTPException( + status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, + detail=f"ChatQnA Error: {e}", + ) # RAGQnA @chatqna_app.post(path="/v1/ragqna") async def ragqna(request: ChatCompletionRequest): try: 
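+        # The active knowledge base is carried via request.user; when an experience KB
+        # is active, tool_choice switches experience lookup on or off. Streaming requests
+        # rebuild the RagOut JSON on the fly by chaining async generators, while
+        # non-streaming requests return a RagOut object directly.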
- res, contexts = ctx.get_pipeline_mgr().run_pipeline(chat_request=request) - if isinstance(res, GeneratedDoc): - res = res.text - elif isinstance(res, StreamingResponse): - collected_data = [] - async for chunk in res.body_iterator: - collected_data.append(chunk) - res = "".join(collected_data) + sessionid = request.user + experience_kb = ctx.knowledgemgr.get_active_experience() + active_kb = ctx.knowledgemgr.get_active_knowledge_base() + request.user = active_kb if active_kb else None + if experience_kb: + request.tool_choice = "auto" if experience_kb.experience_active else "none" + generator = ctx.get_pipeline_mgr().get_active_pipeline().generator + if generator: + request.model = generator.model_id + if request.stream: + res_gen, contexts = await ctx.get_pipeline_mgr().run_pipeline(chat_request=request) - serialized_contexts = serialize_contexts(contexts) + # Escape newlines for json format as value + async def res_gen_json(): + async for token in res_gen: + yield token.replace("\n", "\\n") + + # Reconstruct RagOut in stream response + query_gen = stream_generator('{"query":"' + request.messages + '",') + + s_contexts = json.dumps(serialize_contexts(contexts)) + context_gen = stream_generator('"contexts":' + s_contexts + ',"response":"') + final_gen = stream_generator('"}') + output_gen = chain_async_generators([query_gen, context_gen, res_gen_json(), final_gen]) + + return StreamingResponse(output_gen, media_type="text/plain") + else: + ret, contexts = await ctx.get_pipeline_mgr().run_pipeline(chat_request=request) + serialized_contexts = serialize_contexts(contexts) + + ragout = RagOut(query=request.messages, contexts=serialized_contexts, response=str(ret)) + return ragout - ragout = RagOut(query=request.messages, contexts=serialized_contexts, response=str(res)) - return ragout except Exception as e: raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) @@ -82,3 +138,16 @@ def check_vllm(request_data: dict = Body(...)): raise HTTPException(status_code=500) except Exception as e: return {"status": "500", "message": f"connection failed: {str(e)}"} + + +async def save_session(sessionid, run_agent_gen): + collected_data = [] + session_mgr = ctx.get_session_mgr() + async for chunk in run_agent_gen: + if chunk: + collected_data.append(chunk) + current_content = "".join(collected_data) + session_mgr.update_current_message(sessionid, "assistant", current_content) + yield chunk or "" + await asyncio.sleep(0) + session_mgr.save_current_message(sessionid, "assistant", current_content) diff --git a/EdgeCraftRAG/edgecraftrag/api/v1/data.py b/EdgeCraftRAG/edgecraftrag/api/v1/data.py old mode 100755 new mode 100644 index 35ef7e25b7..9d5472f105 --- a/EdgeCraftRAG/edgecraftrag/api/v1/data.py +++ b/EdgeCraftRAG/edgecraftrag/api/v1/data.py @@ -1,12 +1,15 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 +import json import os +from typing import List from edgecraftrag.api_schema import DataIn, FilesIn +from edgecraftrag.config_repository import MilvusConfigRepository from edgecraftrag.context import ctx +from edgecraftrag.env import UI_DIRECTORY from fastapi import FastAPI, File, HTTPException, UploadFile, status -from werkzeug.utils import secure_filename data_app = FastAPI() @@ -14,16 +17,17 @@ # Upload a text or files @data_app.post(path="/v1/data") async def add_data(request: DataIn): + pl = ctx.get_pipeline_mgr().get_active_pipeline() docs = [] if request.text is not None: docs.extend(ctx.get_file_mgr().add_text(text=request.text)) if 
request.local_path is not None: docs.extend(ctx.get_file_mgr().add_files(docs=request.local_path)) - nodelist = ctx.get_pipeline_mgr().run_data_prepare(docs=docs) - if nodelist is None or len(nodelist) == 0: - raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail="File not found") - pl = ctx.get_pipeline_mgr().get_active_pipeline() + nodelist = await ctx.get_pipeline_mgr().run_data_prepare(docs=docs) + if pl.indexer.comp_subtype != "kbadmin_indexer": + if nodelist is None or len(nodelist) == 0: + raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail="File not found") ctx.get_node_mgr().add_nodes(pl.node_parser.idx, nodelist) return "Done" @@ -32,8 +36,8 @@ async def add_data(request: DataIn): @data_app.post(path="/v1/data/reindex") async def redindex_data(): pl = ctx.get_pipeline_mgr().get_active_pipeline() - ctx.get_node_mgr().del_nodes_by_np_idx(pl.node_parser.idx) + pl.indexer.reinitialize_indexer() pl.update_indexer_to_retriever() @@ -45,6 +49,71 @@ async def redindex_data(): return "Done" +# Gets the current nodelist +@data_app.get(path="/v1/data/nodes") +async def get_nodes_with_kb(kb_name=None): + node_lists = {} + active_pl = ctx.get_pipeline_mgr().get_active_pipeline() + if kb_name: + kb = ctx.get_knowledge_mgr().get_knowledge_base_by_name_or_id(kb_name) + else: + kb = ctx.get_knowledge_mgr().get_active_knowledge_base() + if active_pl.indexer.comp_subtype == "faiss_vector": + return active_pl.indexer.docstore.docs + elif active_pl.indexer.comp_subtype == "milvus_vector": + collection_name = kb.name + active_pl.name + Milvus_node_list = MilvusConfigRepository.create_connection(collection_name, 1, active_pl.indexer.vector_url) + results = Milvus_node_list.get_configs(output_fields=["text", "_node_content", "doc_id"]) + for node_list in results: + text = node_list.get("text") + node_content = json.loads(node_list.get("_node_content")) + node_content["doc_id"] = node_list.get("doc_id") + node_content["text"] = text + node_lists[node_content.get("id_")] = node_content + return node_lists + node_list = ctx.get_node_mgr().get_nodes(active_pl.node_parser.idx) + return node_list + + +# GET chunks by document name +@data_app.get(path="/v1/data/{document_name}/nodes") +async def get_nodes_by_document_name(document_name: str): + all_nodes = await get_nodes_with_kb() + matching_nodes = [] + for node in all_nodes.values() if isinstance(all_nodes, dict) else all_nodes: + metadata = node.get("metadata", {}) if isinstance(node, dict) else getattr(node, "metadata", {}) + node_file_name = metadata.get("file_name", "") + node_file_path = metadata.get("file_path", "") + if node_file_name == document_name or document_name in node_file_name or document_name in node_file_path: + matching_nodes.append(node) + return matching_nodes + + +# GET available document names +@data_app.get(path="/v1/data/documents") +async def get_document_names(): + all_nodes = await get_nodes_with_kb() + if not all_nodes: + return {"documents": []} + + documents = {} + for node in all_nodes.values() if isinstance(all_nodes, dict) else all_nodes: + metadata = node.get("metadata", {}) if isinstance(node, dict) else getattr(node, "metadata", {}) + file_name = metadata.get("file_name") + file_path = metadata.get("file_path") + if file_name and file_name not in documents: + documents[file_name] = { + "file_name": file_name, + "file_path": file_path, + "file_type": metadata.get("file_type", "unknown"), + "chunk_count": 0, + } + if file_name: + documents[file_name]["chunk_count"] += 1 + + return 
{"total_documents": len(documents), "documents": list(documents.values())} + + # Upload files by a list of file_path @data_app.post(path="/v1/data/files") async def add_files(request: FilesIn): @@ -103,16 +172,13 @@ async def upload_file(file_name: str, file: UploadFile = File(...)): ) try: # DIR for server to save files uploaded by UI - UI_DIRECTORY = os.getenv("TMPFILE_PATH", "/home/user/ui_cache") UPLOAD_DIRECTORY = os.path.normpath(os.path.join(UI_DIRECTORY, file_name)) if not UPLOAD_DIRECTORY.startswith(os.path.abspath(UI_DIRECTORY) + os.sep): raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail="Invalid file_name: directory traversal detected" ) os.makedirs(UPLOAD_DIRECTORY, exist_ok=True) - safe_filename = secure_filename(file.filename) - # Sanitize the uploaded file's name - safe_filename = secure_filename(file.filename) + safe_filename = file.filename file_path = os.path.normpath(os.path.join(UPLOAD_DIRECTORY, safe_filename)) # Ensure file_path is within UPLOAD_DIRECTORY if not file_path.startswith(os.path.abspath(UPLOAD_DIRECTORY)): diff --git a/EdgeCraftRAG/edgecraftrag/api/v1/knowledge_base.py b/EdgeCraftRAG/edgecraftrag/api/v1/knowledge_base.py old mode 100755 new mode 100644 index 21e0c0621e..6379b9c5ac --- a/EdgeCraftRAG/edgecraftrag/api/v1/knowledge_base.py +++ b/EdgeCraftRAG/edgecraftrag/api/v1/knowledge_base.py @@ -1,24 +1,32 @@ # Copyright (C) 2025 Intel Corporation # SPDX-License-Identifier: Apache-2.0 -import copy import json import os import re - -from edgecraftrag.api.v1.data import add_data -from edgecraftrag.api_schema import DataIn, KnowledgeBaseCreateIn -from edgecraftrag.base import IndexerType +from typing import Dict, List, Union + +from edgecraftrag.api.v1.data import get_nodes_with_kb +from edgecraftrag.api_schema import DataIn, ExperienceIn, KnowledgeBaseCreateIn +from edgecraftrag.components.query_preprocess import query_search +from edgecraftrag.components.retriever import get_kbs_info +from edgecraftrag.config_repository import ( + MilvusConfigRepository, + save_knowledge_configurations, + save_pipeline_configurations, +) from edgecraftrag.context import ctx -from edgecraftrag.utils import compare_mappings +from edgecraftrag.env import ( + KNOWLEDGEBASE_FILE, + SEARCH_CONFIG_PATH, + SEARCH_DIR, + UI_DIRECTORY, +) from fastapi import FastAPI, HTTPException, status -from pymilvus.exceptions import MilvusException +from llama_index.core.schema import Document kb_app = FastAPI() -# Define the root directory for knowledge base files -KNOWLEDGE_BASE_ROOT = "/home/user/ui_cache" - # Get all knowledge bases @kb_app.get(path="/v1/knowledge") @@ -41,16 +49,24 @@ async def get_knowledge_base(knowledge_name: str): async def create_knowledge_base(knowledge: KnowledgeBaseCreateIn): try: active_pl = ctx.get_pipeline_mgr().get_active_pipeline() + if not active_pl: + raise HTTPException( + status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, + detail="Please activate pipeline", + ) if not re.match(r"^[a-zA-Z_][a-zA-Z0-9_]*$", knowledge.name): raise HTTPException( status_code=status.HTTP_404_NOT_FOUND, detail="Knowledge base names must begin with a letter or underscore", ) - kb = ctx.knowledgemgr.create_knowledge_base(knowledge) - if kb.active: - active_pl.indexer.reinitialize_indexer(kb.name) + + if knowledge.active and knowledge.comp_type == "knowledge" and knowledge.comp_subtype == "origin_kb": + active_pl.indexer.reinitialize_indexer(knowledge.name) active_pl.update_indexer_to_retriever() - await save_knowledge_to_file() + elif knowledge.active and 
knowledge.comp_subtype == "kbadmin_kb": + active_pl.retriever.config_kbadmin_milvus(knowledge.name) + kb = ctx.knowledgemgr.create_knowledge_base(knowledge) + await save_knowledge_configurations("add", kb) return "Create knowledge base successfully" except Exception as e: raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail=str(e)) @@ -63,19 +79,33 @@ async def delete_knowledge_base(knowledge_name: str): rm_kb = ctx.knowledgemgr.get_knowledge_base_by_name_or_id(knowledge_name) active_kb = ctx.knowledgemgr.get_active_knowledge_base() active_pl = ctx.get_pipeline_mgr().get_active_pipeline() - if active_kb.name == knowledge_name or active_kb.idx == knowledge_name: - raise HTTPException( - status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail="Cannot delete a running knowledge base." - ) - kb_file_path = rm_kb.get_file_paths() - if kb_file_path: - if active_pl.indexer.comp_subtype == "milvus_vector": - await remove_file_handler([], knowledge_name) + if rm_kb.comp_type == "knowledge" and rm_kb.comp_subtype == "origin_kb": if active_kb: - active_pl.indexer.reinitialize_indexer(active_kb.name) - active_pl.update_indexer_to_retriever() + if active_kb.name == knowledge_name or active_kb.idx == knowledge_name: + raise HTTPException( + status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, + detail="Cannot delete a running knowledge base.", + ) + kb_file_path = rm_kb.get_file_paths() + if kb_file_path: + if active_pl.indexer.comp_subtype == "milvus_vector": + active_pl.indexer.clear_milvus_collection(knowledge_name) + active_pl.clear_document_cache(knowledge_name) + if active_kb: + active_pl.indexer.reinitialize_indexer(active_kb.name) + active_pl.update_indexer_to_retriever() + rm_kb.clear_documents(active_pl.name) + if rm_kb.comp_type == "experience": + if rm_kb.experience_active: + raise HTTPException( + status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, + detail="Cannot delete a running experience knowledge base.", + ) + else: + rm_kb.clear_experiences() result = ctx.knowledgemgr.delete_knowledge_base(knowledge_name) - await save_knowledge_to_file() + await save_knowledge_configurations("delete", rm_kb) + await save_pipeline_configurations("update", active_pl) return result except Exception as e: raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail=str(e)) @@ -87,28 +117,51 @@ async def update_knowledge_base(knowledge: KnowledgeBaseCreateIn): try: kb = ctx.knowledgemgr.get_knowledge_base_by_name_or_id(knowledge.name) active_pl = ctx.get_pipeline_mgr().get_active_pipeline() - if active_pl.indexer.comp_subtype != "milvus_vector": - if knowledge.active and knowledge.active != kb.active: - file_paths = kb.get_file_paths() - await update_knowledge_base_handler(file_paths, knowledge.name) - elif not knowledge.active and kb.description != knowledge.description: - pass - elif not knowledge.active: - raise HTTPException( - status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail="Must have an active knowledge base" - ) - else: + if active_pl.indexer.comp_subtype == "kbadmin_indexer" and kb.comp_subtype != "kbadmin_kb": + raise HTTPException( + status_code=status.HTTP_404_NOT_FOUND, + detail="The kbadmin pipeline must correspond to the kbadmin type kb.", + ) + if active_pl.indexer.comp_subtype != "kbadmin_indexer" and kb.comp_subtype == "kbadmin_kb": + raise HTTPException( + status_code=status.HTTP_404_NOT_FOUND, + detail="Not kbadmin pipeline cannot active kbadmin type kb.", + ) + if kb.comp_type == "knowledge" and kb.comp_subtype == "origin_kb": + if 
active_pl.indexer.comp_subtype != "milvus_vector": + if knowledge.active and knowledge.active != kb.active: + await handle_reload_data(kb, active_pl) + elif not knowledge.active and kb.description != knowledge.description: + pass + else: + if knowledge.active and knowledge.active != kb.active: + current_paths = kb.file_paths + file_paths = active_pl.compare_file_lists(kb.name, current_paths) + if "del_docs" not in file_paths: + await handle_pipeline_change(kb, active_pl, file_paths) + else: + need_delete_document_path = file_paths["del_docs"] + need_add_document_path = file_paths["add_docs"] + active_pl.indexer.reinitialize_indexer(kb.name) + if need_delete_document_path: + for file_path in need_delete_document_path: + await remove_file_from_knowledge_base(kb.name, DataIn(local_path=file_path)) + if need_add_document_path: + for file_path in need_add_document_path: + add_document = await add_file_to_knowledge_base( + kb.name, DataIn(local_path=file_path), False + ) + await add_document_handler(add_document) + active_pl.indexer.reinitialize_indexer(kb.name) + active_pl.update_indexer_to_retriever() + elif not knowledge.active and kb.description != knowledge.description: + pass + elif kb.comp_subtype == "kbadmin_kb": if knowledge.active and knowledge.active != kb.active: - active_pl.indexer.reinitialize_indexer(knowledge.name) - active_pl.update_indexer_to_retriever() - elif not knowledge.active and kb.description != knowledge.description: - pass - elif not knowledge.active: - raise HTTPException( - status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail="Must have an active knowledge base" - ) + active_pl.retriever.config_kbadmin_milvus(kb.name) result = ctx.knowledgemgr.update_knowledge_base(knowledge) - await save_knowledge_to_file() + await save_knowledge_configurations("update", kb) + await save_pipeline_configurations("update", active_pl) return result except Exception as e: raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail=str(e)) @@ -116,49 +169,68 @@ async def update_knowledge_base(knowledge: KnowledgeBaseCreateIn): # Add a files to the knowledge base @kb_app.post(path="/v1/knowledge/{knowledge_name}/files") -async def add_file_to_knowledge_base(knowledge_name, file_path: DataIn): +async def add_file_to_knowledge_base(knowledge_name, file_path: DataIn, only_add_file: bool = True): try: active_pl = ctx.get_pipeline_mgr().get_active_pipeline() kb = ctx.knowledgemgr.get_knowledge_base_by_name_or_id(knowledge_name) + if kb.comp_type == "experience": + raise HTTPException( + status_code=status.HTTP_404_NOT_FOUND, + detail="The experience type cannot perform file operations.", + ) + if kb.comp_subtype == "kbadmin_kb" or active_pl.indexer.comp_subtype == "kbadmin_indexer": + raise HTTPException( + status_code=status.HTTP_404_NOT_FOUND, + detail="Please proceed to the kbadmin interface to perform the operation.", + ) + # Validate and normalize the user-provided path user_path = file_path.local_path - normalized_path = os.path.normpath(os.path.join(KNOWLEDGE_BASE_ROOT, user_path)) - if not normalized_path.startswith(KNOWLEDGE_BASE_ROOT): + add_document = ctx.get_file_mgr().add_files(docs=user_path) + normalized_path = os.path.normpath(os.path.join(UI_DIRECTORY, user_path)) + if not normalized_path.startswith(UI_DIRECTORY): raise HTTPException(status_code=status.HTTP_400_BAD_REQUEST, detail="Invalid file path") if os.path.isdir(normalized_path): for root, _, files in os.walk(normalized_path): for file in files: file_full_path = os.path.join(root, file) if file_full_path not 
in kb.get_file_paths(): - kb.add_file_path(file_full_path) + kb.add_file_path(file_full_path, add_document, active_pl.name, only_add_file) + active_pl.add_docs_to_list(knowledge_name, file_full_path) else: - raise HTTPException(status_code=status.HTTP_409_CONFLICT, detail="File upload failed") - elif os.path.isfile(normalized_path) and normalized_path not in kb.get_file_paths(): - kb.add_file_path(normalized_path) + raise HTTPException( + status_code=status.HTTP_409_CONFLICT, + detail=f"File already exists {file_full_path}", + ) + elif os.path.isfile(normalized_path) and normalized_path in kb.get_file_paths() and only_add_file: + raise HTTPException( + status_code=status.HTTP_409_CONFLICT, + detail=f"File already exists {normalized_path}", + ) + elif os.path.isfile(normalized_path) and only_add_file: + kb.add_file_path(normalized_path, add_document, active_pl.name, only_add_file) + active_pl.add_docs_to_list(knowledge_name, user_path) + elif os.path.isfile(normalized_path): + kb.add_file_path(normalized_path, add_document, active_pl.name, only_add_file) + active_pl.add_docs_to_list(knowledge_name, user_path) + return add_document else: - raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail="File upload failed") + raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail="Error uploading file.") active_kb = ctx.knowledgemgr.get_active_knowledge_base() - kb_file_path = kb.get_file_paths() if active_pl.indexer.comp_subtype == "milvus_vector": - if active_kb: - if active_kb.name == knowledge_name or active_kb.idx == knowledge_name: - active_pl.indexer.reinitialize_indexer(active_kb.name) - active_pl.update_indexer_to_retriever() - await update_knowledge_base_handler(file_path, knowledge_name, add_file=True) - else: - await update_knowledge_base_handler(kb_file_path, knowledge_name) - active_pl.indexer.reinitialize_indexer(active_kb.name) - active_pl.update_indexer_to_retriever() + if knowledge_name == active_kb.name: + await add_document_handler(add_document) else: - await update_knowledge_base_handler(kb_file_path, knowledge_name) + active_pl.indexer.reinitialize_indexer(knowledge_name) + await add_document_handler(add_document) active_pl.indexer.reinitialize_indexer(active_kb.name) active_pl.update_indexer_to_retriever() else: if active_kb: if active_kb.name == knowledge_name or active_kb.idx == knowledge_name: - await update_knowledge_base_handler(file_path, knowledge_name, add_file=True) - - await save_knowledge_to_file() + await add_document_handler(add_document) + await save_knowledge_configurations("update", kb) + await save_pipeline_configurations("update", active_pl) return "File upload successfully" except ValueError as e: raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail=str(e)) @@ -170,193 +242,325 @@ async def remove_file_from_knowledge_base(knowledge_name, file_path: DataIn): try: active_pl = ctx.get_pipeline_mgr().get_active_pipeline() kb = ctx.knowledgemgr.get_knowledge_base_by_name_or_id(knowledge_name) - active_kb = ctx.knowledgemgr.get_active_knowledge_base() - if file_path.local_path in kb.get_file_paths(): - kb.remove_file_path(file_path.local_path) - else: - raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail="File remove failure") - - kb_file_path = kb.get_file_paths() - if active_pl.indexer.comp_subtype == "milvus_vector": - if active_kb: - if active_kb.name == knowledge_name or active_kb.idx == knowledge_name: - await remove_file_handler(kb_file_path, knowledge_name) - else: - await remove_file_handler(kb_file_path, 
knowledge_name) - active_pl.indexer.reinitialize_indexer(active_kb.name) - active_pl.update_indexer_to_retriever() - else: - await remove_file_handler(kb_file_path, knowledge_name) - active_pl.indexer.reinitialize_indexer(active_kb.name) - active_pl.update_indexer_to_retriever() - elif active_kb: - if active_kb.name == knowledge_name or active_kb.idx == knowledge_name: - await update_knowledge_base_handler(kb_file_path, knowledge_name) - await save_knowledge_to_file() + if kb.comp_type == "experience": + raise HTTPException( + status_code=status.HTTP_404_NOT_FOUND, + detail="The experience type cannot perform file operations.", + ) + if kb.comp_subtype == "kbadmin_kb" or active_pl.indexer.comp_subtype == "kbadmin_indexer": + raise HTTPException( + status_code=status.HTTP_404_NOT_FOUND, + detail="Please proceed to the kbadmin interface to perform the operation.", + ) + document_list = kb.remove_file_path(file_path.local_path, active_pl.name) + active_pl.del_docs_to_list(knowledge_name, file_path.local_path) + if not document_list: + raise HTTPException( + status_code=status.HTTP_404_NOT_FOUND, + detail="Deleted file documents not found", + ) + await remove_document_handler(document_list, knowledge_name) + await save_knowledge_configurations("update", kb) + await save_pipeline_configurations("update", active_pl) return "File deleted successfully" except ValueError as e: raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail=str(e)) +@kb_app.post("/v1/experience") +def get_experience_by_id_or_question(req: ExperienceIn): + kb = ctx.knowledgemgr.get_experience_kb() + result = kb.get_experience_by_id_or_question(req) + if not result: + raise HTTPException(404, detail="Experience not found") + return result + + +@kb_app.get("/v1/experiences") +def get_all_experience(): + kb = ctx.knowledgemgr.get_experience_kb() + if kb: + return kb.get_all_experience() + else: + return kb + + +@kb_app.patch("/v1/experiences") +def update_experience(experience: ExperienceIn): + kb = ctx.knowledgemgr.get_experience_kb() + result = kb.update_experience(experience.idx, experience.question, experience.content) + if not result: + raise HTTPException(404, detail="Question_idx or question not found") + return result + + +@kb_app.delete("/v1/experiences") +def delete_experience(req: ExperienceIn): + kb = ctx.knowledgemgr.get_experience_kb() + success = kb.delete_experience(req.idx) + if not success: + raise HTTPException(404, detail=f"Question {req.question} not found") + return {"message": "Question deleted"} + + +@kb_app.post("/v1/multiple_experiences/check") +def check_duplicate_multiple_experiences( + experiences: List[Dict[str, Union[str, List[str]]]], +): + kb = ctx.knowledgemgr.get_experience_kb() + if not kb: + raise HTTPException(404, detail="No active experience type knowledge base") + all_existing = kb.get_all_experience() + existing_questions = {item["question"] for item in all_existing if "question" in item} + new_questions = [exp["question"] for exp in experiences if "question" in exp and exp["question"]] + duplicate_questions = [q for q in new_questions if q in existing_questions] + if duplicate_questions: + return { + "code": 2001, + "detail": "Duplicate experiences are appended OR overwritten!", + } + else: + kb.add_multiple_experiences(experiences, True) + return { + "status": "success", + "detail": "No duplicate experiences, added successfully", + } + + +@kb_app.post("/v1/multiple_experiences/confirm") +def confirm_multiple_experiences(experiences: List[Dict[str, Union[str, List[str]]]], 
flag: bool): + kb = ctx.knowledgemgr.get_experience_kb() + try: + if not kb: + raise HTTPException(404, detail="No active experience type knowledge base") + kb.add_multiple_experiences(experiences, flag) + return {"status": "success", "detail": "Experiences added successfully"} + except Exception as e: + raise HTTPException(status_code=500, detail=f"Add Failure:{str(e)}") + + +@kb_app.post("/v1/experiences/files") +def add_experiences_from_file(req: DataIn): + kb = ctx.knowledgemgr.get_experience_kb() + try: + kb.add_experiences_from_file(req.local_path) + return {"status": "success"} + except Exception as e: + raise HTTPException(status_code=400, detail=str(e)) + + +@kb_app.post(path="/v1/view_sub_questions") +async def view_sub_questions(que: ExperienceIn): + active_pl = ctx.get_pipeline_mgr().get_active_pipeline() + top1_issue, sub_questions_result = await query_search( + user_input=que.question, + SEARCH_CONFIG_PATH=SEARCH_CONFIG_PATH, + SEARCH_DIR=SEARCH_DIR, + pl=active_pl, + ) + return sub_questions_result + + +@kb_app.get("/v1/kbadmin/kbs_list") +def get_kbs_list(): + active_pl = ctx.get_pipeline_mgr().get_active_pipeline() + try: + if not active_pl or active_pl.indexer.comp_subtype != "kbadmin_indexer": + return [] + CONNECTION_ARGS = {"uri": active_pl.indexer.vector_url} + kbs_list = get_kbs_info(CONNECTION_ARGS) + kb_names = [name for name in kbs_list.keys()] + return kb_names + except Exception as e: + raise HTTPException(status_code=400, detail=str(e)) + + # Update knowledge base data -async def update_knowledge_base_handler(file_path=None, knowledge_name: str = "default_kb", add_file: bool = False): +async def add_document_handler(all_document=None): if ctx.get_pipeline_mgr().get_active_pipeline() is None: - raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail="Please activate pipeline") + raise HTTPException( + status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, + detail="Please activate pipeline", + ) - pl = ctx.get_pipeline_mgr().get_active_pipeline() - if add_file and file_path: - return await add_data(file_path) - else: - try: - ctx.get_node_mgr().del_nodes_by_np_idx(pl.node_parser.idx) - pl.indexer.reinitialize_indexer(knowledge_name) - pl.update_indexer_to_retriever() - if file_path: - for file in file_path: - request = DataIn(local_path=file) - await add_data(request) - except MilvusException as e: - raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) - return "Done" + active_pl = ctx.get_pipeline_mgr().get_active_pipeline() + if all_document: + nodelist = await ctx.get_pipeline_mgr().run_data_prepare(docs=all_document) + if active_pl.indexer.comp_subtype != "kbadmin_indexer": + if nodelist is None or len(nodelist) == 0: + raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail="File not found") + ctx.get_node_mgr().add_nodes(active_pl.node_parser.idx, nodelist) + return "success update file" # Update knowledge base data -async def remove_file_handler(file_path=None, knowledge_name: str = "default_kb"): +async def remove_document_handler(document_list=None, knowledge_name: str = "default_kb"): if ctx.get_pipeline_mgr().get_active_pipeline() is None: - raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail="Please activate pipeline") + raise HTTPException( + status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, + detail="Please activate pipeline", + ) - pl = ctx.get_pipeline_mgr().get_active_pipeline() - ctx.get_node_mgr().del_nodes_by_np_idx(pl.node_parser.idx) - try: - 
pl.indexer.clear_milvus_collection(knowledge_name) - pl.indexer.reinitialize_indexer(knowledge_name) - except MilvusException as e: - raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) - pl.update_indexer_to_retriever() - if file_path: - for file in file_path: - request = DataIn(local_path=file) - await add_data(request) - return "Done" + active_pl = ctx.get_pipeline_mgr().get_active_pipeline() + active_kb = ctx.get_knowledge_mgr().get_active_knowledge_base() + ctx.get_node_mgr().del_nodes_by_np_idx(active_pl.node_parser.idx) + if active_pl.indexer.comp_subtype == "milvus_vector": + active_pl.indexer.reinitialize_indexer(knowledge_name) + active_pl.indexer.delete(document_list) + if active_kb: + active_pl.indexer.reinitialize_indexer(active_kb.name) + active_pl.update_indexer_to_retriever() + elif active_kb.name == knowledge_name: + await handle_reload_data(active_kb, active_pl) # Restore knowledge base configuration -async def load_knowledge_from_file(): - CONFIG_DIR = "/home/user/ui_cache/configs" - KNOWLEDGEBASE_FILE = os.path.join(CONFIG_DIR, "knowledgebase.json") +async def restore_knowledge_configurations(): + knowledgebase_config_repo = MilvusConfigRepository.create_connection("knowledgebase_config", 1) + all_datas = [] active_pl = ctx.get_pipeline_mgr().get_active_pipeline() - if os.path.exists(KNOWLEDGEBASE_FILE): - with open(KNOWLEDGEBASE_FILE, "r", encoding="utf-8") as f: - all_Knowledgebases = f.read() - try: + if knowledgebase_config_repo: + all_Knowledgebases_repo = knowledgebase_config_repo.get_configs() + for Knowledgebase_data in all_Knowledgebases_repo: + config_json = Knowledgebase_data.get("config_json") + all_datas.append(config_json) + else: + if os.path.exists(KNOWLEDGEBASE_FILE): + with open(KNOWLEDGEBASE_FILE, "r", encoding="utf-8") as f: + all_Knowledgebases = f.read() all_data = json.loads(all_Knowledgebases) for Knowledgebase_data in all_data: - pipeline_req = KnowledgeBaseCreateIn(**Knowledgebase_data) - kb = ctx.knowledgemgr.create_knowledge_base(pipeline_req) - if Knowledgebase_data["file_map"]: + all_datas.append(Knowledgebase_data) + try: + for Knowledgebase_data in all_datas: + Knoweldge_req = KnowledgeBaseCreateIn(**Knowledgebase_data) + kb = ctx.knowledgemgr.create_knowledge_base(Knoweldge_req) + if kb.comp_type == "knowledge" and kb.comp_subtype == "origin_kb": + if Knowledgebase_data["file_paths"]: if active_pl.indexer.comp_subtype != "milvus_vector" and Knowledgebase_data["active"]: - for file_path in Knowledgebase_data["file_map"].values(): - await update_knowledge_base_handler( - DataIn(local_path=file_path), Knowledgebase_data["name"], add_file=True - ) - kb.add_file_path(file_path) + await handle_reload_data(kb, active_pl) elif Knowledgebase_data["active"]: active_pl.indexer.reinitialize_indexer(Knowledgebase_data["name"]) active_pl.update_indexer_to_retriever() - for file_path in Knowledgebase_data["file_map"].values(): - kb.add_file_path(file_path) else: - for file_path in Knowledgebase_data["file_map"].values(): - kb.add_file_path(file_path) - except Exception as e: - print(f"Error load Knowledge base: {e}") - - -# Configuration of knowledge base for persistence -async def save_knowledge_to_file(): - CONFIG_DIR = "/home/user/ui_cache/configs" - KNOWLEDGEBASE_FILE = os.path.join(CONFIG_DIR, "knowledgebase.json") - if not os.path.exists(CONFIG_DIR): - os.makedirs(CONFIG_DIR, exist_ok=True) - try: - kb_base = ctx.knowledgemgr.get_all_knowledge_bases() - knowledgebases_data = [] - for kb in kb_base: - kb_json = 
{"name": kb.name, "description": kb.description, "active": kb.active, "file_map": kb.file_map} - knowledgebases_data.append(kb_json) - json_str = json.dumps(knowledgebases_data, indent=2, ensure_ascii=False) - with open(KNOWLEDGEBASE_FILE, "w", encoding="utf-8") as f: - f.write(json_str) + pass + elif kb.comp_subtype == "kbadmin_kb": + if Knowledgebase_data["active"]: + active_pl.retriever.config_kbadmin_milvus(kb.name) except Exception as e: - print(f"Error saving Knowledge base: {e}") - - -all_pipeline_milvus_maps = {} -current_pipeline_kb_map = {} - - -async def refresh_milvus_map(milvus_name): - current_pipeline_kb_map.clear() - knowledge_bases_list = await get_all_knowledge_bases() - for kb in knowledge_bases_list: - current_pipeline_kb_map[kb.name] = kb.file_map - all_pipeline_milvus_maps[milvus_name] = copy.deepcopy(current_pipeline_kb_map) + print(f"Error load Knowledge base: {e}") async def Synchronizing_vector_data(old_active_pl, new_active_pl): try: active_kb = ctx.knowledgemgr.get_active_knowledge_base() active_pl = ctx.get_pipeline_mgr().get_active_pipeline() - milvus_name = ( - old_active_pl.name + str(old_active_pl.indexer.model_extra["d"]) if old_active_pl else "default_kb" - ) + # Determine whether it is kbadmin type + if old_active_pl: + if ( + old_active_pl.retriever.comp_subtype == "kbadmin_retriever" + and new_active_pl.retriever.comp_subtype == "kbadmin_retriever" + ): + if active_kb: + if active_kb.comp_subtype == "kbadmin_kb": + new_active_pl.retriever.config_kbadmin_milvus(active_kb.name) + return True + elif old_active_pl.retriever.comp_subtype == "kbadmin_retriever": + return True if not active_kb: return True - if not active_pl: - if old_active_pl: - if old_active_pl.indexer.comp_subtype == "milvus_vector": - await refresh_milvus_map(milvus_name) + if new_active_pl.retriever.comp_subtype == "kbadmin_retriever": + if active_kb: + if active_kb.comp_subtype == "kbadmin_kb": + new_active_pl.retriever.config_kbadmin_milvus(active_kb.name) return True - + # Perform milvus data synchronization if new_active_pl.indexer.comp_subtype == "milvus_vector": - new_milvus_map = {} - kb_list = await get_all_knowledge_bases() - for kb in kb_list: - new_milvus_map[kb.name] = kb.file_map - added_files, deleted_files = compare_mappings( - new_milvus_map, - all_pipeline_milvus_maps.get(new_active_pl.name + str(new_active_pl.indexer.model_extra["d"]), {}), - ) - # Synchronization of deleted files - for kb_name, file_paths in deleted_files.items(): - if file_paths: - new_active_pl.indexer.clear_milvus_collection(kb_name) - if kb_name not in new_milvus_map.keys(): - continue - kb = await get_knowledge_base(kb_name) - new_active_pl.indexer.reinitialize_indexer(kb_name) - file_paths = kb.get_file_paths() - if file_paths: - for file in file_paths: - await add_data(DataIn(local_path=file)) - # Synchronization of added files - for kb_name, file_paths in added_files.items(): - if file_paths: - for file_path in file_paths.values(): - new_active_pl.indexer.reinitialize_indexer(kb_name) - await add_data(DataIn(local_path=file_path)) - - new_active_pl.indexer.reinitialize_indexer(active_kb.name) - new_active_pl.update_indexer_to_retriever() - await refresh_milvus_map(milvus_name) + # Pipeline component state not changed + current_paths = active_kb.file_paths + file_paths = active_pl.compare_file_lists(active_kb.name, current_paths) + if "del_docs" not in file_paths: + await handle_pipeline_change(active_kb, active_pl, file_paths) + else: + need_delete_document_path = file_paths["del_docs"] + 
need_add_document_path = file_paths["add_docs"] + active_pl.indexer.reinitialize_indexer(active_kb.name) + if need_delete_document_path: + for file_path in need_delete_document_path: + await remove_file_from_knowledge_base(active_kb.name, DataIn(local_path=file_path)) + if need_add_document_path: + for file_path in need_add_document_path: + add_document = await add_file_to_knowledge_base( + active_kb.name, DataIn(local_path=file_path), False + ) + await add_document_handler(add_document) + active_pl.indexer.reinitialize_indexer(active_kb.name) + active_pl.update_indexer_to_retriever() else: - new_active_pl.indexer.reinitialize_indexer() - new_active_pl.update_indexer_to_retriever() - add_list = active_kb.get_file_paths() - for file in add_list: - await add_data(DataIn(local_path=file)) - if old_active_pl: - if old_active_pl.indexer.comp_subtype == "milvus_vector": - await refresh_milvus_map(milvus_name) + await handle_reload_data(active_kb, active_pl) + await save_knowledge_configurations("update", active_kb) except Exception as e: raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=e) + + +# When the pipeline is changed, the current kb and the data of the pipeline are reconstructed +async def handle_pipeline_change(kb, pl, file_paths): + exist_file = False + need_add_document_path = file_paths["add_docs"] + node_lists = await get_nodes_with_kb(kb.name) + pl.indexer.clear_milvus_collection(kb.name) + if need_add_document_path: + if os.path.isfile(need_add_document_path[0]): + kb.clear_documents(pl.name) + exist_file = True + pl.indexer.reinitialize_indexer(kb.name) + for file_path in need_add_document_path: + if exist_file: + add_document = await add_file_to_knowledge_base(kb.name, DataIn(local_path=file_path), False) + await add_document_handler(add_document) + else: + add_document = [] + document = {} + documents_list = kb.get_all_document(file_path, pl.name) + for document in documents_list: + need_add_node_list = {} + for node in node_lists.values(): + if document.get("doc_id") == node.get("doc_id"): + need_add_node_list[node["id_"]] = node + docuement_text = pl.nodes_to_document(need_add_node_list) + document["id_"] = document.get("doc_id") + document["text"] = docuement_text + document["excluded_embed_metadata_keys"] = [ + "file_name", + "file_type", + "file_size", + "creation_date", + "last_modified_date", + "last_accessed_date", + ] + document["excluded_llm_metadata_keys"] = [ + "file_name", + "file_type", + "file_size", + "creation_date", + "last_modified_date", + "last_accessed_date", + ] + document["metadata"] = document.get("metadata") + result_document = Document.from_dict(data=document) + add_document.append(result_document) + pl.add_docs_to_list(kb.name, file_path) + await add_document_handler(add_document) + + +# reloading data that is not a milvus indexer +async def handle_reload_data(kb, pl): + pl.indexer.reinitialize_indexer() + pl.update_indexer_to_retriever() + need_add_document_path = kb.get_file_paths() + ctx.get_node_mgr().del_nodes_by_np_idx(pl.node_parser.idx) + kb.clear_documents(pl.name) + if need_add_document_path: + for file_path in need_add_document_path: + add_document = await add_file_to_knowledge_base(kb.name, DataIn(local_path=file_path), False) + await add_document_handler(add_document) diff --git a/EdgeCraftRAG/edgecraftrag/api/v1/model.py b/EdgeCraftRAG/edgecraftrag/api/v1/model.py index bbc0d9806b..8707384cdf 100644 --- a/EdgeCraftRAG/edgecraftrag/api/v1/model.py +++ b/EdgeCraftRAG/edgecraftrag/api/v1/model.py @@ -3,10 +3,12 
@@ import gc import os +from typing import Optional +import requests from edgecraftrag.api_schema import ModelIn from edgecraftrag.context import ctx -from fastapi import FastAPI, HTTPException, status +from fastapi import FastAPI, HTTPException, Query, status model_app = FastAPI() @@ -30,11 +32,22 @@ async def get_model_weight(model_id): # Search available model id @model_app.get(path="/v1/settings/avail-models/{model_type}") -async def get_model_id(model_type): +async def get_model_id( + model_type: str, + server_address: Optional[str] = Query(default=None, description="vLLM server address (optional)"), +): try: - return get_available_models(model_type) + if model_type == "vLLM": + if not server_address: + server_address = "http://localhost:8086" + return get_available_vllm_models(server_address) + else: + return get_available_models(model_type) except Exception as e: - raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=" GET model failed") + raise HTTPException( + status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, + detail=" GET model failed", + ) # GET Models @@ -123,7 +136,10 @@ def get_available_weights(model_path): def get_available_models(model_type): avail_models = [] - if model_type == "LLM": + if model_type == "vLLM": + LLM_MODEL = os.getenv("LLM_MODEL", "Qwen/Qwen3-8B") + avail_models.append(LLM_MODEL) + elif model_type == "LLM": items = os.listdir(CONTAINER_MODEL_PATH) for item in items: if item == "BAAI": @@ -134,9 +150,29 @@ def get_available_models(model_type): avail_models.append(item + "/" + sub_path) else: avail_models.append(item) + elif model_type == "kbadmin_embedding_model": + return ["BAAI/bge-large-zh-v1.5"] else: for item in os.listdir(CONTAINER_MODEL_PATH + "BAAI"): if (model_type == "reranker" and "rerank" in item) or (model_type == "embedding" and "rerank" not in item): avail_models.append("BAAI/" + item) return avail_models + + +@model_app.get(path="/v1/available_models") +def get_available_vllm_models(server_address: str): + try: + url = f"{server_address}/v1/models" + response = requests.get(url, timeout=60) + response.raise_for_status() + response_data = response.json() + model_entries = response_data.get("data", []) + models = [entry.get("id") for entry in model_entries if entry.get("id")] + + return models + + except requests.exceptions.RequestException as e: + raise HTTPException(status_code=500, detail=f"Failed to connect to vLLM server: {str(e)}") + except Exception as e: + raise HTTPException(status_code=500, detail=f"Error processing request: {str(e)}") diff --git a/EdgeCraftRAG/edgecraftrag/api/v1/pipeline.py b/EdgeCraftRAG/edgecraftrag/api/v1/pipeline.py old mode 100755 new mode 100644 index e1cd5b8345..216145fb9f --- a/EdgeCraftRAG/edgecraftrag/api/v1/pipeline.py +++ b/EdgeCraftRAG/edgecraftrag/api/v1/pipeline.py @@ -4,24 +4,42 @@ import asyncio import json import os +import re +import time import weakref from concurrent.futures import ThreadPoolExecutor from edgecraftrag.api.v1.knowledge_base import Synchronizing_vector_data from edgecraftrag.api_schema import MilvusConnectRequest, PipelineCreateIn -from edgecraftrag.base import IndexerType, InferenceType, ModelType, NodeParserType, PostProcessorType, RetrieverType +from edgecraftrag.base import ( + GeneratorType, + IndexerType, + InferenceType, + ModelType, + NodeParserType, + PostProcessorType, + RetrieverType, +) from edgecraftrag.components.benchmark import Benchmark -from edgecraftrag.components.generator import QnAGenerator -from edgecraftrag.components.indexer 
import VectorIndexer +from edgecraftrag.components.generator import FreeChatGenerator, QnAGenerator +from edgecraftrag.components.indexer import KBADMINIndexer, VectorIndexer from edgecraftrag.components.node_parser import ( HierarchyNodeParser, + KBADMINParser, SimpleNodeParser, SWindowNodeParser, UnstructedNodeParser, ) from edgecraftrag.components.postprocessor import MetadataReplaceProcessor, RerankProcessor -from edgecraftrag.components.retriever import AutoMergeRetriever, SimpleBM25Retriever, VectorSimRetriever +from edgecraftrag.components.retriever import ( + AutoMergeRetriever, + KBadminRetriever, + SimpleBM25Retriever, + VectorSimRetriever, +) +from edgecraftrag.config_repository import MilvusConfigRepository, save_pipeline_configurations from edgecraftrag.context import ctx +from edgecraftrag.env import PIPELINE_FILE from fastapi import FastAPI, File, HTTPException, UploadFile, status from pymilvus import connections @@ -51,17 +69,33 @@ async def get_pipeline_json(name): # GET Pipeline benchmark -@pipeline_app.get(path="/v1/settings/pipelines/{name}/benchmark") -async def get_pipeline_benchmark(name): - pl = ctx.get_pipeline_mgr().get_pipeline_by_name_or_id(name) +@pipeline_app.get(path="/v1/settings/pipeline/benchmark") +async def get_pipeline_benchmark(): + pl = ctx.get_pipeline_mgr().get_active_pipeline() if pl and pl.benchmark: return pl.benchmark +# GET Pipeline benchmark +@pipeline_app.get(path="/v1/settings/pipelines/{name}/benchmarks") +async def get_pipeline_benchmarks(name): + pl = ctx.get_pipeline_mgr().get_pipeline_by_name_or_id(name) + if pl and pl.benchmark: + return pl.benchmark.benchmark_data_list + + # POST Pipeline @pipeline_app.post(path="/v1/settings/pipelines") async def add_pipeline(request: PipelineCreateIn): - return load_pipeline(request) + pattern = re.compile(r"^[a-zA-Z0-9_]+$") + if not pattern.fullmatch(request.name): + raise HTTPException( + status_code=status.HTTP_400_BAD_REQUEST, + detail="Pipeline name must consist of letters, numbers, and underscores.", + ) + pl = await load_pipeline(request) + await save_pipeline_configurations("add", pl) + return pl # PATCH Pipeline @@ -73,15 +107,18 @@ async def update_pipeline(name, request: PipelineCreateIn): active_pl = ctx.get_pipeline_mgr().get_active_pipeline() if pl == active_pl: if request.active: - raise HTTPException(status_code=status.HTTP_423_LOCKED, detail="Unable to patch an active pipeline...") + raise HTTPException( + status_code=status.HTTP_423_LOCKED, + detail="Unable to patch an active pipeline...", + ) async with ctx.get_pipeline_mgr()._lock: try: - update_pipeline_handler(pl, request) + await update_pipeline_handler(pl, request) pipeline_dict = request.dict() pl.update_pipeline_json(pipeline_dict) except (ValueError, Exception) as e: raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) - save_pipeline_to_file() + await save_pipeline_configurations("update", pl) return pl @@ -89,8 +126,12 @@ async def update_pipeline(name, request: PipelineCreateIn): @pipeline_app.delete(path="/v1/settings/pipelines/{name}") async def remove_pipeline(name): try: + pl = ctx.get_pipeline_mgr().get_pipeline_by_name_or_id(name) + for _, agent in ctx.agentmgr.get_agents().items(): + if pl.idx == agent.pipeline_idx: + raise Exception(f"Please cancel the {agent.name}'s agent associated with the current pipeline first") res = ctx.get_pipeline_mgr().remove_pipeline_by_name_or_id(name) - save_pipeline_to_file() + await save_pipeline_configurations("delete", pl) return res except 
Exception as e: raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) @@ -102,30 +143,37 @@ async def upload_file(file: UploadFile = File(...)): content = await file.read() request = json.loads(content) pipeline_req = PipelineCreateIn(**request) - return load_pipeline(pipeline_req) + pl = await load_pipeline(pipeline_req) + await save_pipeline_configurations("add", pl) + return pl -def load_pipeline(request): +async def load_pipeline(request): pl = ctx.get_pipeline_mgr().get_pipeline_by_name_or_id(request.name) if pl is None: pipeline_json = request.model_dump_json() - pl = ctx.get_pipeline_mgr().create_pipeline(request.name, pipeline_json) + if request.idx is not None: + pl = ctx.get_pipeline_mgr().create_pipeline(request, pipeline_json) + else: + pl = ctx.get_pipeline_mgr().create_pipeline(request.name, pipeline_json) active_pl = ctx.get_pipeline_mgr().get_active_pipeline() if pl == active_pl and request.active: - raise HTTPException(status_code=status.HTTP_423_LOCKED, detail="Unable to patch an active pipeline...") + raise HTTPException( + status_code=status.HTTP_423_LOCKED, + detail="Unable to patch an active pipeline...", + ) try: - update_pipeline_handler(pl, request) - save_pipeline_to_file() + await update_pipeline_handler(pl, request) except (ValueError, Exception) as e: ctx.get_pipeline_mgr().remove_pipeline_by_name_or_id(request.name) raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) return pl -def update_pipeline_handler(pl, req): +async def update_pipeline_handler(pl, req): active_kb = ctx.knowledgemgr.get_active_knowledge_base() active_pipeline = ctx.get_pipeline_mgr().get_active_pipeline() - kb_name = active_kb.name if active_kb else "default_kb" + kb_name = active_kb.name if active_kb else "default" if req.node_parser is not None: np = req.node_parser @@ -153,12 +201,10 @@ def update_pipeline_handler(pl, req): pl.node_parser = SWindowNodeParser.from_defaults(window_size=np.window_size) case NodeParserType.UNSTRUCTURED: pl.node_parser = UnstructedNodeParser(chunk_size=np.chunk_size, chunk_overlap=np.chunk_overlap) + case NodeParserType.KBADMINPARSER: + pl.node_parser = KBADMINParser() ctx.get_node_parser_mgr().add(pl.node_parser) - all_docs = ctx.get_file_mgr().get_all_docs() - nodelist = pl.node_parser.run(docs=all_docs) - if nodelist is not None and len(nodelist) > 0: - ctx.get_node_mgr().add_nodes(pl.node_parser.idx, nodelist) pl._node_changed = True if req.indexer is not None: @@ -168,17 +214,24 @@ def update_pipeline_handler(pl, req): pl.indexer = found_indexer else: embed_model = None - if ind.embedding_model: - embed_model = ctx.get_model_mgr().search_model(ind.embedding_model) - if embed_model is None: - ind.embedding_model.model_type = ModelType.EMBEDDING - embed_model = ctx.get_model_mgr().load_model(ind.embedding_model) - ctx.get_model_mgr().add(embed_model) match ind.indexer_type: case IndexerType.DEFAULT_VECTOR | IndexerType.FAISS_VECTOR | IndexerType.MILVUS_VECTOR: + if ind.embedding_model: + embed_model = ctx.get_model_mgr().search_model(ind.embedding_model) + if embed_model is None: + ind.embedding_model.model_type = ModelType.EMBEDDING + embed_model = ctx.get_model_mgr().load_model(ind.embedding_model) + ctx.get_model_mgr().add(embed_model) # TODO: **RISK** if considering 2 pipelines with different # nodes, but same indexer, what will happen? 
- pl.indexer = VectorIndexer(embed_model, ind.indexer_type, ind.vector_uri, kb_name) + pl.indexer = VectorIndexer(embed_model, ind.indexer_type, ind.vector_url, kb_name) + case IndexerType.KBADMIN_INDEXER: + kbadmin_embedding_url = ind.embedding_url + KBADMIN_VECTOR_URL = ind.vector_url + embed_model = ind.embedding_model.model_id + pl.indexer = KBADMINIndexer( + embed_model, ind.indexer_type, kbadmin_embedding_url, KBADMIN_VECTOR_URL + ) case _: pass ctx.get_indexer_mgr().add(pl.indexer) @@ -208,6 +261,8 @@ def update_pipeline_handler(pl, req): pl.retriever = SimpleBM25Retriever(pl.indexer, similarity_top_k=retr.retrieve_topk) else: return Exception("No indexer") + case RetrieverType.KBADMIN_RETRIEVER: + pl.retriever = KBadminRetriever(pl.indexer, similarity_top_k=retr.retrieve_topk) case _: pass # Index is updated to retriever @@ -252,9 +307,12 @@ def update_pipeline_handler(pl, req): ctx.get_model_mgr().add(model) # Use weakref to achieve model deletion and memory release model_ref = weakref.ref(model) - pl.generator = QnAGenerator( - model_ref, gen.prompt_path, gen.inference_type, gen.vllm_endpoint, gen.prompt_content - ) + if gen.generator_type == GeneratorType.CHATQNA: + pl.generator = QnAGenerator( + model_ref, gen.prompt_path, gen.inference_type, gen.vllm_endpoint, gen.prompt_content + ) + elif gen.generator_type == GeneratorType.FREECHAT: + pl.generator = FreeChatGenerator(model_ref, gen.inference_type, gen.vllm_endpoint) if pl.enable_benchmark: if "tokenizer" not in locals() or tokenizer is None: _, tokenizer, bench_hook = ctx.get_model_mgr().load_model_ben(gen.model) @@ -268,73 +326,49 @@ def update_pipeline_handler(pl, req): ctx.get_pipeline_mgr().activate_pipeline(pl.name, req.active, ctx.get_node_mgr(), kb_name) # Create and set up a separate event loop to run asynchronous tasks in threads - def run_async_task(): - loop = asyncio.new_event_loop() - asyncio.set_event_loop(loop) - try: - loop.run_until_complete(Synchronizing_vector_data(active_pipeline, pl)) - except Exception as e: - raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=f"Synchronization error: {e}") - finally: - loop.close() - - with ThreadPoolExecutor(max_workers=1) as executor: - future = executor.submit(run_async_task) - future.result() + if req.active: + await Synchronizing_vector_data(active_pipeline, pl) return pl # Restore pipeline configuration -def load_pipeline_from_file(): - CONFIG_DIR = "/home/user/ui_cache/configs" - PIPELINE_FILE = os.path.join(CONFIG_DIR, "pipeline.json") - if os.path.exists(PIPELINE_FILE): - with open(PIPELINE_FILE, "r", encoding="utf-8") as f: - all_pipelines = f.read() - try: - all_da = json.loads(all_pipelines) - for pipeline_data in all_da: - one_pipelinejson = json.loads(pipeline_data) - pipeline_req = PipelineCreateIn(**one_pipelinejson) - load_pipeline(pipeline_req) - except Exception as e: - raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) - - -# Configuration of the persistence pipeline -def save_pipeline_to_file(): - CONFIG_DIR = "/home/user/ui_cache/configs" - PIPELINE_FILE = os.path.join(CONFIG_DIR, "pipeline.json") - - if not os.path.exists(CONFIG_DIR): - os.makedirs(CONFIG_DIR, exist_ok=True) +async def restore_pipeline_configurations(): + milvus_repo = MilvusConfigRepository.create_connection("pipeline_config", 20) + all_pipelines = [] + if milvus_repo: + time.sleep(10) + all_pipelines_repo = milvus_repo.get_configs() + for pipeline in all_pipelines_repo: + 
all_pipelines.append(pipeline.get("config_json")) + else: + if os.path.exists(PIPELINE_FILE): + with open(PIPELINE_FILE, "r", encoding="utf-8") as f: + all_pipelines = f.read() + if all_pipelines: + all_pipelines = json.loads(all_pipelines) try: - pipelines_data = ctx.get_pipeline_mgr().get_pipelines() - all_pipeline_json = [] - for pipeline in pipelines_data: - all_pipeline_json.append(pipeline.get_pipeline_json) - json_str = json.dumps(all_pipeline_json, indent=2, ensure_ascii=False) - with open(PIPELINE_FILE, "w", encoding="utf-8") as f: - f.write(json_str) + for pipeline_data in all_pipelines: + pipeline_req = PipelineCreateIn(**pipeline_data) + await load_pipeline(pipeline_req) except Exception as e: - print(f"Error saving pipelines: {e}") + raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) # Detecting if milvus is connected @pipeline_app.post(path="/v1/check/milvus") async def check_milvus(request: MilvusConnectRequest): - vector_uri = request.vector_uri + vector_url = request.vector_url try: - if vector_uri.startswith("http://"): - host_port = vector_uri.replace("http://", "") - elif vector_uri.startswith("https://"): - host_port = vector_uri.replace("https://", "") + if vector_url.startswith("http://"): + host_port = vector_url.replace("http://", "") + elif vector_url.startswith("https://"): + host_port = vector_url.replace("https://", "") else: - host_port = vector_uri + host_port = vector_url host, port = host_port.split(":", 1) - connections.connect(alias="default", host=host, port=port) + connections.connect(alias="knowledge_default", host=host, port=port) - if connections.has_connection("default"): + if connections.has_connection("knowledge_default"): return {"status": "200", "message": "Milvus connection successful."} else: return {"status": "404", "message": "Milvus connection failed."} diff --git a/EdgeCraftRAG/edgecraftrag/api/v1/prompt.py b/EdgeCraftRAG/edgecraftrag/api/v1/prompt.py index 86639a40a7..51ed5be6d4 100644 --- a/EdgeCraftRAG/edgecraftrag/api/v1/prompt.py +++ b/EdgeCraftRAG/edgecraftrag/api/v1/prompt.py @@ -1,8 +1,10 @@ # Copyright (C) 2025 Intel Corporation # SPDX-License-Identifier: Apache-2.0 +from edgecraftrag.api.v1.pipeline import save_pipeline_configurations from edgecraftrag.api_schema import PromptIn from edgecraftrag.context import ctx +from edgecraftrag.utils import DEFAULT_TEMPLATE from fastapi import FastAPI, File, HTTPException, UploadFile, status prompt_app = FastAPI() @@ -12,11 +14,13 @@ @prompt_app.post(path="/v1/chatqna/prompt-file") async def load_prompt_file(file: UploadFile = File(...)): try: - generator = ctx.get_pipeline_mgr().get_active_pipeline().generator + pl = ctx.get_pipeline_mgr().get_active_pipeline() + generator = pl.generator if generator: content = await file.read() prompt_str = content.decode("utf-8") generator.set_prompt(prompt_str) + await save_pipeline_configurations("update", pl) return "Set LLM Prompt Successfully" except Exception as e: raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) @@ -26,10 +30,12 @@ async def load_prompt_file(file: UploadFile = File(...)): @prompt_app.post(path="/v1/chatqna/prompt") async def load_prompt(request: PromptIn): try: - generator = ctx.get_pipeline_mgr().get_active_pipeline().generator + pl = ctx.get_pipeline_mgr().get_active_pipeline() + generator = pl.generator if generator: prompt_str = request.prompt generator.set_prompt(prompt_str) + await save_pipeline_configurations("update", pl) return "Set LLM Prompt 
Successfully" except Exception as e: raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) @@ -38,14 +44,30 @@ async def load_prompt(request: PromptIn): # Get prompt of LLM ChatQnA @prompt_app.get(path="/v1/chatqna/prompt") async def get_prompt(): + try: + generator = ctx.get_pipeline_mgr().get_active_pipeline().generator + if generator: + return generator.original_template + except Exception as e: + raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) + + +@prompt_app.get(path="/v1/chatqna/prompt/tagged") +async def get_tagged_prompt(): try: generator = ctx.get_pipeline_mgr().get_active_pipeline().generator if generator: return generator.prompt + raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail="Tagged prompt not found") except Exception as e: raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e)) +@prompt_app.get(path="/v1/chatqna/prompt/default") +async def get_default_prompt(): + return DEFAULT_TEMPLATE + + # Reset prompt for LLM ChatQnA @prompt_app.post(path="/v1/chatqna/prompt/reset") async def reset_prompt(): diff --git a/EdgeCraftRAG/edgecraftrag/api/v1/session.py b/EdgeCraftRAG/edgecraftrag/api/v1/session.py new file mode 100644 index 0000000000..d2427f7334 --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/api/v1/session.py @@ -0,0 +1,19 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +from edgecraftrag.api_schema import SessionIn +from edgecraftrag.context import ctx +from fastapi import FastAPI + +session_app = FastAPI() + + +@session_app.get("/v1/sessions") +def get_all_sessions(): + return ctx.get_session_mgr().get_all_sessions() + + +@session_app.get("/v1/session/{idx}") +def get_session_by_id(idx: str): + content = ctx.get_session_mgr().get_session_by_id(idx) + return {"session_id": idx, "session_content": content} diff --git a/EdgeCraftRAG/edgecraftrag/api_schema.py b/EdgeCraftRAG/edgecraftrag/api_schema.py index d7ae1c8478..b57b2da604 100644 --- a/EdgeCraftRAG/edgecraftrag/api_schema.py +++ b/EdgeCraftRAG/edgecraftrag/api_schema.py @@ -1,8 +1,9 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 -from typing import Any, Optional +from typing import Any, Dict, Optional +from edgecraftrag import base from pydantic import BaseModel @@ -12,6 +13,7 @@ class ModelIn(BaseModel): model_path: Optional[str] = "./" weight: Optional[str] = "INT4" device: Optional[str] = "cpu" + api_base: Optional[str] = None class NodeParserIn(BaseModel): @@ -25,7 +27,8 @@ class NodeParserIn(BaseModel): class IndexerIn(BaseModel): indexer_type: str embedding_model: Optional[ModelIn] = None - vector_uri: Optional[str] = None + embedding_url: Optional[str] = None + vector_url: Optional[str] = None class RetrieverIn(BaseModel): @@ -40,6 +43,7 @@ class PostProcessorIn(BaseModel): class GeneratorIn(BaseModel): + generator_type: str prompt_path: Optional[str] = None prompt_content: Optional[str] = None model: Optional[ModelIn] = None @@ -48,6 +52,7 @@ class GeneratorIn(BaseModel): class PipelineCreateIn(BaseModel): + idx: Optional[str] = None name: Optional[str] = None node_parser: Optional[NodeParserIn] = None indexer: Optional[IndexerIn] = None @@ -55,6 +60,7 @@ class PipelineCreateIn(BaseModel): postprocessor: Optional[list[PostProcessorIn]] = None generator: Optional[GeneratorIn] = None active: Optional[bool] = False + documents_cache: Optional[Dict] = None class DataIn(BaseModel): @@ -77,10 +83,35 @@ class PromptIn(BaseModel): class 
KnowledgeBaseCreateIn(BaseModel): + idx: Optional[str] = None name: str description: Optional[str] = None active: Optional[bool] = None + comp_type: Optional[str] = "knowledge" + comp_subtype: Optional[str] = "origin_kb" + experience_active: Optional[bool] = None + all_document_maps: Optional[Dict] = None + file_paths: Optional[list] = None + + +class ExperienceIn(BaseModel): + idx: Optional[str] = None + question: Optional[str] = None + content: list[str] = None class MilvusConnectRequest(BaseModel): - vector_uri: str + vector_url: str + + +class AgentCreateIn(BaseModel): + idx: Optional[str] = None + name: Optional[str] = "" + type: Optional[base.AgentType] = None + pipeline_idx: Optional[str] = None + configs: Optional[dict] = None + active: Optional[bool] = False + + +class SessionIn(BaseModel): + idx: Optional[str] = None diff --git a/EdgeCraftRAG/edgecraftrag/base.py b/EdgeCraftRAG/edgecraftrag/base.py index db1dc414b8..195302451c 100644 --- a/EdgeCraftRAG/edgecraftrag/base.py +++ b/EdgeCraftRAG/edgecraftrag/base.py @@ -4,7 +4,7 @@ import abc import uuid from enum import Enum -from typing import Any, Callable, List, Optional +from typing import Any, Optional from pydantic import BaseModel, ConfigDict, Field, model_serializer @@ -19,7 +19,12 @@ class CompType(str, Enum): RETRIEVER = "retriever" POSTPROCESSOR = "postprocessor" GENERATOR = "generator" + QUERYSEARCH = "querysearch" FILE = "file" + CHUNK_NUM = "chunk_num" + KNOWLEDGE = "knowledge" + AGENT = "agent" + SESSION = "session" class ModelType(str, Enum): @@ -28,6 +33,7 @@ class ModelType(str, Enum): RERANKER = "reranker" LLM = "llm" VLLM = "vllm" + VLLM_EMBEDDING = "vllm_embedding" class FileType(str, Enum): @@ -44,6 +50,7 @@ class NodeParserType(str, Enum): HIERARCHY = "hierarchical" SENTENCEWINDOW = "sentencewindow" UNSTRUCTURED = "unstructured" + KBADMINPARSER = "kbadmin_parser" class IndexerType(str, Enum): @@ -51,6 +58,7 @@ class IndexerType(str, Enum): FAISS_VECTOR = "faiss_vector" DEFAULT_VECTOR = "vector" MILVUS_VECTOR = "milvus_vector" + KBADMIN_INDEXER = "kbadmin_indexer" class RetrieverType(str, Enum): @@ -58,6 +66,7 @@ class RetrieverType(str, Enum): VECTORSIMILARITY = "vectorsimilarity" AUTOMERGE = "auto_merge" BM25 = "bm25" + KBADMIN_RETRIEVER = "kbadmin_retriever" class PostProcessorType(str, Enum): @@ -69,6 +78,7 @@ class PostProcessorType(str, Enum): class GeneratorType(str, Enum): CHATQNA = "chatqna" + FREECHAT = "freechat" class InferenceType(str, Enum): @@ -81,7 +91,18 @@ class CallbackType(str, Enum): DATAPREP = "dataprep" RETRIEVE = "retrieve" + RETRIEVE_POSTPROCESS = "retrieve_postprocess" + POSTPROCESS = "postprocess" + GENERATE = "generate" PIPELINE = "pipeline" + RUNAGENT = "run_agent" + QUERYSEARCH = "query_search" + + +class AgentType(str, Enum): + + SIMPLE = "simple" + DEEPSEARCH = "deep_search" class BaseComponent(BaseModel): @@ -113,9 +134,19 @@ class BaseMgr: def __init__(self): self.components = {} - def add(self, comp: BaseComponent): + def add(self, comp: BaseComponent, name: str = None): + if name: + self.components[name] = comp + return True self.components[comp.idx] = comp + def append(self, comp: BaseComponent, name: str = None): + key = name if name else comp.idx + if key not in self.components: + self.components[key] = [] + self.components[key].append(comp) + return True + def get(self, idx: str) -> BaseComponent: if idx in self.components: return self.components[idx] diff --git a/EdgeCraftRAG/edgecraftrag/components/agent.py b/EdgeCraftRAG/edgecraftrag/components/agent.py new file mode 
100644 index 0000000000..fd6c4ff7a2 --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/agent.py @@ -0,0 +1,114 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +import os +from abc import abstractmethod + +from comps.cores.proto.api_protocol import ChatCompletionRequest +from edgecraftrag.base import BaseComponent, CallbackType, CompType +from edgecraftrag.components.agents.utils import remove_think_tags +from edgecraftrag.utils import stream_generator +from langgraph.config import get_stream_writer +from pydantic import model_serializer + + +class Agent(BaseComponent): + + def __init__(self, name, agent_type, pipeline_idx, configs): + super().__init__(name=name, comp_type=CompType.AGENT, comp_subtype=agent_type) + if self.name == "" or self.name is None: + self.name = self.idx + self.enable_benchmark = os.getenv("ENABLE_BENCHMARK", "False").lower() == "true" + self.pipeline_idx = pipeline_idx + self.manager = None + self.configs = configs + + @classmethod + @abstractmethod + def get_default_configs(cls): + pass + + def get_bound_pipeline(self): + if self.manager is not None: + pl = self.manager.get_pipeline_by_name_or_id(self.pipeline_idx) + return pl + raise ValueError("No pipeline bound or bound pipeline not found") + + def get_active_knowledge_base(self): + if self.manager is not None: + kb = self.manager.get_active_knowledge_base() + return kb + return None + + async def llm_generate(self, request: ChatCompletionRequest, streaming): + request.stream = streaming + request.messages = self._messages + response = await self._run_pipeline_generate(request) + return response + + async def llm_generate_astream_writer(self, request, prefix=None, suffix=None) -> str: + response = "" + writer = get_stream_writer() + first = True + generator = await self.llm_generate(request, True) + async for chunk in generator: + if first and prefix: + writer(prefix + chunk) + first = False + else: + writer(chunk) + response += chunk + if suffix: + writer(suffix) + response = remove_think_tags(response) + return response + + # wrappers for calling pipeline + async def run_pipeline_chatqna(self, request): + pl = self.get_bound_pipeline() + if pl is not None: + return await pl.run(cbtype=CallbackType.PIPELINE, chat_request=request) + + async def _run_pipeline_generate(self, request): + pl = self.get_bound_pipeline() + if pl is not None: + return await pl.run(cbtype=CallbackType.GENERATE, chat_request=request) + + async def run_pipeline_retrieve_and_rerank(self, request): + pl = self.get_bound_pipeline() + if pl is not None: + return await pl.run(cbtype=CallbackType.RETRIEVE_POSTPROCESS, chat_request=request) + + async def run_pipeline_retrieve(self, request): + pl = self.get_bound_pipeline() + if pl is not None: + return await pl.run(cbtype=CallbackType.RETRIEVE, chat_request=request) + + async def run_pipeline_rerank(self, request, contexts): + pl = self.get_bound_pipeline() + if pl is not None: + return await pl.run(cbtype=CallbackType.POSTPROCESS, chat_request=request, contexts=contexts) + + async def run_pipeline_query_search(self, request): + pl = self.get_bound_pipeline() + if pl is not None: + return await pl.run(cbtype=CallbackType.QUERYSEARCH, chat_request=request) + + @model_serializer + def ser_model(self): + isactive = True if self.idx == self.manager.get_active_agent_id() else False + set = { + "idx": self.idx, + "name": self.name, + "type": self.comp_subtype, + "pipeline_idx": self.pipeline_idx, + "configs": self.configs, + "active": isactive, + } + return 
set + + +async def stream_writer(input): + writer = get_stream_writer() + async for chunk in stream_generator(input): + writer(chunk) diff --git a/EdgeCraftRAG/edgecraftrag/components/agents/__init__.py b/EdgeCraftRAG/edgecraftrag/components/agents/__init__.py new file mode 100644 index 0000000000..4057dc0163 --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/agents/__init__.py @@ -0,0 +1,2 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 diff --git a/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/__init__.py b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/__init__.py new file mode 100644 index 0000000000..4057dc0163 --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/__init__.py @@ -0,0 +1,2 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 diff --git a/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/cfgs/default.json b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/cfgs/default.json new file mode 100644 index 0000000000..98afc83cb3 --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/cfgs/default.json @@ -0,0 +1,24 @@ +{ + "system_instruction": "As an expert AI assistant for TCB Bonder systems, your goal is to provide accurate solutions. Analyze the user's question, create a retrieval plan, gather information, and synthesize a step-by-step answer. Follow all instructions.", + "plan_instruction": "To maximize retrieval recall, create a multi-step query plan. First, deconstruct the user's question into its core components and symptoms. Then, generate hypotheses about the potential root causes. Finally, create a numbered list of 2-5 queries to investigate these hypotheses.\n\n* **Step 1 (Rephrase and Broaden):** Start with a comprehensive query that rephrases the user's question, including synonyms and alternative phrasings to ensure broad initial coverage.\n* **Subsequent Steps (Hypothesis Testing):** Each following query should be a targeted, self-contained question designed to confirm or deny a specific hypothesis. These queries must include precise technical terms, component names, and potential error codes to retrieve the most relevant documents.\n\nYour final output must be only the numbered list of queries.", + "query_instruction": "After each retrieval, evaluate if you have enough information to solve the problem. If not, and if your plan has more steps, formulate the next query. This query must be a concise, targeted sub-question with precise keywords to fill a specific knowledge gap. Do not use prefixes like 'Query:'./no_think", + "answer_instruction": "As a TCB Bonder expert, synthesize the retrieved information into a final, actionable answer for the user.\n\n**User's Question:**\n{question}\n\n**Retrieved Information:**\n{plan_with_information}\n\n**Your Task:**\n1. **Synthesize and Filter:** Review all retrieved context, using only the most relevant information to address the user's problem.\n2. **Structure and Format:** Organize the solution into a clear, step-by-step guide. Present it as a numbered or bulleted list, highlighting any warnings at the beginning./no_think", + "domain_knowledge": "", + "prompt_templates": { + "system": "{system_instruction}\n\n{query_instruction}\n\n{domain_knowledge}\n\n{experiences}\n", + "generate_query": "Now generate a query for the next retrieval./no_think", + "make_plan": "Now generate a plan based on the user's question above. 
\n\n{plan_instruction}\n\nFormat the plan as a (Python) list containing the ordered steps, each step is a string./no_think", + "plan": "The following is the plan to step by step retrieve knowledge needed and work out an answer to user's question:\n{plan_steps}\n", + "plan_step": "Step {num}: {step}.", + "context": "\n{context}\n\n", + "contexts": "The following are the retrieved contexts for current query.\n{contexts}\n", + "continue_decision": "Is more information needed? Answer Yes or No. Then explain why or why not.", + "experiences": "The following are question-plan examples by human experts. Refer to them to better make your plan. If you find that there is a question that is highly similar or exactly match the input question, then strictly follow the subquestions to make the plan.\n\n{experiences}\n" + }, + + "retrieve_top_k": 60, + "rerank_top_k": 3, + "mece_retrieval": true, + "max_retrievals": 3, + "max_plan_steps": 3 +} diff --git a/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/cfgs/tcb_demo_v8_rs_v3.json b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/cfgs/tcb_demo_v8_rs_v3.json new file mode 100644 index 0000000000..914924a59c --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/cfgs/tcb_demo_v8_rs_v3.json @@ -0,0 +1,25 @@ +{ + "system_instruction": "As an expert AI assistant for TCB Bonder systems, your goal is to provide accurate solutions. Analyze the user's question, create a retrieval plan, gather information, and synthesize a step-by-step answer. Follow all instructions.", + "plan_instruction": "To maximize retrieval recall, create a multi-step query plan. First, deconstruct the user's question into its core components and symptoms. Then, generate hypotheses about the potential root causes. Finally, create a numbered list of 2-5 queries to investigate these hypotheses.\n\n* **Step 1 (Rephrase and Broaden):** Start with a comprehensive query that rephrases the user's question, including synonyms and alternative phrasings to ensure broad initial coverage.\n* **Subsequent Steps (Hypothesis Testing):** Each following query should be a targeted, self-contained question designed to confirm or deny a specific hypothesis. These queries must include precise technical terms, component names, and potential error codes to retrieve the most relevant documents.\n\nYour final output must be only the numbered list of queries.", + "query_instruction": "After each retrieval, evaluate if you have enough information to solve the problem. If not, and if your plan has more steps, formulate the next query. This query must be a concise, targeted sub-question with precise keywords to fill a specific knowledge gap. Do not use prefixes like 'Query:'.", + "answer_instruction": "As a TCB Bonder expert, your task is to synthesize the raw, unfiltered retrieved documents into a final, actionable answer for the user.\n\n**User's Question:**\n{question}\n\n**Retrieved Information:**\n{plan_with_information}\n\n**Your Task:**\n1. **Synthesize and Filter:** The retrieved information consists of raw, and potentially noisy, document chunks. Critically evaluate the relevance and accuracy of all retrieved context. You must filter out irrelevant, redundant, or contradictory information to distill only the most pertinent facts for solving the user's problem.\n2. **Structure and Format:** Organize the solution into a clear, step-by-step guide. Present it as a numbered or bulleted list, highlighting any warnings at the beginning. 
Your answer must be based *only* on the provided retrieved information.", + "recur_summarize_instruction": "Now, identify the useful context (and ignore the irrelevant text) from the previous search steps and summarize the search process in a concise manner.", + "domain_knowledge": "", + "prompt_templates": { + "system": "{system_instruction}\n\n{query_instruction}\n\n{domain_knowledge}\n\n{experiences}\n", + "generate_query": "Now generate a query for the next retrieval.", + "make_plan": "Now generate a plan based on the user's question above. \n\n{plan_instruction}\n\nFormat the plan as a (Python) list containing the ordered steps, each step is a string.", + "plan": "The following is the plan to step by step retrieve knolwedge needed and work out a answer to user's question:\n{plan_steps}\n", + "plan_step": "Step {num}: {step}.", + "context": "\n{context}\n\n", + "contexts": "The following are the retrieved contexts for current query.\n{contexts}\n", + "continue_decision": "Is more information needed? Answer Yes or No. Then explain why or why not.", + "experiences": "The following are question-plan examples by human experts. Refer to them to better make your plan. If you find that there is a question that is highly similar or exactly match the input question, then strictly follow the subquestions to make the plan.\n\n{experiences}\n" + }, + + "retrieve_top_k": 60, + "rerank_top_k": 3, + "mece_retrieval": true, + "max_retrievals": 3, + "max_plan_steps": 6 +} diff --git a/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/cfgs/tcb_demo_v8_rss_v3.json b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/cfgs/tcb_demo_v8_rss_v3.json new file mode 100644 index 0000000000..b236df0a27 --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/cfgs/tcb_demo_v8_rss_v3.json @@ -0,0 +1,26 @@ +{ + "system_instruction": "As an expert AI assistant for TCB Bonder systems, your goal is to provide accurate solutions. Analyze the user's question, create a retrieval plan, gather information, and synthesize a step-by-step answer. Follow all instructions.", + "plan_instruction": "To maximize retrieval recall, create a multi-step query plan. First, deconstruct the user's question into its core components and symptoms. Then, generate hypotheses about the potential root causes. Finally, create a numbered list of 2-5 queries to investigate these hypotheses.\n\n* **Step 1 (Rephrase and Broaden):** Start with a comprehensive query that rephrases the user's question, including synonyms and alternative phrasings to ensure broad initial coverage.\n* **Subsequent Steps (Hypothesis Testing):** Each following query should be a targeted, self-contained question designed to confirm or deny a specific hypothesis. These queries must include precise technical terms, component names, and potential error codes to retrieve the most relevant documents.\n\nYour final output must be only the numbered list of queries.", + "query_instruction": "After each retrieval, evaluate if you have enough information to solve the problem. If not, and if your plan has more steps, formulate the next query. This query must be a concise, targeted sub-question with precise keywords to fill a specific knowledge gap. Do not use prefixes like 'Query:'.", + "answer_instruction": "As a TCB Bonder expert, your task is to synthesize the pre-processed, summarized information into a final, actionable answer for the user.\n\n**User's Question:**\n{question}\n\n**Retrieved Information:**\n{plan_with_information}\n\n**Your Task:**\n1. 
**Synthesize and Filter:** The retrieved information consists of concise summaries from multiple retrieval steps. Your primary goal is to integrate these summaries into a single, coherent response. While the information is pre-filtered, you must still identify and use only the most relevant details to address the user's specific problem.\n2. **Structure and Format:** Organize the solution into a clear, step-by-step guide. Present it as a numbered or bulleted list, highlighting any warnings at the beginning. Your answer must be based *only* on the provided summarized information.", + "recur_summarize_instruction": "Now, identify the useful context (and ignore the irrelevant text) from the previous search steps and summarize the search process in a concise manner.", + "domain_knowledge": "", + "prompt_templates": { + "system": "{system_instruction}\n\n{query_instruction}\n\n{domain_knowledge}\n\n{experiences}\n", + "generate_query": "Now generate a query for the next retrieval.", + "make_plan": "Now generate a plan based on the user's question above. \n\n{plan_instruction}\n\nFormat the plan as a (Python) list containing the ordered steps, each step is a string.", + "plan": "The following is the plan to step by step retrieve knolwedge needed and work out a answer to user's question:\n{plan_steps}\n", + "plan_step": "Step {num}: {step}.", + "context": "\n{context}\n\n", + "contexts": "The following are the retrieved contexts for current query.\n{contexts}\n", + "continue_decision": "Is more information needed? Answer Yes or No. Then explain why or why not.", + "experiences": "The following are question-plan examples by human experts. Refer to them to better make your plan. If you find that there is a question that is highly similar or exactly match the input question, then strictly follow the subquestions to make the plan.\n\n{experiences}\n" + }, + + "retrieve_top_k": 60, + "rerank_top_k": 3, + "mece_retrieval": true, + "max_retrievals": 3, + "max_plan_steps": 6, + "use_summarized_context": true +} diff --git a/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/config.py b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/config.py new file mode 100644 index 0000000000..1c40ed023c --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/config.py @@ -0,0 +1,86 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +"""Configuration models and helpers for Mini Deep Search.""" + +from __future__ import annotations + +import json +from pathlib import Path +from typing import Any, Dict + +from pydantic import BaseModel, Field + + +class PromptTemplates(BaseModel): + """Collection of prompt templates used by the DeepSearch workflow.""" + + system: str = Field(..., description="Template for the system prompt.") + generate_query: str = Field(..., description="Instruction for generating the next retrieval query.") + make_plan: str = Field(..., description="Instruction for constructing the retrieval plan.") + plan: str = Field(..., description="Format string for presenting the plan back to the model.") + plan_step: str = Field(..., description="Template used for each individual plan step.") + context: str = Field(..., description="Template for wrapping a single context chunk.") + contexts: str = Field(..., description="Template for presenting all contexts for evaluation.") + continue_decision: str = Field(..., description="Instruction asking the model whether more retrieval is needed.") + experiences: str = Field(..., description="Template used 
when experience search results are available.") + + +class Config(BaseModel): + """Runtime configuration for the Mini Deep Search pipeline.""" + + system_instruction: str + plan_instruction: str = "" + query_instruction: str + answer_instruction: str + domain_knowledge: str + retrieve_top_k: int + rerank_top_k: int + mece_retrieval: bool = False + max_retrievals: int + max_plan_steps: int = 7 + recur_summarize_instruction: str = "" + postproc: str = "defaults.py" + use_summarized_context: bool = False + prompt_templates: PromptTemplates + + +def _resolve_path(value: str, base_path: Path) -> str: + """Resolve value relative to ``base_path`` if it is an existing file.""" + if not value: + return value + value_path = Path(value) + if value_path.is_absolute(): + return str(value_path) + candidate = base_path / value + return str(candidate) if candidate.exists() else value + + +def load_config(config_path: str) -> Config: + """Load and normalise a configuration file. + + Args: + config_path: Path to the configuration JSON. + + Returns: + A fully-populated :class:`Config` instance. + """ + + config_file = Path(config_path).expanduser().resolve() + with config_file.open("r", encoding="utf-8") as handle: + config_dict: Dict[str, Any] = json.load(handle) + + base_dir = config_file.parent + + # Resolve relative paths where applicable. + for key in ("domain_knowledge", "postproc"): + if key in config_dict and isinstance(config_dict[key], str): + config_dict[key] = _resolve_path(config_dict[key], base_dir) + + cfg = Config(**config_dict) + + # Expand domain knowledge file lazily if it points to a file. + domain_path = Path(cfg.domain_knowledge) + if domain_path.exists() and domain_path.is_file(): + cfg.domain_knowledge = domain_path.read_text(encoding="utf-8") + + return cfg diff --git a/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/deep_search.py b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/deep_search.py new file mode 100644 index 0000000000..ada6713be1 --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/deep_search.py @@ -0,0 +1,628 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +"""Core DeepSearch implementation.""" + +from __future__ import annotations + +import asyncio +import os +from typing import Any, List, Tuple + +from comps.cores.proto.api_protocol import ChatCompletionRequest +from edgecraftrag.base import AgentType, CallbackType, CompType +from edgecraftrag.components.agent import Agent, stream_writer +from langgraph.graph import END, START, StateGraph +from pydantic import BaseModel, Field + +from .config import load_config +from .logging_utils import format_terminal_str, log_status +from .postprocessing import postproc_answer as default_postproc_answer +from .postprocessing import postproc_plan as default_postproc_plan +from .postprocessing import postproc_query as default_postproc_query +from .utils import Role, import_module_from_path + +DEFAULT_CONFIG = "./edgecraftrag/components/agents/deep_search/cfgs/default.json" + + +class Retrieval(BaseModel): + step: str + query: str + retrieved: List[Any] = Field(...) + reranked: List[Any] = Field(...) 
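For orientation, `Retrieval` above is the per-step record that the `DeepSearchState` defined next accumulates in its `retrievals` list. A minimal usage sketch follows, assuming a `DeepSearchState` instance named `state`; the string values are placeholders for the LlamaIndex node objects the real workflow stores.

```python
# Hypothetical usage sketch, not part of the diff: recording one retrieval step.
step_record = Retrieval(
    step="Investigate bond head over-temperature alarms",            # current plan step
    query="TCB bonder bond head over-temperature alarm root cause",  # query sent to the retriever
    retrieved=["chunk-12", "chunk-48", "chunk-97"],                   # placeholders for retrieved nodes
    reranked=["chunk-48"],                                            # placeholders for top reranked nodes
)
state.retrievals.append(step_record)        # DeepSearchState.retrievals keeps the step history
state.context_chunk_ids.append("chunk-48")  # later steps consult this list for de-duplication
```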
+ + +class DeepSearchState(BaseModel): + question: str + query: str + step: int + num_retrievals: int + answer: str + + plan: List[str] = Field(default_factory=list) + retrievals: List[Retrieval] = Field(default_factory=list) + context_chunk_ids: List[str] = Field(default_factory=list) + search_summaries: List[str] = Field(default_factory=list) + + request: ChatCompletionRequest + + +class DeepSearchAgent(Agent): + """Driver class orchestrating the deep search workflow.""" + + def __init__(self, idx, name, pipeline_idx, cfg): + super().__init__(name=name, agent_type=AgentType.DEEPSEARCH, pipeline_idx=pipeline_idx, configs=cfg) + + # Load the configuration + # TODO: remove deep path + self.cfg = load_config(DEFAULT_CONFIG) + if idx is not None: + self.idx = idx + if "retrieve_top_k" in cfg: + self.cfg.retrieve_top_k = cfg["retrieve_top_k"] + if "rerank_top_k" in cfg: + self.cfg.rerank_top_k = cfg["rerank_top_k"] + if "mece_retrieval" in cfg: + self.cfg.mece_retrieval = cfg["mece_retrieval"] + if "max_retrievals" in cfg: + self.cfg.max_retrievals = cfg["max_retrievals"] + if "max_plan_steps" in cfg: + self.cfg.max_plan_steps = cfg["max_plan_steps"] + + self.graph = self._build_graph() + self._messages: List[dict] = [] + self.conversation_history: List[dict] = [] + + postproc_module = None + if self.cfg.postproc: + try: + postproc_module = import_module_from_path(self.cfg.postproc) + except ImportError as exc: + log_status( + "⚠️", + format_terminal_str( + f"Failed to import postproc module '{self.cfg.postproc}': {exc}", color="yellow" + ), + ) + postproc_module = postproc_module or None + self.postproc_query = getattr(postproc_module, "postproc_query", default_postproc_query) + self.postproc_answer = getattr(postproc_module, "postproc_answer", default_postproc_answer) + self.postproc_plan = getattr(postproc_module, "postproc_plan", default_postproc_plan) + + @classmethod + def get_default_configs(cls): + cfg = load_config(DEFAULT_CONFIG) + return { + "retrieve_top_k": cfg.retrieve_top_k, + "rerank_top_k": cfg.rerank_top_k, + "mece_retrieval": cfg.mece_retrieval, + "max_retrievals": cfg.max_retrievals, + "max_plan_steps": cfg.max_plan_steps, + } + + def update(self, cfg): + retrieve = cfg.get("retrieve_top_k", None) + if retrieve and isinstance(retrieve, int): + self.cfg.retrieve_top_k = retrieve + self.configs["retrieve_top_k"] = retrieve + + rerank = cfg.get("rerank_top_k", None) + if rerank and isinstance(rerank, int): + self.cfg.rerank_top_k = rerank + self.configs["rerank_top_k"] = rerank + + mr = cfg.get("mece_retrieval", None) + if mr and isinstance(mr, int): + self.cfg.mece_retrieval = mr + self.configs["mece_retrieval"] = mr + + maxr = cfg.get("max_retrievals", None) + if maxr and isinstance(maxr, int): + self.cfg.max_retrievals = maxr + self.configs["max_retrievals"] = maxr + + mps = cfg.get("max_plan_steps", None) + if mps and isinstance(mps, int): + self.cfg.max_plan_steps = mps + self.configs["max_plan_steps"] = mps + + async def _build_init_messages(self, request: ChatCompletionRequest) -> List[dict]: + if os.path.isfile(self.cfg.domain_knowledge): + with open(self.cfg.domain_knowledge, "r", encoding="utf-8") as file: + self.cfg.domain_knowledge = file.read() + + experiences_block = "" + experience_status = True if request.tool_choice == "auto" else False + if experience_status: + log_status( + "🔍", + format_terminal_str( + "Retrieving experiences from experience knowledge base ...\n", + color="cyan", + bold=True, + ), + ) + _, query_search_result = await 
self.run_pipeline_query_search(request) + raw_examples = query_search_result + if isinstance(query_search_result, dict): + raw_examples = query_search_result.get("results") or "" + if isinstance(raw_examples, str): + examples = [chunk for chunk in raw_examples.split("\n\n") if chunk.strip()] + elif isinstance(raw_examples, list): + examples = [chunk for chunk in raw_examples if isinstance(chunk, str) and chunk.strip()] + else: + examples = [] + if examples: + num_retrieved = len(examples) + num_max_examples = 3 + if num_retrieved > num_max_examples: + examples = examples[:num_max_examples] + log_status( + "📚", + f"Retrieved {format_terminal_str(str(num_retrieved), color='cyan', bold=True)} similar questions from experience database.", + ) + log_status( + "⚠️", + f"Truncated to top {format_terminal_str(str(num_max_examples), color='cyan', bold=True)} examples for prompt.\n", + ) + else: + log_status( + "📚", + f"Retrieved {format_terminal_str(str(num_retrieved), color='cyan', bold=True)} similar questions from experience database.\n", + ) + experiences_block = self.cfg.prompt_templates.experiences.format(experiences="\n\n".join(examples)) + return [ + { + "role": Role.SYSTEM.value, + "content": self.cfg.prompt_templates.system.format( + system_instruction=self.cfg.system_instruction, + query_instruction=self.cfg.query_instruction, + domain_knowledge=self.cfg.domain_knowledge, + experiences=experiences_block, + ), + } + ] + + async def _retrieve_and_rerank( + self, state: DeepSearchState, mece_retrieve: bool = False + ) -> Tuple[List[Any], List[Any], List[str]]: + retrieval_query, rerank_query = self.postproc_query(state.query, state) + mece_retrieve = mece_retrieve or self.cfg.mece_retrieval + request = state.request + request.messages = retrieval_query + contexts = await self.run_pipeline_retrieve(request) + # Llamaindex NodeWithScore Structure + retrieved = contexts[CompType.RETRIEVER] + + if mece_retrieve: + new_retrieved = [node for node in retrieved if node.node_id not in state.context_chunk_ids] + # TODO: Using top_k from request, need to change? 
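+            # MECE retrieval: keep only chunks whose node_id has not been used in an
+            # earlier step, then cap the result at the request's top_k (see TODO above).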
+ new_retrieved = new_retrieved[: request.k] + else: + new_retrieved = retrieved + + contexts[CompType.RETRIEVER] = new_retrieved + + request = state.request + request.messages = rerank_query + contexts = await self.run_pipeline_rerank(request, contexts) + reranked = contexts[CompType.POSTPROCESSOR] + reranked_chunk_ids = [node.node_id for node in reranked] + return new_retrieved, reranked, state.context_chunk_ids + reranked_chunk_ids + + async def retrieve(self, state: DeepSearchState) -> dict: + retrieved, reranked, updated_chunk_ids = await self._retrieve_and_rerank(state) + log_status( + "🔍", + f"Retrieved {format_terminal_str(str(len(retrieved)), color='magenta', bold=True)} documents, " + f"Reranked to top {format_terminal_str(str(len(reranked)), color='magenta', bold=True)}.", + ) + await stream_writer(f"\n\n🔍 **Retrieved {str(len(retrieved))}, Reranked to top {str(len(reranked))}**\n\n") + new_retrieval = Retrieval( + step=state.plan[state.step], + query=state.query, + retrieved=retrieved, + reranked=reranked, + ) + return { + "num_retrievals": state.num_retrievals + 1, + "retrievals": [*state.retrievals, new_retrieval], + "context_chunk_ids": updated_chunk_ids, + } + + async def check_retrieved(self, state: DeepSearchState) -> str: + log_status("🤔", format_terminal_str("Evaluating if more information is needed", color="green")) + await stream_writer("\n\n🤔 **Evaluating if more information is needed**\n\n") + contexts = self.cfg.prompt_templates.contexts.format( + contexts="\n".join( + [self.cfg.prompt_templates.context.format(context=doc.text) for doc in state.retrievals[-1].reranked] + ) + ) + messages = [ + { + "role": Role.SYSTEM.value, + "content": contexts, + }, + { + "role": Role.SYSTEM.value, + "content": self.cfg.prompt_templates.continue_decision, + }, + ] + self._messages.extend(messages) + self.conversation_history.extend(messages) + if state.num_retrievals >= self.cfg.max_retrievals: + log_status( + "⚠️", + format_terminal_str( + f"Reached maximum retrievals: {self.cfg.max_retrievals}, stopping search\n", + color="yellow", + bold=True, + ), + ) + await stream_writer(f"\n\n⚠️ **Reached maximum retrievals: {self.cfg.max_retrievals}, stopping search**\n\n") + return "stop" + + response = await self.llm_generate_astream_writer(state.request) + + message = { + "role": Role.ASSISTANT.value, + "content": response, + } + self._messages.append(message) + self.conversation_history.append(message) + if response.upper().startswith("NO"): + log_status( + "✅", + format_terminal_str("Information is sufficient, moving to next step\n", color="green"), + ) + await stream_writer("\n\n✅ **Information is sufficient, moving to next step**\n\n") + return "stop" + log_status( + "🔄", + format_terminal_str("Need more information, generating new query ...", color="green"), + ) + await stream_writer("\n\n🔄 **Need more information, generating new query**\n\n") + return "continue" + + async def generate_query(self, state: DeepSearchState) -> dict: + await stream_writer("\n\n💡 **Generating a query to help to understand the question**\n\n") + message = { + "role": Role.SYSTEM.value, + "content": self.cfg.prompt_templates.generate_query, + } + self._messages.append(message) + self.conversation_history.append(message) + + response = await self.llm_generate_astream_writer(state.request) + + message = { + "role": Role.ASSISTANT.value, + "content": response, + } + self._messages.append(message) + self.conversation_history.append(message) + return {"query": response} + + async def execute_next_step(self, 
state: DeepSearchState) -> None: + step = state.plan[state.step] + title_str = format_terminal_str( + f"Executing Step {state.step + 1}/{len(state.plan)}:", + color="green", + bold=True, + ) + log_status("🚀", f"{title_str} {format_terminal_str(step, italic=True)}") + log_status("💡", format_terminal_str("Generating the initial query ...", color="green")) + await stream_writer(f'') + message = { + "role": Role.SYSTEM.value, + "content": f"Start to execute the step: {step}\n", + } + self._messages.append(message) + self.conversation_history.append(message) + + async def finish_search(self, state: DeepSearchState) -> dict: + await stream_writer("") + return {"step": state.step + 1, "num_retrievals": 0} + + async def check_execution(self, state: DeepSearchState) -> str: + if state.step >= len(state.plan): + log_status("🏁", format_terminal_str("All planned steps completed", color="cyan", bold=True)) + await stream_writer('') + return "stop" + return "continue" + + async def make_plan(self, state: DeepSearchState) -> dict: + log_status("📋", format_terminal_str("Making a plan ...", color="cyan", bold=True)) + await stream_writer('') + messages = [ + { + "role": Role.USER.value, + "content": state.question, + }, + { + "role": Role.SYSTEM.value, + "content": self.cfg.prompt_templates.make_plan.format(plan_instruction=self.cfg.plan_instruction), + }, + ] + self._messages.extend(messages) + self.conversation_history.extend(messages) + + response = await self.llm_generate(state.request, False) + + plan = self.postproc_plan(response, state, self.cfg) + num_plan_step = len(plan) + for i, step in enumerate(plan): + step_num_str = format_terminal_str(f"Step{i+1: >2d}:", color="green", bold=True) + step_str = format_terminal_str(step, bold=False, italic=True) + suffix = "\n" if i == num_plan_step - 1 else "" + log_status("📌", f"{step_num_str} {step_str}{suffix}") + await stream_writer(f"📌 Step{i+1: >2d}: {step}\n\n") + await stream_writer("") + plan_prompt = self.cfg.prompt_templates.plan.format( + plan_steps="\n".join( + [self.cfg.prompt_templates.plan_step.format(num=i + 1, step=step) for i, step in enumerate(plan)] + ) + ) + message = { + "role": Role.ASSISTANT.value, + "content": plan_prompt, + } + self._messages.append(message) + self.conversation_history.append(message) + return {"plan": plan, "step": 0, "num_retrievals": 0} + + async def summarize_search(self, state: DeepSearchState) -> dict: + log_status("📝", format_terminal_str("Summarizing the search process ...", color="cyan", bold=True)) + await stream_writer("📝 **Summarizing the search process**") + messages = [ + { + "role": Role.SYSTEM.value, + "content": self.cfg.recur_summarize_instruction, + } + ] + self._messages.extend(messages) + self.conversation_history.extend(messages) + + response = await self.llm_generate_astream_writer(state.request) + + message = { + "role": Role.ASSISTANT.value, + "content": response, + } + self.conversation_history.append(message) + self._messages = [ + self._messages[0], + self._messages[1], + self._messages[3], + ] + self._messages.append( + { + "role": Role.ASSISTANT.value, + "content": "The following is the summarized information from previous search steps:\n" + response, + } + ) + log_status("✅", format_terminal_str("Search process summarized\n", color="cyan", bold=True)) + await stream_writer("✅ **Search process summarized**") + return {"search_summaries": [*state.search_summaries, response]} + + async def generate_answer(self, state: DeepSearchState) -> dict: + log_status("📝", 
format_terminal_str("Generating the final answer ...", color="cyan", bold=True)) + await stream_writer('') + + if self.cfg.use_summarized_context and state.search_summaries: + plan_with_information = "Plan with Summarized Information:\n" + for i, step in enumerate(state.plan): + plan_with_information += f"Step {i+1}: {step}\n" + if i < len(state.search_summaries): + plan_with_information += f"- Summary: {state.search_summaries[i]}\n\n" + else: + plan_with_information += "- Summary: N/A\n\n" + else: + if not self.cfg.mece_retrieval: + plan_with_information = ( + "Plan:\n" + "\n".join([f"{i+1}. {step}" for i, step in enumerate(state.plan)]) + "\n\n" + ) + plan_with_information += "Retrieved Information:\n" + presented_ids = [] + for retrieval in state.retrievals: + for doc in retrieval.reranked: + node_id = doc.node_id + if node_id not in presented_ids: + plan_with_information += f"{doc.text}\n\n" + presented_ids.append(node_id) + else: + plan_with_information = "Plan with Retrieved Information:\n" + for i, step in enumerate(state.plan): + plan_with_information += f"Step {i+1}: {step}\n" + related_docs = [] + for retrieval in state.retrievals: + if retrieval.step == step: + related_docs = retrieval.reranked + break + for doc in related_docs: + plan_with_information += f"- {doc.text}\n" + plan_with_information += "\n" + + self._messages = [ + { + "role": Role.SYSTEM.value, + "content": self.cfg.answer_instruction.format( + question=state.question, + plan_with_information=plan_with_information, + ), + } + ] + self.conversation_history.extend(self._messages) + + response = await self.llm_generate_astream_writer(state.request) + + self.conversation_history.append( + { + "role": Role.ASSISTANT.value, + "content": response, + } + ) + answer = self.postproc_answer(response, state) + title_str = format_terminal_str("Final Answer:", color="blue", bold=True) + log_status( + "✅", + format_terminal_str( + f"{title_str}\n{format_terminal_str(answer, italic=True, bold=True)}", + color="blue", + bold=True, + ), + ) + return {"answer": answer} + + def _build_graph(self): + search = StateGraph(DeepSearchState) + search.add_node("generate_query", self.generate_query) + search.add_node("retrieve", self.retrieve) + search.add_node("finish_search", self.finish_search) + + search.add_edge(START, "generate_query") + search.add_edge("generate_query", "retrieve") + search.add_conditional_edges( + "retrieve", + self.check_retrieved, + { + "stop": "finish_search", + "continue": "generate_query", + }, + ) + if self.cfg.recur_summarize_instruction: + search.add_edge("finish_search", "summarize") + search.add_node("summarize", self.summarize_search) + search.add_edge("summarize", END) + else: + search.add_edge("finish_search", END) + + deep_search = StateGraph(DeepSearchState) + deep_search.add_node("make_plan", self.make_plan) + deep_search.add_node("execute_search_step", self.execute_next_step) + deep_search.add_node("search", search.compile()) + deep_search.add_node("final_answer", self.generate_answer) + + deep_search.add_edge(START, "make_plan") + deep_search.add_edge("make_plan", "execute_search_step") + deep_search.add_edge("execute_search_step", "search") + deep_search.add_conditional_edges( + "search", + self.check_execution, + { + "stop": "final_answer", + "continue": "execute_search_step", + }, + ) + deep_search.add_edge("final_answer", END) + + return deep_search.compile() + + def generate_report(self, result: dict, report_path: str) -> str: + import datetime + + log_status( + "📝", + format_terminal_str( + 
f"Generating markdown report at {report_path}", + color="cyan", + bold=True, + ), + ) + question = result.get("question", "No question provided") + plan = result.get("plan", []) + answer = result.get("answer", "No answer provided") + retrievals = result.get("retrievals", []) + search_summaries = result.get("search_summaries", []) + graph_mermaid = result.get("graph_mermaid", "") + timestamp = datetime.datetime.now().strftime("%Y-%m-%d %H:%M:%S") + + report = [ + "# Deep Search Report", + f"*Generated on: {timestamp}*", + "", + "## Original Question", + f"> {question}", + "", + "## Research Plan", + ] + for i, step in enumerate(plan): + report.append(f"{i+1}. {step}") + report.append("") + report.append("---") + report.append("## Search Statistics") + report.append(f"- **Total Retrieval Operations:** {len(retrievals)}") + if retrievals: + total_docs = sum(len(r.retrieved) for r in retrievals) + report.append(f"- **Total Documents Retrieved:** {total_docs}") + total_reranked = sum(len(r.reranked) for r in retrievals) + report.append(f"- **Total Documents After Reranking:** {total_reranked}") + report.append("") + report.append("---") + report.append("## Final Answer") + report.append(answer) + if search_summaries: + report.append("## Search Summaries") + for i, summary in enumerate(search_summaries): + report.append(f"### Summary for Step {i+1}") + report.append(summary) + report.append("") + report.append("---") + report.append("## Search Process Details") + for i, retrieval in enumerate(retrievals): + step_index = i + 1 + step_desc = retrieval.step + report.append(f"### Retrieval {step_index}: {step_desc}") + report.append(f'**Query:** "{retrieval.query}"') + report.append("#### Retrieved Documents Summary") + for j, doc in enumerate(retrieval.reranked[:3]): + doc_content = doc.text + if len(doc_content) > 500: + doc_content = doc_content[:500] + "..." 
+ doc_content = doc_content.replace("\n", "\n> ") + report.append(f"**Document {j+1}:**") + report.append(f"> {doc_content}") + report.append("") + if i < len(retrievals) - 1: + report.append("---") + if graph_mermaid: + report.append("## Search Graph") + report.append("```mermaid") + report.append(graph_mermaid) + report.append("```") + report.append("") + with open(report_path, "w", encoding="utf-8") as handle: + handle.write("\n\n".join(report)) + return report_path + + # Implement abstract run function + # callback dispatcher + async def run(self, **kwargs) -> Any: + if "cbtype" in kwargs: + if kwargs["cbtype"] == CallbackType.RUNAGENT: + request = kwargs["chat_request"] + + log_status( + "🤿", + f"{format_terminal_str('Starting DeepSearch:', color='cyan', bold=True)} {format_terminal_str(request.messages, italic=True)}\n", + ) + state = DeepSearchState( + question=request.messages, + query="", + step=0, + num_retrievals=0, + answer="", + plan=[], + retrievals=[], + request=request, + ) + self._messages = await self._build_init_messages(request) + + async def async_gen(): + async for event, chunk in self.graph.astream(state, subgraphs=True, stream_mode="custom"): + yield chunk + await asyncio.sleep(0) + + # log_status("✅", format_terminal_str("DeepSearch process completed", color="cyan", bold=True)) + # result["conversation"] = [*self.conversation_history] + # result["graph_mermaid"] = self.graph.get_graph(xray=True).draw_mermaid() + return async_gen() diff --git a/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/logging_utils.py b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/logging_utils.py new file mode 100644 index 0000000000..bfa596dedb --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/logging_utils.py @@ -0,0 +1,74 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +"""Logging helpers for Mini Deep Search.""" + +import logging +import os +from typing import List + +_LOGGER_NAME = "deep_search" + + +def _configure_logger() -> logging.Logger: + logger = logging.getLogger(_LOGGER_NAME) + if logger.handlers: + return logger + + logger.setLevel(logging.INFO) + console_handler = logging.StreamHandler() + console_handler.setLevel(logging.INFO) + formatter = logging.Formatter("[%(asctime)s] %(message)s", datefmt="%H:%M:%S") + console_handler.setFormatter(formatter) + logger.addHandler(console_handler) + return logger + + +LOGGER = _configure_logger() + + +def log_status(emoji: str, message: str, indent: int = 0) -> None: + """Emit a formatted status message with optional indent.""" + indent_str = " " * indent + LOGGER.info("%s%s %s", indent_str, emoji, message) + + +def format_terminal_str(text: str, color: str = "", bold: bool = False, italic: bool = False) -> str: + """Format ``text`` with ANSI colours, bold or italics.""" + if text is None: + text = "" + + if os.environ.get("NO_COLOR"): + return text + + color_map = { + "black": 30, + "red": 31, + "green": 32, + "yellow": 33, + "blue": 34, + "magenta": 35, + "cyan": 36, + "white": 37, + "bright_black": 90, + "bright_red": 91, + "bright_green": 92, + "bright_yellow": 93, + "bright_blue": 94, + "bright_magenta": 95, + "bright_cyan": 96, + "bright_white": 97, + } + + style_seq: List[str] = [] + if color and color.lower() in color_map: + style_seq.append(str(color_map[color.lower()])) + if bold: + style_seq.append("1") + if italic: + style_seq.append("3") + + if not style_seq: + return text + + prefix = f"\033[{';'.join(style_seq)}m" + return 
f"{prefix}{text}\033[0m" diff --git a/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/postproc_jqa.py b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/postproc_jqa.py new file mode 100644 index 0000000000..4a0939a2ee --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/postproc_jqa.py @@ -0,0 +1,36 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +import json_repair +from mini_deep_search.logging_utils import format_terminal_str, log_status + + +def postproc_query(response_text, state): + """ + load query for retrieval and rerank from a predefined JSON: + { + "keywords": "keywords for retrieval", + "query": "query for rerank" + } + """ + # Default use the raw response text as the query for both retrieval and rerank + try: + # Attempt to parse the response text as JSON + parsed_json = json_repair.loads(response_text) + keywords_str = parsed_json.get("keywords", "") + query_str = parsed_json.get("query", "") + log_status( + "🧲", + f"{format_terminal_str('Keywords for retrieval:', color='magenta')} {format_terminal_str(keywords_str, italic=True)}", + ) + log_status( + "🔮", + f"{format_terminal_str('Query for reranking:', color='magenta')} {format_terminal_str(query_str, italic=True)}", + ) + except Exception as e: + # If parsing fails, return the original response text + print("Failed to parse JSON, returning original response text.") + print(e) + return response_text, response_text + # return keywords_str, query_str + return f"{state.question}\n{state.step}\n{keywords_str}", f"{query_str}" diff --git a/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/postprocessing.py b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/postprocessing.py new file mode 100644 index 0000000000..e48e3a61c6 --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/postprocessing.py @@ -0,0 +1,135 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +"""Default post-processing logic for Mini Deep Search.""" + +from __future__ import annotations + +import re +from typing import List, Optional, Tuple + +import json_repair + +from .logging_utils import format_terminal_str, log_status + + +def _merge_plan_steps(plan: List[str], max_steps: int) -> List[str]: + """Merge plan steps if the generated plan exceeds ``max_steps``.""" + if len(plan) <= max_steps: + return plan + + merged_plan: List[str] = [] + steps_per_group = len(plan) // max_steps + extra_steps = len(plan) % max_steps + index = 0 + for i in range(max_steps): + group_size = steps_per_group + 1 if i < extra_steps else steps_per_group + if index < len(plan): + merged_plan.append(" ".join(plan[index : index + group_size])) + index += group_size + log_status( + "✨", + format_terminal_str( + f"Merged plan from {len(plan)} steps to {len(merged_plan)} steps.", + color="yellow", + bold=True, + ), + ) + return merged_plan + + +def _extract_pattern_and_text(line: str) -> Optional[Tuple[str, int, str]]: + match = re.match(r"^(.*?)(\d+)(.*)", line) + if match: + prefix, digit_str, text = match.groups() + if text.strip(): + return prefix, int(digit_str), text.strip() + return None + + +def parse_plan_from_text(text_content: str) -> List[str]: + """Parse a block of text to extract a numbered plan.""" + lines = text_content.splitlines() + longest_plan: List[str] = [] + for i, start_line in enumerate(lines): + processed_line = start_line.strip() + if processed_line.lower().startswith("step"): + processed_line = re.sub(r"^step\s*[:\-\s#]*", 
"", processed_line, flags=re.IGNORECASE) + pattern_info = _extract_pattern_and_text(processed_line) + if not pattern_info: + continue + prefix, digit, text = pattern_info + if digit not in (0, 1): + continue + current_plan = [text] + expected_digit = digit + 1 + for next_line in lines[i + 1 :]: + processed_next_line = next_line.strip() + if processed_next_line.lower().startswith("step"): + processed_next_line = re.sub(r"^step\s*[:\-\s#]*", "", processed_next_line, flags=re.IGNORECASE) + expected_pattern = re.match(f"^{re.escape(prefix)}{expected_digit}(.*)", processed_next_line) + if not expected_pattern: + break + next_text = expected_pattern.group(1).strip() + if not next_text: + break + current_plan.append(next_text) + expected_digit += 1 + if len(current_plan) > len(longest_plan): + longest_plan = current_plan + return [step.lstrip(" .:-") for step in longest_plan] + + +def postproc_plan(text: str, state, cfg) -> List[str]: # type: ignore[valid-type] + try: + plan = json_repair.loads(text) + if not plan: + try: + plan = parse_plan_from_text(text) + except Exception as exc: # pragma: no cover - defensive logging only + log_status( + "⚠️", + format_terminal_str( + f"Error parsing plan from text: {exc}. Using question as single step plan", + color="red", + bold=True, + ), + ) + plan = None + elif any(not isinstance(step, str) for step in plan): + new_plan = [] + for step in plan: + if isinstance(step, str): + new_plan.append(step) + elif isinstance(step, dict) and "step" in step: + new_plan.append(step["step"]) + elif isinstance(step, list) and all(isinstance(s, str) for s in step): + new_plan.extend(step) + else: + log_status("⚠️", f"Invalid step format: {step}. Using as-is.") + new_plan.append(str(step)) + plan = new_plan + log_status( + "✨", + format_terminal_str(f"Plan created with {len(plan)} steps.", color="cyan", bold=True), + ) + except Exception as exc: # pragma: no cover - defensive logging only + log_status( + "⚠️", + format_terminal_str( + f"Error evaluating plan: {exc}. 
Using question as single step plan", + color="red", + bold=True, + ), + ) + plan = None + plan = plan or [state.question] + return _merge_plan_steps(plan, cfg.max_plan_steps) + + +def postproc_query(text: str, state): # type: ignore[valid-type] + log_status("💡", f"{format_terminal_str('Query generated:', color='cyan', bold=True)} '{text}'") + return text, text + + +def postproc_answer(text: str, state): # type: ignore[valid-type] + return text diff --git a/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/utils.py b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/utils.py new file mode 100644 index 0000000000..964be4cf13 --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/agents/deep_search/utils.py @@ -0,0 +1,45 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +"""Internal helper utilities for Mini Deep Search.""" + +from __future__ import annotations + +import importlib.util +import os +import re +import sys +from enum import Enum +from typing import Optional + + +class Role(str, Enum): + SYSTEM = "system" + ASSISTANT = "assistant" + USER = "user" + + +def import_module_from_path(file_path: str): + """Import and return a Python module from the given path.""" + if not os.path.isfile(file_path): + raise ImportError(f"File not found: {file_path}") + + module_name = os.path.splitext(os.path.basename(file_path))[0] + spec = importlib.util.spec_from_file_location(module_name, file_path) + if spec is None: + raise ImportError(f"Failed to create spec for: {file_path}") + + module = importlib.util.module_from_spec(spec) + sys.modules[module_name] = module + try: + if spec.loader is None: + raise ImportError(f"Module loader missing for: {file_path}") + spec.loader.exec_module(module) + except Exception as exc: # pragma: no cover - propagates import errors + raise ImportError(f"Error executing module {module_name}: {exc}") from exc + return module + + +def remove_tagged(text: str, tag: str = "think") -> str: + """Remove sections wrapped in a custom tag from ``text``.""" + pattern = f"<{tag}>.*?" + return re.sub(pattern, "", text, flags=re.DOTALL).strip() diff --git a/EdgeCraftRAG/edgecraftrag/components/agents/simple.py b/EdgeCraftRAG/edgecraftrag/components/agents/simple.py new file mode 100644 index 0000000000..722bd3acda --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/agents/simple.py @@ -0,0 +1,274 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +import asyncio +from typing import Any, List + +from comps.cores.proto.api_protocol import ChatCompletionRequest +from edgecraftrag.base import AgentType, CallbackType, CompType +from edgecraftrag.components.agent import Agent, stream_writer +from edgecraftrag.components.agents.utils import ROLE, format_terminal_str +from langgraph.graph import END, START, StateGraph +from pydantic import BaseModel, Field + + +class Retrieval(BaseModel): + step: int + query: str + retrieved: List[Any] = Field(...) + reranked: List[Any] = Field(...) 
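+
+# NOTE: QnaState is the trimmed-down state for the simple RAG flow: the graph loops
+# generate_query -> retrieve until the LLM judges the retrieved context sufficient or
+# max_retrievals is reached, then generates the final answer.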
+ + +class QnaState(BaseModel): + question: str + query: str + num_retrievals: int + answer: str + + retrievals: List[Retrieval] = Field(default_factory=list) + context_chunk_ids: List[str] = Field(default_factory=list) + request: ChatCompletionRequest + + +class SimpleRAGAgent(Agent): + + def __init__(self, idx, name, pipeline_idx, cfg): + super().__init__(name=name, agent_type=AgentType.SIMPLE, pipeline_idx=pipeline_idx, configs=cfg) + self.graph = self._build_graph() + self._messages = [] + self.conversation_history = [] + if idx is not None: + self.idx = idx + if "max_retrievals" in cfg: + self.max_retrievals = int(cfg["max_retrievals"]) + else: + self.max_retrievals = 3 + self.postproc_query = postproc_query + self.postproc_answer = postproc_answer + + @classmethod + def get_default_configs(cls): + return {"max_retrievals": 3} + + def update(self, cfg): + max_r = cfg.get("max_retrievals", None) + if max_r and isinstance(max_r, int): + self.max_retrievals = int(max_r) + self.configs["max_retrievals"] = self.max_retrievals + return True + else: + return False + + def _build_graph(self): + + qnagraph = StateGraph(QnaState) + qnagraph.add_node("generate_query", self.generate_query) + qnagraph.add_node("retrieve", self.retrieve) + qnagraph.add_node("final_answer", self.generate_answer) + + qnagraph.add_edge(START, "generate_query") + qnagraph.add_edge("generate_query", "retrieve") + qnagraph.add_conditional_edges( + "retrieve", self.check_retrieved, {"stop": "final_answer", "continue": "generate_query"} + ) + qnagraph.add_edge("final_answer", END) + + return qnagraph.compile() + + async def retrieve(self, state: QnaState) -> dict: + # print(f"State Retrieve {state}") + request = state.request + request.messages = state.query + contexts = await self.run_pipeline_retrieve_and_rerank(request) + + retrieved = contexts[CompType.RETRIEVER] + reranked = contexts[CompType.POSTPROCESSOR] + print( + "🔍", + f"Retrieved {format_terminal_str(str(len(retrieved)), color='magenta', bold=True)} documents, Reranked to top {format_terminal_str(str(len(reranked)), color='magenta', bold=True)}.", + ) + await stream_writer( + f"\n\n🔍 **Retrieved {str(len(retrieved))} documents, Reranked to top {str(len(reranked))}**\n\n" + ) + + new_retrieval = Retrieval(step=state.num_retrievals, query=state.query, retrieved=retrieved, reranked=reranked) + return { + "num_retrievals": state.num_retrievals + 1, + "retrievals": [*state.retrievals, new_retrieval], + } + + async def generate_query(self, state: QnaState) -> dict: + # print(f"State generate_query {state}") + await stream_writer('') + + messages = [ + {"role": ROLE.USER, "content": state.question}, + {"role": ROLE.SYSTEM, "content": PROMPT_TEMPLATE.GENERATE_QUERY}, + ] + self._messages.extend(messages) + self.conversation_history.extend(messages) + + response = await self.llm_generate_astream_writer(state.request) + + message = {"role": ROLE.ASSISTANT, "content": response} + self._messages.append(message) + self.conversation_history.append(message) + return { + "query": response, + } + + async def check_retrieved(self, state: QnaState) -> str: + # print(f"State check_retrieved {state}") + print("🤔", format_terminal_str("Evaluating if more information is needed", color="green")) + await stream_writer("🤔 **Evaluating if more information is needed...**\n\n") + + # Format context for the next decision + contexts = PROMPT_TEMPLATE.CONTEXTS.format( + contexts="\n".join( + [PROMPT_TEMPLATE.CONTEXT.format(context=doc.text) for doc in state.retrievals[-1].reranked] + ) + ) + 
messages = [ + {"role": ROLE.SYSTEM, "content": contexts}, + {"role": ROLE.SYSTEM, "content": PROMPT_TEMPLATE.CONTINUE}, + ] + self._messages.extend(messages) + self.conversation_history.extend(messages) + if state.num_retrievals >= self.max_retrievals: + print( + "⚠️", + format_terminal_str( + f"Reached maximum retrievals: {self.max_retrievals}, stopping search\n", color="yellow", bold=True + ), + ) + await stream_writer( + f"\n\n⚠️ **Reached maximum retrievals: {self.max_retrievals}, stopping searching...**\n\n" + ) + return "stop" + else: + response = await self.llm_generate_astream_writer(state.request) + message = {"role": ROLE.ASSISTANT, "content": response} + self._messages.append(message) + self.conversation_history.append(message) + if response.upper().startswith("NO"): + print("✅", format_terminal_str("Information is sufficient, moving to next step\n", color="green")) + await stream_writer("\n\n✅ **Information is sufficient, moving to next step...**\n\n") + return "stop" + else: + print("🔄", format_terminal_str("Need more information, generating new query ...", color="green")) + await stream_writer("\n\n🔄 **Need more information, generating new query...**\n\n") + return "continue" + + async def generate_answer(self, state: QnaState) -> dict: + # print(f"State generate_answer {state}") + print("📝", format_terminal_str("Generating the final answer ...", color="cyan", bold=True)) + await stream_writer('') + plan_with_information = "" + prev_step = "" + for i, r in enumerate(state.retrievals): + if r.step != prev_step: + plan_with_information += f"Step {i+1}\n\nRetrieved:\n" + for doc in r.reranked: + plan_with_information += doc.text + "\n" + plan_with_information += "\n" + prev_step = r.step + + self._messages = [ + { + "role": ROLE.SYSTEM, + "content": answer_instruction.format( + question=state.question, plan_with_information=plan_with_information + ), + } + ] + self.conversation_history.extend(self._messages) + + response = await self.llm_generate_astream_writer(state.request) + + self.conversation_history.append({"role": ROLE.ASSISTANT, "content": response}) + answer = self.postproc_answer(response, state) + title_str = format_terminal_str("Final Answer:", color="blue", bold=True) + print( + "✅", + format_terminal_str( + f"{title_str}\n{format_terminal_str(answer, italic=True, bold=True)}", color="blue", bold=True + ), + ) + return {"answer": answer} + + # Implement abstract run function + # callback dispatcher + async def run(self, **kwargs) -> Any: + if "cbtype" in kwargs: + if kwargs["cbtype"] == CallbackType.RUNAGENT: + request = kwargs["chat_request"] + + print( + "🤿", + f"{format_terminal_str('Starting DeepSearch:', color='cyan', bold=True)} {format_terminal_str(request.messages, bold=False, italic=True)}\n", + ) + # Initialize state + state = QnaState( + question=request.messages, query="", num_retrievals=0, answer="", retrievals=[], request=request + ) + self._messages = self._build_init_messages(request.messages) + + async def async_gen(): + async for chunk in self.graph.astream(state, stream_mode="custom"): + yield chunk + await asyncio.sleep(0) + + print("✅", format_terminal_str("RAG process completed", color="cyan", bold=True)) + return async_gen() + + def _build_init_messages(self, question) -> List[dict]: + return [ + { + "role": ROLE.SYSTEM, + "content": PROMPT_TEMPLATE.SYSTEM.format( + system_instruction=system_instruction, + query_instruction=query_instruction, + domain_knowledge="", + ), + } + ] + + +def postproc_query(text, state): + """Default post-process 
the response text generated for new query. + + This function is a placeholder for any specific post-processing logic needed. + The returned values are a tuple of (retrieval_query, rerank_query). + """ + print("💡", f"{format_terminal_str('Query generated:', color='cyan', bold=True)} '{text}'") + # Default use the raw response text as the query for both retrieval and rerank + return text, text + + +def postproc_answer(text, state): + return text + + +system_instruction = "You will be provided with a question from a user, and you need to create queries and execute them based on the question for the final answer.\nYou should only use the information provided in the search results to answer the user's question. \nMake your response in the same language as the user's question./no_think" +query_instruction = 'Every time when asked if more information is needed, check the retrieved contexts and try to identify new content that is related. Then based on what you get and all above, decide if a new query is needed to gather more potential useful information. The query should be a very concise and clear sub-question that is specific to the user\'s question. A good query should include all the related actions or keywords that can help to retrieve the most related context. Response with the query directly.\nDO NOT use any prefix, such as "Query:"/no_think' +answer_instruction = "You have been provided with a question from user:\n{question}\n\nThe following are the plan steps you generated and the corresponding retrieved information:{plan_with_information}\n\nBased on the above, come up with a final answer for the user's question. Format the answer as a list of steps that can guide the user to solve the problem./no_think" + + +class PROMPT_TEMPLATE: + # only contain formatting related instructions here + + SYSTEM = """{system_instruction} + +{query_instruction} + +{domain_knowledge} + +""" + GENERATE_QUERY = "Now generate a query for the next retrieval." + + CONTEXT = """\n{context}\n\n""" + CONTEXTS = """The following are the retrieved contexts for current query.\n{contexts}\n""" + + CONTINUE = "Is more information needed? Answer Yes or No. Then explain why or why not." + + EXPERIENCES = """The following are question-plan examples by human experts. Refer to them to better make your plan. 
If you find that there is a question that is highly similar or exactly match the input question, then strictly follow the subquestions to make the plan.\n\n{experiences}\n""" diff --git a/EdgeCraftRAG/edgecraftrag/components/agents/utils.py b/EdgeCraftRAG/edgecraftrag/components/agents/utils.py new file mode 100644 index 0000000000..e96c2af9da --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/agents/utils.py @@ -0,0 +1,401 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 +import asyncio +import importlib.util +import json +import logging +import os +import re +import sys +from typing import Any, Dict, List, Optional, Tuple, Union + +import numpy +from pydantic import BaseModel + +# from wrapped_atomic_apis import call_logits_next_token + +# Configure logging +logger = logging.getLogger("deep_search") +logger.setLevel(logging.INFO) + +# Create console handler with a formatter that includes timestamps and emojis +if not logger.handlers: + console_handler = logging.StreamHandler() + console_handler.setLevel(logging.INFO) + # Format: [YYYY-MM-DD HH:MM:SS] Message with emoji + formatter = logging.Formatter("[%(asctime)s] %(message)s", datefmt="%Y-%m-%d %H:%M:%S") + formatter = logging.Formatter("[%(asctime)s] %(message)s", datefmt="%H:%M:%S") + console_handler.setFormatter(formatter) + logger.addHandler(console_handler) + + +def log_status(emoji: str, message: str, indent: int = 0) -> None: + """Log a formatted status message with emoji indicator using Python's logging module. + + Args: + emoji: Emoji character to prepend to the message + message: The message text to log + indent: Number of indentation levels (2 spaces each) + """ + indent_str = " " * indent + logger.info(f"{indent_str}{emoji} {message}") + + +class Config(BaseModel): + system_instruction: str + plan_instruction: str = "" + query_instruction: str + answer_instruction: str + domain_knowledge: str + retrieve_top_k: int + rerank_top_k: int + max_retrievals: int + max_plan_steps: int = 7 + embedding_endpoint: str + reranker_endpoint: str + llm_endpoint: str + query_search_endpoint: str = "" + generation_config: Dict[str, Any] = {} + postproc: str = "defaults.py" + + +def import_module_from_path(file_path: str): + """Import a module from a full file path. + + Args: + file_path: Full path to the Python file to import + + Returns: + The imported module + + Raises: + ImportError: If the module cannot be imported + """ + if not os.path.isfile(file_path): + raise ImportError(f"File not found: {file_path}") + + # Get the module name (filename without extension) + module_name = os.path.splitext(os.path.basename(file_path))[0] + + # Create the spec + spec = importlib.util.spec_from_file_location(module_name, file_path) + if spec is None: + raise ImportError(f"Failed to create spec for: {file_path}") + + # Create the module + module = importlib.util.module_from_spec(spec) + + # Add the module to sys.modules + sys.modules[module_name] = module + + # Execute the module + try: + spec.loader.exec_module(module) + except Exception as e: + raise ImportError(f"Error executing module {module_name}: {e}") + + return module + + +def load_config(config_path: str) -> Config: + """Load configuration from a JSON file. 
+ + Args: + config_path: Path to the configuration JSON file + + Returns: + Config object with loaded configuration + """ + with open(config_path, "r") as f: + config_dict = json.load(f) + cfg = Config(**config_dict) + if os.path.isfile(cfg.domain_knowledge): + with open(cfg.domain_knowledge, "r") as f: + cfg.domain_knowledge = f.read() + return cfg + + +class ROLE: + SYSTEM = "system" + ASSISTANT = "assistant" + USER = "user" + + +def remove_tagged(text, tag="think"): + pattern = f"<{tag}>.*?" + return re.sub(pattern, "", text, flags=re.DOTALL).strip() + + +def _extract_pattern_and_text(line: str) -> Optional[Tuple[str, int, str, str]]: + """Checks if a line matches the pattern [prefix][digit][suffix][text]. + + Args: + line: The line to check. + + Returns: + A tuple of (prefix, digit, suffix, step_text) if a match is found, + otherwise None. + - prefix: Characters before the digit (e.g., " "). Can be empty. + - digit: The integer value of the digit. + - suffix: The separator characters after the digit (e.g., ". "). + - step_text: The actual description of the step. + """ + # Pattern: Start, any prefix (non-greedy), a digit, a suffix of non-digits, + # and the rest of the line as text. + # The suffix (\D+) is followed by (.*) which will grab the text. + # This structure correctly separates the separator from the text. + match = re.match(r"^(.*?)(\d+)(.*)", line) + if match: + prefix, digit_str, text = match.groups() + # We require actual text for it to be a valid step + if text.strip(): + return prefix, int(digit_str), text.strip() + return None + + +def parse_plan_from_text(text_content: str) -> List[str]: + """Parses a block of text to extract a list of plan steps by finding a + consecutive sequence of numbered lines. + + Args: + text_content: A string containing the plan. + + Returns: + A list of strings, where each string is a single plan step. + """ + lines = text_content.splitlines() + longest_plan = [] + + # Iterate through each line, treating it as a potential start of a plan + for i, start_line in enumerate(lines): + + # 1. Pre-process the line + processed_line = start_line.strip() + if processed_line.lower().startswith("step"): + # Remove "step" and any space/punctuation immediately after + processed_line = re.sub(r"^step\s*[:\-\s#]*", "", processed_line, flags=re.IGNORECASE) + + # 2. Check if it matches the generic pattern and starts with 0 or 1 + pattern_info = _extract_pattern_and_text(processed_line) + if pattern_info: + prefix, digit, text = pattern_info + + # Allow multi-digit numbers but only start a plan on 0 or 1 + if digit in [0, 1]: + current_plan = [text] + expected_digit = digit + 1 + + # 3. 
If it's a valid start, check subsequent lines for the same pattern + for next_line in lines[i + 1 :]: + + # Pre-process the next line similarly + processed_next_line = next_line.strip() + if processed_next_line.lower().startswith("step"): + processed_next_line = re.sub(r"^step\s*[:\-\s#]*", "", processed_next_line, flags=re.IGNORECASE) + + # Check if the next line matches the *exact* pattern with the next number + # We escape prefix/suffix in case they contain special regex characters + expected_pattern = re.match(f"^{re.escape(prefix)}{expected_digit}(.*)", processed_next_line) + + if expected_pattern: + next_text = expected_pattern.group(1).strip() + if next_text: # Ensure the step is not empty + current_plan.append(next_text) + expected_digit += 1 + else: + break # Empty step text breaks sequence + else: + # The consecutive sequence is broken + break + + # If the plan we just found is the longest so far, save it + if len(current_plan) > len(longest_plan): + longest_plan = current_plan + longest_plan = [_.lstrip(" .:-") for _ in longest_plan] + return longest_plan + + +def format_terminal_str(text: str, color: str = "", bold: bool = False, italic: bool = False) -> str: + """Format a string with ANSI escape codes for color, bold, and italic. + + Args: + text: The text to format. + color: The color name (e.g., 'red', 'green', 'blue'). + bold: Whether to apply bold formatting. + italic: Whether to apply italic formatting. + + Returns: + The formatted string with ANSI codes. + + Notes: + - If the environment variable NO_COLOR is set (per https://no-color.org/), + the function returns the original text without styling. + - Unsupported color names are ignored (text returned with other + requested styles, if any). + - Color names are case-insensitive. Both standard and bright variants + are supported (e.g., 'red', 'bright_red'). + """ + if text is None: + text = "" + + # Honor NO_COLOR convention + if os.environ.get("NO_COLOR"): + return text + + color_lower = color.lower() + + # Standard and bright ANSI color codes + color_map = { + "black": 30, + "red": 31, + "green": 32, + "yellow": 33, + "blue": 34, + "magenta": 35, + "cyan": 36, + "white": 37, + "bright_black": 90, + "bright_red": 91, + "bright_green": 92, + "bright_yellow": 93, + "bright_blue": 94, + "bright_magenta": 95, + "bright_cyan": 96, + "bright_white": 97, + } + + style_seq: List[str] = [] + + # Add color if valid + if color_lower in color_map: + style_seq.append(str(color_map[color_lower])) + + # Bold and italic attributes + if bold: + style_seq.append("1") + if italic: + style_seq.append("3") + + # If no styling requested or recognized, return original text + if not style_seq: + return text + + prefix = f"\033[{';'.join(style_seq)}m" + suffix = "\033[0m" + return f"{prefix}{text}{suffix}" + + +_DEFAULT_TEMPLATE_MESSAGES = [ + { + "role": "system", + "content": """You are an impartial quality rater for TCB Bonder troubleshooting answers. Your task is to rate if the answer by user well covers the steps in the reference answer. + +Task instructions: +- Parse the reference answer into its essential checkpoints (split on punctuation such as "?", ";", or line breaks) and understand what each step expects the technician to do or verify. The order of the checkpoints has low importance. +- Examine the user's answer and decide if each checkpoint is substantively addressed with accurate, actionable guidance. +- Treat synonymous language or additional helpful context as a match when it fulfills the intent of the checkpoint. 
+- Mark a checkpoint as uncovered if the user's answer omits it, contradicts it, or gives incorrect or unsafe guidance. +- Ignore extra steps that do not conflict with the reference; they should not reduce the score. +- The mismatch of the step number between user's answer and reference answer does not matter, as long as all the content is well covered. +- Keep all reasoning internal; do not expose the intermediate analysis in the final reply. +- Focus solely on the provided texts. Do not rely on your knowledge. + +The following are domain terms you may refer to: +BFS: Bulk feed system +BH: Bondhead +BS: Bond stage/Bond pedestal +CAH: Carrier handler +COG: Chrome on glass +COS: Cover opening station +COT: Change over trolley +DCP: Data collection plan +DFH: Die feed handler +DL: Down-look +DPA: Die pick arm +DTA: Die transfer arm +FOV: Field of view +HW: Highway +MBH: Media buffer handler +MHS: Material Handling System +NCF: No clean flux +OT: Optics table +PFLU: Power feeder loading unit +PHS: Pre/Post heat station +PR: Pattern recognition +SC: Station controller +BLPCS: Bond line process control system +""", + }, + { + "role": "user", + "content": """User's answer: +{llm_answer} + +Reference answer: +{ref_answer} +""", + "template_message": True, + }, + { + "role": "system", + "content": """Does the user's answer well cover the steps in the reference answer? Yes or No. + +Scoring rubric: +- Answer "Yes" only when every checkpoint from the reference is fully covered and nothing in the user's answer conflicts with the reference guidance. +- Answer "No" if any checkpoint is missing, incorrectly addressed, or contradicted by the user's answer. +""", + }, + {"role": "assistant", "content": '{"label": "'}, +] +DEFAULT_TARGET_TOKENS = ["No", "Yes"] +DEFAULT_TRANSFORM_PARAMS = (5, -1, 10) # a, b, T + + +def batch_cal_score(x, a=1.0, b=0.0, T=1.0, s=10): + _, d = x.shape + levels = numpy.arange(d)[None,] / (d - 1) + transformed = numpy.exp(x / T) + probs = transformed / transformed.sum(axis=1, keepdims=True) + expected_levels = (probs * levels).sum(axis=1) + scores = a * expected_levels + b + return s * numpy.tanh(scores) + + +def llm_evaluate( + ref_answer, + llm_answer, + eval_endpoint, + template_messages=_DEFAULT_TEMPLATE_MESSAGES, + target_tokens=DEFAULT_TARGET_TOKENS, + transform_params=DEFAULT_TRANSFORM_PARAMS, + return_logits=False, +) -> Union[float, List[float]]: + messages = [ + ( + message + if not message.get("template_message") + else { + "role": message["role"], + "content": message["content"].format(ref_answer=ref_answer, llm_answer=llm_answer), + } + ) + for message in template_messages + ] + # result_json = call_logits_next_token( + # endpoint=eval_endpoint, + # messages=messages, + # target_tokens=target_tokens + # ) + result_json = "" + raw_logits = {_["token"]: _["logit"] for _ in result_json["target_token_logits"]} + raw_logits = [raw_logits[k] for k in target_tokens] + if return_logits: + return raw_logits + else: + score = batch_cal_score(numpy.array(raw_logits)[None,], *transform_params)[0] + return score + + +def remove_think_tags(text: str) -> str: + """Remove ... 
sections from Qwen3 output.""" + return re.sub(r".*?", "", text, flags=re.DOTALL).strip() diff --git a/EdgeCraftRAG/edgecraftrag/components/benchmark.py b/EdgeCraftRAG/edgecraftrag/components/benchmark.py index fc3801b5d3..3bf2a7e602 100644 --- a/EdgeCraftRAG/edgecraftrag/components/benchmark.py +++ b/EdgeCraftRAG/edgecraftrag/components/benchmark.py @@ -49,7 +49,14 @@ def cal_input_token_size(self, input_text_list): return input_token_size def init_benchmark_data(self): - pipeline_comp = [CompType.RETRIEVER, CompType.POSTPROCESSOR, CompType.GENERATOR] + pipeline_comp = [ + CompType.NODEPARSER, + CompType.CHUNK_NUM, + CompType.RETRIEVER, + CompType.POSTPROCESSOR, + CompType.QUERYSEARCH, + CompType.GENERATOR, + ] if self.is_enabled(): with self._idx_lock: self.last_idx += 1 @@ -58,6 +65,8 @@ def init_benchmark_data(self): data["idx"] = idx for comp in pipeline_comp: data[comp] = "" + data[CompType.NODEPARSER] = 0 + data[CompType.CHUNK_NUM] = 0 return idx, data def update_benchmark_data(self, idx, comp_type, start, end): diff --git a/EdgeCraftRAG/edgecraftrag/components/data.py b/EdgeCraftRAG/edgecraftrag/components/data.py old mode 100755 new mode 100644 diff --git a/EdgeCraftRAG/edgecraftrag/components/generator.py b/EdgeCraftRAG/edgecraftrag/components/generator.py old mode 100755 new mode 100644 index cb170fcd10..fe5974e71f --- a/EdgeCraftRAG/edgecraftrag/components/generator.py +++ b/EdgeCraftRAG/edgecraftrag/components/generator.py @@ -2,16 +2,16 @@ # SPDX-License-Identifier: Apache-2.0 import asyncio -import dataclasses import json import os import urllib.request +from concurrent.futures import ThreadPoolExecutor from urllib.parse import urlparse +from comps.cores.proto.api_protocol import ChatCompletionRequest from edgecraftrag.base import BaseComponent, CompType, GeneratorType, InferenceType, NodeParserType -from edgecraftrag.utils import concat_history, get_prompt_template, save_history +from edgecraftrag.utils import get_prompt_template from fastapi.responses import StreamingResponse -from langchain_core.prompts import PromptTemplate from llama_index.llms.openai_like import OpenAILike from pydantic import model_serializer from unstructured.staging.base import elements_from_base64_gzipped_json @@ -44,11 +44,11 @@ def extract_unstructured_eles(retrieved_nodes=[], text_gen_context=""): continue metadata = node.node.metadata # extract referenced docs - if "filename" in metadata: + if "file_name" in metadata: reference_doc = ( - metadata["filename"] + metadata["file_name"] if "page_number" not in metadata - else metadata["filename"] + " --page" + str(metadata["page_number"]) + else metadata["file_name"] + " --page" + str(metadata["page_number"]) ) reference_docs.add(reference_doc) # extract hyperlinks in chunk @@ -69,48 +69,52 @@ def extract_unstructured_eles(retrieved_nodes=[], text_gen_context=""): # extract hyperlinks in chunk link_urls.extend(extract_urls(text_gen_context)) unstructured_str = "" - if image_paths: - unstructured_str += "\n\n参考图片:\n\n" - for image_path in image_paths: - unstructured_str += f"![]({image_path})" - if link_urls: - unstructured_str += "\n\n相关链接:\n\n" - for link in link_urls: - unstructured_str += f"[{link}]({link})\n\n" if reference_docs: - unstructured_str += "\n\n内容来源:\n\n" + unstructured_str += "\n\n --- \n\n### Document Source:\n" for reference_doc in reference_docs: - unstructured_str += f"{reference_doc}\n\n" + unstructured_str += f"- {reference_doc}\n\n" return unstructured_str +def build_stream_response(status=None, content=None, error=None): + 
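+    """Build a status/content/error payload dict for stream responses (contentType is always "text")."""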
response = {"status": status, "contentType": "text"} + if content is not None: + response["content"] = content + if error is not None: + response["error"] = error + return response + + async def local_stream_generator(lock, llm, prompt_str, unstructured_str): async with lock: - response = llm.stream_complete(prompt_str) - collected_data = [] - for r in response: - collected_data.append(r.delta) - yield r.delta - await asyncio.sleep(0) - if unstructured_str: - collected_data.append(unstructured_str) - yield unstructured_str - res = "".join(collected_data) - save_history(res) + response = await llm.astream_complete(prompt_str) + try: + async for r in response: + yield r.delta or "" + await asyncio.sleep(0) + if unstructured_str: + yield unstructured_str + except Exception as e: + start_idx = str(e).find("message") + len("message") + result_error = str(e)[start_idx:] + yield f"code:0000{result_error}" async def stream_generator(llm, prompt_str, unstructured_str): - response = llm.stream_complete(prompt_str) - collected_data = [] - for r in response: - collected_data.append(r.delta) - yield r.delta - await asyncio.sleep(0) - if unstructured_str: - collected_data.append(unstructured_str) - yield unstructured_str - res = "".join(collected_data) - save_history(res) + response = await llm.astream_complete(prompt_str) + try: + async for r in response: + yield r.delta or "" + await asyncio.sleep(0) + if unstructured_str: + yield unstructured_str + await asyncio.sleep(0) + except asyncio.CancelledError as e: + response.aclose() + except Exception as e: + start_idx = str(e).find("message") + len("message") + result_error = str(e)[start_idx:] + yield f"code:0000{result_error}" class QnAGenerator(BaseComponent): @@ -127,22 +131,25 @@ def __init__(self, llm_model, prompt_template_file, inference_type, vllm_endpoin ("\t\n", "\n"), ) self.enable_think = False - self.llm = llm_model - if isinstance(llm_model, str): - self.model_id = llm_model - else: - self.model_id = llm_model().model_id - if self.inference_type == InferenceType.LOCAL: - self.lock = asyncio.Lock() + self.enable_rag_retrieval = True self.prompt_content = prompt_content self.prompt_template_file = prompt_template_file - self.prompt = self.init_prompt(self.model_id, self.prompt_content, self.prompt_template_file) - - self.llm = llm_model if isinstance(llm_model, str): self.model_id = llm_model + self.model_path = llm_model else: - self.model_id = llm_model().model_id + llm_instance = llm_model() + if llm_instance.model_path is None or llm_instance.model_path == "": + self.model_id = llm_instance.model_id + self.model_path = os.path.join("/home/user/models", os.getenv("LLM_MODEL", "Qwen/Qwen3-8B")) + else: + self.model_id = llm_instance.model_id + self.model_path = llm_instance.model_path + self.original_template, self.prompt = self.prompt_handler( + self.model_path, self.prompt_content, self.prompt_template_file + ) + + self.llm = llm_model if self.inference_type == InferenceType.LOCAL: self.lock = asyncio.Lock() if self.inference_type == InferenceType.VLLM: @@ -151,45 +158,43 @@ def __init__(self, llm_model, prompt_template_file, inference_type, vllm_endpoin vllm_endpoint = os.getenv("vLLM_ENDPOINT", "http://localhost:8086") self.vllm_endpoint = vllm_endpoint - def init_prompt(self, model_id, prompt_content=None, prompt_template_file=None, enable_think=False): - # using the prompt template enhancement strategy(only tested on Qwen2-7B-Instruction) if template_enhance_on is true - template_enhance_on = True if "Qwen2" in self.model_id else 
False + def prompt_handler( + self, model_path, prompt_content=None, prompt_template_file=None, enable_think=False, enable_rag_retrieval=True + ): if prompt_content: - self.set_prompt(prompt_content) - return get_prompt_template(model_id, prompt_content, prompt_template_file, enable_think) + return get_prompt_template(model_path, prompt_content, prompt_template_file, enable_think) elif prompt_template_file is None: print("There is no template file, using the default template.") - prompt_template = get_prompt_template(model_id, prompt_content, prompt_template_file, enable_think) - return ( - DocumentedContextRagPromptTemplate.from_template(prompt_template) - if template_enhance_on - else prompt_template - ) + prompt_template = get_prompt_template(model_path, prompt_content, prompt_template_file, enable_think) + return prompt_template else: - safe_root = "/templates" + if enable_rag_retrieval: + safe_root = "/templates" + else: + prompt_content = "### User Guide ###You are a helpful assistant. Please respond to user inquiries with concise and professional answers.### Historical Content ###{chat_history}" + return get_prompt_template(model_path, prompt_content, prompt_template_file, enable_think) + prompt_template_file = os.path.normpath(os.path.join(safe_root, prompt_template_file)) if not prompt_template_file.startswith(safe_root): raise ValueError("Invalid template path") if not os.path.exists(prompt_template_file): raise ValueError("Template file not exists") - if template_enhance_on: - return DocumentedContextRagPromptTemplate.from_file(prompt_template_file) - else: - return get_prompt_template(model_id, prompt_content, prompt_template_file, enable_think) + return get_prompt_template(model_path, prompt_content, prompt_template_file, enable_think) def set_prompt(self, prompt): if "{context}" not in prompt: prompt += "\n<|im_start|>{context}<|im_end|>" if "{chat_history}" not in prompt: prompt += "\n<|im_start|>{chat_history}" - self.prompt = prompt + self.prompt_content = prompt + self.original_template, self.prompt = self.prompt_handler( + self.model_path, self.prompt_content, self.prompt_template_file + ) def reset_prompt(self): - prompt_template = get_prompt_template(self.model_id) - self.prompt = ( - DocumentedContextRagPromptTemplate.from_template(prompt_template) - if self.template_enhance_on - else prompt_template + self.prompt_content = None + self.original_template, self.prompt = self.prompt_handler( + self.model_path, self.prompt_content, self.prompt_template_file ) def clean_string(self, string): @@ -206,20 +211,30 @@ def query_transform(self, chat_request, retrieved_nodes, sub_questions=None): :return: Generated text_gen_context and prompt_str.""" text_gen_context = "" for n in retrieved_nodes: - origin_text = n.node.get_text() + origin_text = n.node.text text_gen_context += self.clean_string(origin_text.strip()) query = chat_request.messages - chat_history = concat_history(chat_request.messages) + chat_history = chat_request.input # Modify model think status if chat_request.chat_template_kwargs: - if self.enable_think != chat_request.chat_template_kwargs["enable_thinking"]: - self.prompt = self.init_prompt( - self.model_id, + change_flag = False + if "enable_rag_retrieval" in chat_request.chat_template_kwargs: + if self.enable_rag_retrieval != chat_request.chat_template_kwargs["enable_rag_retrieval"]: + self.enable_rag_retrieval = chat_request.chat_template_kwargs["enable_rag_retrieval"] + change_flag = True + if "enable_thinking" in chat_request.chat_template_kwargs: + if 
self.enable_think != chat_request.chat_template_kwargs["enable_thinking"]: + self.enable_think = chat_request.chat_template_kwargs["enable_thinking"] + change_flag = True + if change_flag: + self.original_template, self.prompt = self.prompt_handler( + self.model_path, self.prompt_content, self.prompt_template_file, - chat_request.chat_template_kwargs["enable_thinking"], + self.enable_think, + self.enable_rag_retrieval, ) - self.enable_think = chat_request.chat_template_kwargs["enable_thinking"] + if sub_questions: final_query = f"{query}\n\n### Sub-questions ###\nThe following list is how you should consider the answer, you MUST follow these steps when responding:\n\n{sub_questions}" else: @@ -227,7 +242,7 @@ def query_transform(self, chat_request, retrieved_nodes, sub_questions=None): prompt_str = self.prompt.format(input=final_query, chat_history=chat_history, context=text_gen_context) return text_gen_context, prompt_str - def run(self, chat_request, retrieved_nodes, node_parser_type, **kwargs): + async def run(self, chat_request, retrieved_nodes, node_parser_type, **kwargs): if self.llm() is None: # This could happen when User delete all LLMs through RESTful API raise ValueError("No LLM available, please load LLM") @@ -245,19 +260,21 @@ def run(self, chat_request, retrieved_nodes, node_parser_type, **kwargs): self.llm().generate_kwargs = generate_kwargs self.llm().max_new_tokens = chat_request.max_tokens unstructured_str = "" - if node_parser_type == NodeParserType.UNSTRUCTURED: + if node_parser_type == NodeParserType.UNSTRUCTURED or node_parser_type == NodeParserType.SIMPLE: unstructured_str = extract_unstructured_eles(retrieved_nodes, text_gen_context) if chat_request.stream: - return StreamingResponse( - local_stream_generator(self.lock, self.llm(), prompt_str, unstructured_str), - media_type="text/event-stream", - ) + # Asynchronous generator + async def generator(): + async for chunk in local_stream_generator(self.lock, self.llm(), prompt_str, unstructured_str): + yield chunk or "" + await asyncio.sleep(0) + + return generator() else: result = self.llm().complete(prompt_str) - save_history(str(result.text)) return result - def run_vllm(self, chat_request, retrieved_nodes, node_parser_type, **kwargs): + async def run_vllm(self, chat_request, retrieved_nodes, node_parser_type, **kwargs): # query transformation sub_questions = kwargs.get("sub_questions", None) text_gen_context, prompt_str = self.query_transform(chat_request, retrieved_nodes, sub_questions=sub_questions) @@ -273,15 +290,19 @@ def run_vllm(self, chat_request, retrieved_nodes, node_parser_type, **kwargs): repetition_penalty=chat_request.repetition_penalty, ) unstructured_str = "" - if node_parser_type == NodeParserType.UNSTRUCTURED: + if node_parser_type == NodeParserType.UNSTRUCTURED or node_parser_type == NodeParserType.SIMPLE: unstructured_str = extract_unstructured_eles(retrieved_nodes, text_gen_context) if chat_request.stream: - return StreamingResponse( - stream_generator(llm, prompt_str, unstructured_str), media_type="text/event-stream" - ) + + # Asynchronous generator + async def generator(): + async for chunk in stream_generator(llm, prompt_str, unstructured_str): + yield chunk or "" + await asyncio.sleep(0) + + return generator() else: - result = llm.complete(prompt_str) - save_history(str(result)) + result = await llm.acomplete(prompt_str) return result @model_serializer @@ -296,69 +317,89 @@ def ser_model(self): return set -@dataclasses.dataclass -class INSTRUCTIONS: - IM_START = "You are an AI assistant that 
helps users answer questions given a specific context." - SUCCINCT = "Ensure your response is succinct" - ACCURATE = "Ensure your response is accurate." - SUCCINCT_AND_ACCURATE = "Ensure your response is succinct. Try to be accurate if possible." - ACCURATE_AND_SUCCINCT = "Ensure your response is accurate. Try to be succinct if possible." - NO_RAMBLING = "Avoid posing new questions or self-questioning and answering, and refrain from repeating words in your response." - SAY_SOMETHING = "Avoid meaningless answer such a random symbol or blanks." - ENCOURAGE = "If you cannot well understand the question, try to translate it into English, and translate the answer back to the language of the question." - NO_IDEA = ( - 'If the answer is not discernible, please respond with "Sorry. I have no idea" in the language of the question.' - ) - CLOZE_TEST = """The task is a fill-in-the-blank/cloze test.""" - NO_MEANINGLESS_SYMBOLS = "Meaningless symbols and ``` should not be included in your response." - ADAPT_NATIVE_LANGUAGE = "Please try to think like a person that speak the same language that the question used." - - -def _is_cloze(question): - return ("()" in question or "()" in question) and ("填" in question or "fill" in question or "cloze" in question) - - -# depreciated -def get_instructions(question): - # naive pre-retrieval rewrite - # cloze - if _is_cloze(question): - instructions = [ - INSTRUCTIONS.CLOZE_TEST, - ] - else: - instructions = [ - INSTRUCTIONS.ACCURATE_AND_SUCCINCT, - INSTRUCTIONS.NO_RAMBLING, - INSTRUCTIONS.NO_MEANINGLESS_SYMBOLS, - ] - return ["System: {}".format(_) for _ in instructions] - - -def preprocess_question(question): - if _is_cloze(question): - question = question.replace(" ", "").replace("(", "(").replace(")", ")") - # .replace("()", " <|blank|> ") - ret = "User: Please finish the following fill-in-the-blank question marked by $$$ at the beginning and end. 
Make sure all the () are filled.\n$$$\n{}\n$$$\nAssistant: ".format( - question +class FreeChatGenerator(BaseComponent): + + def __init__(self, llm_model, inference_type, vllm_endpoint, **kwargs): + BaseComponent.__init__( + self, + comp_type=CompType.GENERATOR, + comp_subtype=GeneratorType.FREECHAT, ) - else: - ret = "User: {}\nAssistant: 从上下文提供的信息中可以知道,".format(question) - return ret - - -class DocumentedContextRagPromptTemplate(PromptTemplate): - - def format(self, **kwargs) -> str: - # context = '\n'.join([clean_string(f"{_.page_content}".strip()) for i, _ in enumerate(kwargs["context"])]) - context = kwargs["context"] - question = kwargs["input"] - preprocessed_question = preprocess_question(question) - if "instructions" in self.template: - instructions = get_instructions(question) - prompt_str = self.template.format( - context=context, instructions="\n".join(instructions), input=preprocessed_question - ) + self.inference_type = inference_type + self.prompt_content = "" + self.prompt_template_file = "" + self._REPLACE_PAIRS = ( + ("\n\n", "\n"), + ("\t\n", "\n"), + ) + self.enable_think = False + if isinstance(llm_model, str): + self.model_id = llm_model + self.model_path = llm_model else: - prompt_str = self.template.format(context=context, input=preprocessed_question) - return prompt_str + llm_instance = llm_model() + if llm_instance.model_path is None or llm_instance.model_path == "": + self.model_id = llm_instance.model_id + self.model_path = os.path.join("/home/user/models", os.getenv("LLM_MODEL", "Qwen/Qwen3-8B")) + else: + self.model_id = llm_instance.model_id + self.model_path = llm_instance.model_path + + self.llm = llm_model + if self.inference_type == InferenceType.VLLM: + self.vllm_name = llm_model().model_id + if vllm_endpoint == "": + vllm_endpoint = os.getenv("vLLM_ENDPOINT", "http://localhost:8086") + self.vllm_endpoint = vllm_endpoint + + async def run(self, chat_request, retrieved_nodes, node_parser_type, **kwargs): + response = await self.run_vllm(chat_request, retrieved_nodes, node_parser_type, **kwargs) + return response + + async def run_vllm(self, chat_request, retrieved_nodes, node_parser_type, **kwargs): + llm = OpenAILike( + api_key="fake", + api_base=self.vllm_endpoint + "/v1", + max_tokens=chat_request.max_tokens, + model=self.vllm_name, + top_p=chat_request.top_p, + top_k=chat_request.top_k, + temperature=chat_request.temperature, + streaming=chat_request.stream, + repetition_penalty=chat_request.repetition_penalty, + ) + prompt_str = chatcompletion_to_chatml(chat_request) + if chat_request.stream: + + # Asynchronous generator + async def generator(): + gen = await llm.astream_complete(prompt_str) + async for chunk in gen: + yield chunk.delta or "" + await asyncio.sleep(0) + + return generator() + else: + result = await llm.acomplete(prompt_str) + return str(result) + + @model_serializer + def ser_model(self): + set = { + "idx": self.idx, + "generator_type": self.comp_subtype, + "inference_type": self.inference_type, + "model": self.llm(), + "vllm_endpoint": self.vllm_endpoint, + } + return set + + +def chatcompletion_to_chatml(request: ChatCompletionRequest) -> str: + """Convert a ChatCompletionRequest dict to a ChatML-formatted string.""" + chatml = "" + for msg in request.messages: + chatml += f"<|im_start|>{msg.get('role', '')}\n{msg.get('content', '')}<|im_end|>\n" + # start generation from assistant role + chatml += "<|im_start|>assistant\n" + return chatml diff --git a/EdgeCraftRAG/edgecraftrag/components/indexer.py 
b/EdgeCraftRAG/edgecraftrag/components/indexer.py index 842122964f..e2a517101d 100644 --- a/EdgeCraftRAG/edgecraftrag/components/indexer.py +++ b/EdgeCraftRAG/edgecraftrag/components/indexer.py @@ -10,11 +10,11 @@ from llama_index.vector_stores.faiss import FaissVectorStore from llama_index.vector_stores.milvus import MilvusVectorStore from pydantic import model_serializer +from pymilvus import Collection, connections class VectorIndexer(BaseComponent, VectorStoreIndex): - - def __init__(self, embed_model, vector_type, milvus_uri="http://localhost:19530", kb_name="default_kb"): + def __init__(self, embed_model, vector_type, vector_url="http://localhost:19530", kb_name="default_kb"): BaseComponent.__init__( self, comp_type=CompType.INDEXER, @@ -26,15 +26,19 @@ def __init__(self, embed_model, vector_type, milvus_uri="http://localhost:19530" from llama_index.core import Settings Settings.embed_model = None - self.milvus_uri = milvus_uri - self._initialize_indexer(embed_model, vector_type, milvus_uri, kb_name) + self.vector_url = vector_url + self._initialize_indexer(embed_model, vector_type, vector_url, kb_name) - def _initialize_indexer(self, embed_model, vector_type, milvus_uri, kb_name): + def _initialize_indexer(self, embed_model, vector_type, vector_url, kb_name): # get active name pl = ctx.get_pipeline_mgr().get_active_pipeline() - plname = pl.name if pl else "" + collection_name = kb_name + pl.name if pl else "default" if embed_model: - self.d = embed_model._model.request.outputs[0].get_partial_shape()[2].get_length() + try: + self.d = len(embed_model.get_text_embedding("test")) + except Exception: + # Fallback for OpenVINO models if the above fails + self.d = embed_model._model.request.outputs[0].get_partial_shape()[2].get_length() else: self.d = 128 match vector_type: @@ -46,24 +50,24 @@ def _initialize_indexer(self, embed_model, vector_type, milvus_uri, kb_name): VectorStoreIndex.__init__(self, embed_model=embed_model, nodes=[], storage_context=faiss_store) case IndexerType.MILVUS_VECTOR: milvus_vector_store = MilvusVectorStore( - uri=milvus_uri, + uri=vector_url, dim=self.d, - collection_name=kb_name + plname + str(self.d), + collection_name=collection_name, overwrite=False, ) milvus_store = StorageContext.from_defaults(vector_store=milvus_vector_store) VectorStoreIndex.__init__(self, embed_model=embed_model, nodes=[], storage_context=milvus_store) def reinitialize_indexer(self, kb_name="default_kb"): - self._initialize_indexer(self.model, self.comp_subtype, self.milvus_uri, kb_name) + self._initialize_indexer(self.model, self.comp_subtype, self.vector_url, kb_name) def clear_milvus_collection(self, kb_name="default_kb"): # get active name pl = ctx.get_pipeline_mgr().get_active_pipeline() plname = pl.name if pl else "" milvus_vector_store = MilvusVectorStore( - uri=self.milvus_uri, - collection_name=kb_name + plname + str(self.d), + uri=self.vector_url, + collection_name=kb_name + plname, overwrite=False, ) milvus_vector_store.clear() @@ -75,3 +79,42 @@ def run(self, **kwargs) -> Any: def ser_model(self): set = {"idx": self.idx, "indexer_type": self.comp_subtype, "model": self.model} return set + + +class KBADMINIndexer(BaseComponent): + # Handled in the kbadmin project + def __init__(self, embed_model, vector_type, kbadmin_embedding_url, vector_url="http://localhost:29530"): + BaseComponent.__init__( + self, + comp_type=CompType.INDEXER, + comp_subtype=IndexerType.KBADMIN_INDEXER, + ) + self.embed_model = embed_model + self.kbadmin_embedding_url = kbadmin_embedding_url + 
self.vector_url = vector_url + + def insert_nodes(self, nodes): + return None + + def _index_struct(self, nodes): + return None + + def run(self, **kwargs) -> Any: + return None + + def reinitialize_indexer(self, kb_name="default_kb"): + return None + + def clear_milvus_collection(self, **kwargs): + return None + + @model_serializer + def ser_model(self): + set = { + "idx": self.idx, + "indexer_type": self.comp_subtype, + "model": {"model_id": self.embed_model}, + "kbadmin_embedding_url": self.kbadmin_embedding_url, + "vector_url": self.vector_url, + } + return set diff --git a/EdgeCraftRAG/edgecraftrag/components/knowledge_base.py b/EdgeCraftRAG/edgecraftrag/components/knowledge_base.py index 259c4a463f..93f578080c 100644 --- a/EdgeCraftRAG/edgecraftrag/components/knowledge_base.py +++ b/EdgeCraftRAG/edgecraftrag/components/knowledge_base.py @@ -1,40 +1,363 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 +import json import os -from typing import Any, List, Optional +import uuid +from typing import Any, Dict, List, Optional, Union -from edgecraftrag.base import BaseComponent +from edgecraftrag.base import BaseComponent, CompType +from edgecraftrag.config_repository import ( + MilvusConfigRepository, + MilvusDocumentRecordRepository, +) +from edgecraftrag.env import DOCUMENT_DATA_FILE, EXPERIENCE_FILE +from llama_index.core.schema import Document from pydantic import model_serializer class Knowledge(BaseComponent): - file_paths: Optional[List[str]] = [] - file_map: Optional[List[str]] = {} - description: Optional[str] = "None" - comp_type: str = "knowledge" - active: bool + def __init__( + self, + name: str, + description: Optional[str] = None, + active: bool = True, + comp_type: Optional[str] = None, + comp_subtype: Optional[str] = None, + experience_active: bool = False, + idx: Optional[str] = None, + all_document_maps: Optional[Dict] = None, + file_paths: Optional[list] = None, + **kwargs, + ): + super().__init__(name=name, comp_type=CompType.KNOWLEDGE, **kwargs) + + self.description = description + self.experience_active = experience_active + self.active = active + self.comp_type = comp_type + self.comp_subtype = comp_subtype + if idx is not None: + self.idx = str(idx) + if all_document_maps is not None: + self.all_document_maps = all_document_maps + else: + self.all_document_maps: Dict[str, Dict[str, str]] = {} + + self.document_records: List[Dict[str, str]] = [] + + if file_paths is not None: + self.file_paths = file_paths + self._update_file_names() + else: + self.file_paths: List[str] = [] + self.file_map: Dict[str, str] = {} + + self.experience_repo = MilvusConfigRepository.create_connection("experience_data", 1) + self.document_record_repo = MilvusDocumentRecordRepository.create_connection("document_records", 1) def _update_file_names(self) -> None: self.file_map = {os.path.basename(path): path for path in self.file_paths if path is not None} - def add_file_path(self, file_path: str) -> bool: - if file_path not in self.file_paths: + def add_file_path( + self, + file_path: str, + documents: List[Document], + pl_name: str, + only_add_file: bool = True, + ) -> bool: + if pl_name not in self.all_document_maps: + self.all_document_maps[pl_name] = {} + if file_path not in self.all_document_maps[pl_name]: + file_id = str(uuid.uuid4()) + self.all_document_maps[pl_name][file_path] = file_id + else: + file_id = self.all_document_maps[pl_name][file_path] + + records = [ + { + "file_id": file_id, + "file_path": file_path, + "doc_id": doc.id_, + "metadata": 
doc.metadata, + } + for doc in documents + ] + self._add_document_records(records) + + if only_add_file and file_path not in self.file_paths: self.file_paths.append(file_path) self._update_file_names() - return True - return False - def remove_file_path(self, file_path: str) -> bool: - if file_path in self.file_paths: - self.file_paths.remove(file_path) - self._update_file_names() - return True - return False + def remove_file_path(self, file_path: str, pl_name: str) -> List[str]: + removed_doc_ids = [] + if pl_name in self.all_document_maps and file_path in self.all_document_maps[pl_name]: + file_id = self.all_document_maps[pl_name][file_path] + removed_doc_ids = self._remove_document_records_by_file_id(file_id) + + del self.all_document_maps[pl_name][file_path] + if file_path in self.file_paths: + self.file_paths.remove(file_path) + self._update_file_names() + + return removed_doc_ids def get_file_paths(self) -> List[str]: return self.file_paths + # Content related to experience + def _read_experience_file(self) -> List[Dict]: + if self.experience_repo: + return [item["config_json"] for item in self.experience_repo.get_configs()] + else: + if EXPERIENCE_FILE not in self.file_paths: + self.file_paths.append(EXPERIENCE_FILE) + if not os.path.isfile(self.file_paths[0]): + self.ensure_file_exists(self.file_paths[0]) + with open(self.file_paths[0], "r", encoding="utf-8") as f: + return json.load(f) + + def _write_experience_file(self, data: List[Dict]) -> None: + if self.experience_repo: + return True + else: + with open(self.file_paths[0], "w", encoding="utf-8") as f: + json.dump(data, f, ensure_ascii=False, indent=4) + return True + + def get_all_experience(self) -> List[Dict]: + return self._read_experience_file() + + def get_experience_by_id_or_question(self, req: str) -> Optional[Dict]: + for item in self.get_all_experience(): + if item.get("idx") == req.idx or item.get("question") == req.question: + return item + return None + + def add_multiple_experiences( + self, experiences: List[Dict[str, Union[str, List[str]]]], flag: bool = True + ) -> List[Dict]: + result = [] + if self.experience_repo: + for exp in experiences: + question = exp.get("question") + if not question: + raise ValueError("Each experience must have a 'question'") + content = exp.get("content", []) + exp_idx = exp.get("idx") or str(uuid.uuid4()) + + existing = self.experience_repo.get_configs(idx=exp_idx) + if not existing: + all_exps = self.get_all_experience() + existing = [item for item in all_exps if item.get("question") == question] + else: + existing = [item["config_json"] for item in existing] + + if existing: + existing_item = existing[0] + exp_idx = existing_item.get("idx") + if flag: + existing_item["content"].extend([c for c in content if c not in existing_item["content"]]) + else: + existing_item["content"] = content + existing_item["question"] = question + success = self.experience_repo.update_config_by_idx(exp_idx, existing_item) + if success: + result.append(existing_item) + else: + new_item = { + "idx": exp_idx, + "question": question, + "content": content, + } + success = self.experience_repo.add_config_by_idx(exp_idx, new_item) + if success: + result.append(new_item) + return result + else: + all_exp = self._read_experience_file() + for exp in experiences: + question = exp.get("question") + if not question: + raise ValueError("Each experience must have a 'question'") + content = exp.get("content", []) + exp_idx = exp.get("idx") or str(uuid.uuid4()) + existing_idx = None + existing_item = None + for i, 
item in enumerate(all_exp): + if item.get("idx") == exp_idx: + existing_idx = i + existing_item = item + break + if existing_idx is None: + for i, item in enumerate(all_exp): + if item.get("question") == question: + existing_idx = i + existing_item = item + break + if existing_idx is not None: + if flag: + existing_item["content"].extend([c for c in content if c not in existing_item["content"]]) + existing_item["question"] = question + else: + existing_item["content"] = content + existing_item["question"] = question + all_exp[existing_idx] = existing_item + result.append(existing_item) + else: + new_item = { + "idx": exp_idx, + "question": question, + "content": content, + } + all_exp.append(new_item) + result.append(new_item) + self._write_experience_file(all_exp) + return result + + def delete_experience(self, exp_idx: str) -> bool: + if self.experience_repo: + return self.experience_repo.delete_config_by_idx(exp_idx) + else: + all_exp = self._read_experience_file() + remaining = [item for item in all_exp if item.get("idx") != exp_idx] + if len(remaining) != len(all_exp): + self._write_experience_file(remaining) + return True + return False + + def clear_experiences(self) -> bool: + if self.experience_repo: + try: + self.experience_repo.clear_all_config() + return True + except Exception as e: + print(f"Clear Milvus experiences failed: {e}") + return False + else: + self._write_experience_file([]) + return True + + def update_experience(self, exp_idx: str, new_question: str, new_content: List[str]) -> Optional[Dict]: + updated_item = { + "idx": exp_idx, + "question": new_question, + "content": new_content, + } + if self.experience_repo: + success = self.experience_repo.update_config_by_idx(exp_idx, updated_item) + return updated_item if success else None + else: + all_exp = self._read_experience_file() + for i, item in enumerate(all_exp): + if item.get("idx") == exp_idx: + all_exp[i] = updated_item + self._write_experience_file(all_exp) + return updated_item + return None + + def add_experiences_from_file(self, file_path: str, flag: bool = False) -> List[Dict]: + if not file_path.endswith(".json"): + raise ValueError("File must be a JSON file") + try: + with open(file_path, "r", encoding="utf-8") as f: + data = json.load(f) + if not isinstance(data, list): + raise ValueError("File content must be a list of experiences") + experiences = [] + for item in data: + exp = { + "idx": item.get("idx") or str(uuid.uuid4()), + "question": item.get("question", ""), + "content": item.get("content", []), + } + experiences.append(exp) + + return self.add_multiple_experiences(experiences=experiences, flag=flag) + except json.JSONDecodeError as e: + raise ValueError(f"Invalid JSON: {str(e)}") + except Exception as e: + raise ValueError(f"File error: {str(e)}") + + # Related content of document + def _add_document_records(self, records: List[Dict[str, str]]) -> None: + if records and self.document_record_repo: + self.document_record_repo.save_records(records) + elif records: + if not os.path.isfile(DOCUMENT_DATA_FILE): + self.ensure_file_exists(DOCUMENT_DATA_FILE) + if os.path.exists(DOCUMENT_DATA_FILE): + with open(DOCUMENT_DATA_FILE, "r", encoding="utf-8") as f: + existing_data = json.load(f) + else: + existing_data = [] + existing_data.extend(records) + with open(DOCUMENT_DATA_FILE, "w", encoding="utf-8") as f: + json.dump(existing_data, f, ensure_ascii=False, indent=4) + + def _remove_document_records_by_file_id(self, file_id: str) -> List[Dict[str, str]]: + deleted_records = [] + if 
self.document_record_repo: + deleted_records = self.document_record_repo.delete_records_by_file_id(file_id) + else: + if os.path.exists(DOCUMENT_DATA_FILE): + with open(DOCUMENT_DATA_FILE, "r", encoding="utf-8") as f: + all_document_data = json.load(f) + deleted_records = [item.get("doc_id") for item in all_document_data if item.get("file_id") == file_id] + result_documents = [item for item in all_document_data if item.get("file_id") != file_id] + if len(deleted_records) > 0: + with open(DOCUMENT_DATA_FILE, "w", encoding="utf-8") as f: + json.dump(result_documents, f, ensure_ascii=False, indent=4) + return deleted_records + + def get_all_document(self, file_path, pl_name) -> List[Dict[str, Any]]: + doc_info_list = [] + if pl_name not in self.all_document_maps: + return doc_info_list + file_id = self.all_document_maps[pl_name].get(file_path) + if not file_id: + return doc_info_list + + if self.document_record_repo: + records = self.document_record_repo.get_records_by_file_id(file_id) + doc_info_list = [{"doc_id": rec["doc_id"], "metadata": rec.get("metadata", {})} for rec in records] + else: + if os.path.exists(DOCUMENT_DATA_FILE): + with open(DOCUMENT_DATA_FILE, "r", encoding="utf-8") as f: + all_data = json.load(f) + doc_info_list = [ + {"doc_id": item["doc_id"], "metadata": item.get("metadata", {})} + for item in all_data + if item.get("file_id") == file_id + ] + return doc_info_list + + def clear_documents(self, pl_name): + if pl_name not in self.all_document_maps: + return + for file_id in self.all_document_maps[pl_name].values(): + self._remove_document_records_by_file_id(file_id) + self.all_document_maps[pl_name] = {} + return True + + # Make sure the folder and its files exist + def ensure_file_exists(self, file_paths): + dir_path = os.path.dirname(file_paths) + os.makedirs(dir_path, exist_ok=True) + if not os.path.exists(file_paths): + with open(file_paths, "w", encoding="utf-8") as f: + json.dump([], f, ensure_ascii=False, indent=4) + + # Calculate the number of files or experience + def calculate_totals(self): + if self.comp_type == "knowledge": + total = len(self.file_paths) + elif self.comp_type == "experience": + total = len(self.get_all_experience()) + else: + total = None + return total + def run(self, **kwargs) -> Any: pass @@ -44,8 +367,11 @@ def ser_model(self): "idx": self.idx, "name": self.name, "comp_type": self.comp_type, + "comp_subtype": self.comp_subtype, "file_map": self.file_map, "description": self.description, "active": self.active, + "experience_active": self.experience_active, + "total": self.calculate_totals(), } return set diff --git a/EdgeCraftRAG/edgecraftrag/components/model.py b/EdgeCraftRAG/edgecraftrag/components/model.py index a41b4a7f01..6cb27e623b 100644 --- a/EdgeCraftRAG/edgecraftrag/components/model.py +++ b/EdgeCraftRAG/edgecraftrag/components/model.py @@ -6,6 +6,7 @@ from edgecraftrag.base import BaseComponent, CompType, ModelType from llama_index.embeddings.huggingface_openvino import OpenVINOEmbedding +from llama_index.embeddings.openai import OpenAIEmbedding from llama_index.llms.openvino import OpenVINOLLM from llama_index.postprocessor.openvino_rerank import OpenVINORerank from pydantic import Field, model_serializer @@ -26,6 +27,7 @@ class BaseModelComponent(BaseComponent): model_path: Optional[str] = Field(default="") weight: Optional[str] = Field(default="") device: Optional[str] = Field(default="cpu") + api_base: Optional[str] = Field(default=None) def run(self, **kwargs) -> Any: pass @@ -39,10 +41,24 @@ def ser_model(self): 
"model_path": self.model_path, "weight": self.weight, "device": self.device, + "api_base": self.api_base, } return set +class OpenAIEmbeddingModel(BaseModelComponent, OpenAIEmbedding): + def __init__(self, model_id, api_base, **kwargs): + super().__init__( + model_id=model_id, + api_base=api_base, + api_key="unused", + **kwargs, + ) + OpenAIEmbedding.__init__(self, model=model_id, api_base=api_base, api_key="unused") + self.comp_type = CompType.MODEL + self.comp_subtype = ModelType.VLLM_EMBEDDING + + class OpenVINOEmbeddingModel(BaseModelComponent, OpenVINOEmbedding): def __init__(self, model_id, model_path, device, weight): diff --git a/EdgeCraftRAG/edgecraftrag/components/node_parser.py b/EdgeCraftRAG/edgecraftrag/components/node_parser.py index 0f386bc61f..0bd49b91b4 100644 --- a/EdgeCraftRAG/edgecraftrag/components/node_parser.py +++ b/EdgeCraftRAG/edgecraftrag/components/node_parser.py @@ -168,3 +168,25 @@ def ser_model(self): "chunk_overlap": self.chunk_overlap, } return set + + +class KBADMINParser(BaseComponent): + # Handled in the kbadmin project + def __init__(self, **kwargs): + super().__init__(**kwargs) + self.comp_type = CompType.NODEPARSER + self.comp_subtype = NodeParserType.KBADMINPARSER + + def run(self, **kwargs) -> Any: + return None + + def insert_nodes(self): + return None + + @model_serializer + def ser_model(self): + set = { + "idx": self.idx, + "parser_type": self.comp_subtype, + } + return set diff --git a/EdgeCraftRAG/edgecraftrag/components/pipeline.py b/EdgeCraftRAG/edgecraftrag/components/pipeline.py index 41780ef88f..8bc0a3c15f 100644 --- a/EdgeCraftRAG/edgecraftrag/components/pipeline.py +++ b/EdgeCraftRAG/edgecraftrag/components/pipeline.py @@ -9,10 +9,11 @@ from typing import Any, Callable, List, Optional from comps.cores.proto.api_protocol import ChatCompletionRequest -from edgecraftrag.base import BaseComponent, CallbackType, CompType, InferenceType, RetrieverType +from edgecraftrag.base import BaseComponent, CallbackType, CompType, InferenceType, NodeParserType, RetrieverType from edgecraftrag.components.postprocessor import RerankProcessor from edgecraftrag.components.query_preprocess import query_search from edgecraftrag.components.retriever import AutoMergeRetriever, SimpleBM25Retriever, VectorSimRetriever +from edgecraftrag.env import SEARCH_CONFIG_PATH, SEARCH_DIR from fastapi.responses import StreamingResponse from llama_index.core.schema import Document, QueryBundle from pydantic import BaseModel, Field, model_serializer @@ -32,22 +33,37 @@ class Pipeline(BaseComponent): benchmark: Optional[BaseComponent] = Field(default=None) status: PipelineStatus = Field(default=PipelineStatus()) run_pipeline_cb: Optional[Callable[..., Any]] = Field(default=None) + run_retriever_postprocessor_cb: Optional[Callable[..., Any]] = Field(default=None) run_retriever_cb: Optional[Callable[..., Any]] = Field(default=None) + run_postprocessor_cb: Optional[Callable[..., Any]] = Field(default=None) run_data_prepare_cb: Optional[Callable[..., Any]] = Field(default=None) + run_query_search_cb: Optional[Callable[..., Any]] = Field(default=None) def __init__( self, name, origin_json=None, + idx=None, + documents_cache=None, ): super().__init__(name=name, comp_type=CompType.PIPELINE) if self.name == "" or self.name is None: self.name = self.idx + if idx is not None: + self.idx = str(idx) + if documents_cache is not None: + self.documents_cache = documents_cache + else: + self.documents_cache = {} + self.enable_benchmark = os.getenv("ENABLE_BENCHMARK", "False").lower() == 
"true" - self.run_pipeline_cb = run_generator_ben if self.enable_benchmark else run_generator + self.run_pipeline_cb = run_pipeline + self.run_retriever_postprocessor_cb = run_retrieve_postprocess self.run_retriever_cb = run_retrieve + self.run_postprocessor_cb = run_postprocess + self.run_generator_cb = run_generator self.run_data_prepare_cb = run_simple_doc - + self.run_query_search_cb = run_query_search self._node_changed = False self._index_changed = False self._index_to_retriever_updated = True @@ -97,12 +113,10 @@ def check_active(self, nodelist, kb_name): # TODO: update doc changes # TODO: more operations needed, add, del, modify def update_nodes(self, nodes): - print(f"Updating {len(nodes)} nodes ...") if self.indexer is not None: self.indexer.insert_nodes(nodes) def update_indexer_to_retriever(self): - print("Updating indexer to retriever ...") if self.indexer is not None and self.retriever is not None: old_retriever = self.retriever retriever_type = old_retriever.comp_subtype @@ -121,18 +135,31 @@ def update_indexer_to_retriever(self): # Implement abstract run function # callback dispatcher - def run(self, **kwargs) -> Any: - print(kwargs) + async def run(self, **kwargs) -> Any: if "cbtype" in kwargs: if kwargs["cbtype"] == CallbackType.DATAPREP: if "docs" in kwargs: - return self.run_data_prepare_cb(self, docs=kwargs["docs"]) + return await self.run_data_prepare_cb(self, docs=kwargs["docs"]) + if kwargs["cbtype"] == CallbackType.RETRIEVE_POSTPROCESS: + if "chat_request" in kwargs: + return await self.run_retriever_postprocessor_cb(self, chat_request=kwargs["chat_request"]) if kwargs["cbtype"] == CallbackType.RETRIEVE: if "chat_request" in kwargs: - return self.run_retriever_cb(self, chat_request=kwargs["chat_request"]) + return await self.run_retriever_cb(self, chat_request=kwargs["chat_request"]) + if kwargs["cbtype"] == CallbackType.POSTPROCESS: + if "chat_request" in kwargs and "contexts" in kwargs: + return await self.run_postprocessor_cb( + self, chat_request=kwargs["chat_request"], contexts=kwargs["contexts"] + ) + if kwargs["cbtype"] == CallbackType.GENERATE: + if "chat_request" in kwargs: + return await self.run_generator_cb(self, chat_request=kwargs["chat_request"]) if kwargs["cbtype"] == CallbackType.PIPELINE: if "chat_request" in kwargs: - return self.run_pipeline_cb(self, chat_request=kwargs["chat_request"]) + return await self.run_pipeline_cb(self, chat_request=kwargs["chat_request"]) + if kwargs["cbtype"] == CallbackType.QUERYSEARCH: + if "chat_request" in kwargs: + return await self.run_query_search_cb(self, chat_request=kwargs["chat_request"]) def update(self, node_parser=None, indexer=None, retriever=None, postprocessor=None, generator=None): if node_parser is not None: @@ -146,6 +173,86 @@ def update(self, node_parser=None, indexer=None, retriever=None, postprocessor=N if generator is not None: self.generator = generator + def add_docs_to_list(self, kb_name, file_paths): + if self.indexer.comp_subtype != "milvus_vector": + return None + target_config = self.connect_target_config() + if kb_name not in self.documents_cache: + self.documents_cache[kb_name] = {"files": [], "config": target_config} + if isinstance(file_paths, str): + file_paths = [file_paths] + self.documents_cache[kb_name]["files"].extend(file_paths) + + def del_docs_to_list(self, kb_name, file_paths): + if kb_name not in self.documents_cache: + return None + if isinstance(file_paths, str): + file_paths = [file_paths] + for file_path in file_paths: + if file_path in 
self.documents_cache[kb_name]["files"]: + self.documents_cache[kb_name]["files"].remove(file_path) + + def clear_document_cache(self, kb_name): + if kb_name in self.documents_cache: + del self.documents_cache[kb_name] + + def compare_file_lists(self, kb_name, current_files): + self.add_docs_to_list(kb_name, []) + target_config = self.connect_target_config() + if self.documents_cache[kb_name]["config"] == target_config: + diff = self.compare_mappings(self.documents_cache[kb_name]["files"], current_files) + else: + self.documents_cache[kb_name] = {"files": [], "config": self.connect_target_config()} + diff = {"add_docs": current_files} + return diff + + def compare_mappings(self, stored_files, new_files): + stored = set(stored_files) + new = set(new_files) + return {"add_docs": list(new - stored), "del_docs": list(stored - new)} + + def connect_target_config(self): + target_config = "" + if self.node_parser.comp_subtype == NodeParserType.SIMPLE: + target_config = ( + "simple" + + str(self.node_parser.chunk_size) + + str(self.node_parser.chunk_overlap) + + self.indexer.model.model_id + ) + elif self.node_parser.comp_subtype == NodeParserType.SENTENCEWINDOW: + target_config = "sentencewindow" + str(self.node_parser.window_size) + self.indexer.model.model_id + elif self.node_parser.comp_subtype == NodeParserType.HIERARCHY: + target_config = "hierarchical" + self.indexer.model.model_id + elif self.node_parser.comp_subtype == NodeParserType.UNSTRUCTURED: + target_config = ( + "target_config" + + str(self.node_parser.chunk_size) + + str(self.node_parser.chunk_overlap) + + self.indexer.model.model_id + ) + return target_config + + def nodes_to_document(self, node_dict: dict): + nodes = [] + for node_info in node_dict.values(): + nodes.append({"start": int(node_info["start_char_idx"]), "text": node_info["text"]}) + nodes_sorted = sorted(nodes, key=lambda x: x["start"]) + if not nodes_sorted: + return "" + merged_text = nodes_sorted[0]["text"] + for i in range(1, len(nodes_sorted)): + prev_text = merged_text + curr_text = nodes_sorted[i]["text"] + max_possible_overlap = min(len(prev_text), len(curr_text)) + overlap_len = 0 + for j in range(max_possible_overlap, 0, -1): + if prev_text.endswith(curr_text[:j]): + overlap_len = j + break + merged_text += curr_text[overlap_len:] + return merged_text + @model_serializer def ser_model(self): set = { @@ -181,11 +288,55 @@ def model_existed(self, model_id: str) -> bool: return False -# Test callback to retrieve nodes from query -def run_retrieve(pl: Pipeline, chat_request: ChatCompletionRequest) -> Any: +async def run_retrieve(pl: Pipeline, chat_request: ChatCompletionRequest) -> Any: + benchmark_data = {} + query = chat_request.messages + top_k = None if chat_request.k == ChatCompletionRequest.model_fields["k"].default else chat_request.k + contexts = {} + start = 0 + if pl.enable_benchmark: + _, benchmark_data = pl.benchmark.init_benchmark_data() + start = time.perf_counter() + retri_res = pl.retriever.run(query=query, top_k=top_k) + if pl.enable_benchmark: + benchmark_data[CompType.RETRIEVER] = time.perf_counter() - start + pl.benchmark.insert_benchmark_data(benchmark_data) + contexts[CompType.RETRIEVER] = retri_res + return contexts + + +async def run_postprocess(pl: Pipeline, chat_request: ChatCompletionRequest, contexts) -> Any: + if CompType.RETRIEVER not in contexts: + raise ValueError("No retrieved contexts identified.") + query = chat_request.messages + query_bundle = QueryBundle(query) + if pl.postprocessor: + # TODO: Consider multiple 
postprocessors + for processor in pl.postprocessor: + if ( + isinstance(processor, RerankProcessor) + and chat_request.top_n != ChatCompletionRequest.model_fields["top_n"].default + ): + processor.top_n = chat_request.top_n + retri_res = processor.run(retri_res=contexts.get(CompType.RETRIEVER), query_bundle=query_bundle) + contexts[CompType.POSTPROCESSOR] = retri_res + return contexts + + +# Test callback to retrieve and rerank nodes from query +async def run_retrieve_postprocess(pl: Pipeline, chat_request: ChatCompletionRequest) -> Any: + benchmark_data = {} query = chat_request.messages + top_k = None if chat_request.k == ChatCompletionRequest.model_fields["k"].default else chat_request.k contexts = {} - retri_res = pl.retriever.run(query=query) + start = 0 + if pl.enable_benchmark: + _, benchmark_data = pl.benchmark.init_benchmark_data() + start = time.perf_counter() + retri_res = pl.retriever.run(query=query, top_k=top_k) + if pl.enable_benchmark: + benchmark_data[CompType.RETRIEVER] = time.perf_counter() - start + pl.benchmark.insert_benchmark_data(benchmark_data) contexts[CompType.RETRIEVER] = retri_res query_bundle = QueryBundle(query) if pl.postprocessor: @@ -200,14 +351,41 @@ def run_retrieve(pl: Pipeline, chat_request: ChatCompletionRequest) -> Any: return contexts -def run_simple_doc(pl: Pipeline, docs: List[Document]) -> Any: +async def run_simple_doc(pl: Pipeline, docs: List[Document]) -> Any: + start = 0 + benchmark_data = {} + if pl.enable_benchmark: + _, benchmark_data = pl.benchmark.init_benchmark_data() + start = time.perf_counter() n = pl.node_parser.run(docs=docs) if pl.indexer is not None: pl.indexer.insert_nodes(n) - print(pl.indexer._index_struct) + if pl.enable_benchmark: + benchmark_data[CompType.NODEPARSER] += time.perf_counter() - start + benchmark_data[CompType.CHUNK_NUM] += len(n) + pl.benchmark.insert_benchmark_data(benchmark_data) return n +async def run_query_search(pl: Pipeline, chat_request: ChatCompletionRequest) -> Any: + query = chat_request.messages + + def run_async_query_search(): + loop = asyncio.new_event_loop() + asyncio.set_event_loop(loop) + try: + return loop.run_until_complete(query_search(query, SEARCH_CONFIG_PATH, SEARCH_DIR, pl)) + finally: + loop.close() + + with ThreadPoolExecutor(max_workers=1) as executor: + future = executor.submit(run_async_query_search) + top1_issue, sub_questionss_result = future.result() + if sub_questionss_result: + query = query + sub_questionss_result + return query, sub_questionss_result + + def benchmark_response(ret, benchmark, benchmark_index, benchmark_data, input_token_size, start): if isinstance(ret, StreamingResponse): original_body_iterator = ret.body_iterator @@ -225,114 +403,94 @@ async def timing_wrapper(): return ret -def run_generator_ben(pl: Pipeline, chat_request: ChatCompletionRequest) -> Any: - benchmark_index, benchmark_data = pl.benchmark.init_benchmark_data() +async def run_pipeline(pl: Pipeline, chat_request: ChatCompletionRequest) -> Any: + if pl.enable_benchmark: + benchmark_index, benchmark_data = pl.benchmark.init_benchmark_data() contexts = {} - start = time.perf_counter() + retri_res = [] + active_kb = chat_request.user if chat_request.user else None + enable_rag_retrieval = ( + chat_request.chat_template_kwargs.get("enable_rag_retrieval", True) + if chat_request.chat_template_kwargs + else True + ) + if not active_kb: + enable_rag_retrieval = False + elif pl.retriever.comp_subtype == "kbadmin_retriever" and active_kb.comp_subtype == "origin_kb": + enable_rag_retrieval = False + elif 
pl.retriever.comp_subtype != "kbadmin_retriever" and active_kb.comp_subtype == "kbadmin_kb": + enable_rag_retrieval = False query = chat_request.messages - if pl.generator.inference_type == InferenceType.VLLM: - UI_DIRECTORY = os.getenv("TMPFILE_PATH", "/home/user/ui_cache") - search_config_path = os.path.join(UI_DIRECTORY, "configs/search_config.yaml") - search_dir = os.path.join(UI_DIRECTORY, "configs/search_dir") - - def run_async_query_search(): - loop = asyncio.new_event_loop() - asyncio.set_event_loop(loop) - try: - return loop.run_until_complete(query_search(query, search_config_path, search_dir, pl)) - finally: - loop.close() - - with ThreadPoolExecutor(max_workers=1) as executor: - future = executor.submit(run_async_query_search) - top1_issue, sub_questionss_result = future.result() - if sub_questionss_result: - query = query + sub_questionss_result - - retri_res = pl.retriever.run(query=query) - query_bundle = QueryBundle(query) - benchmark_data[CompType.RETRIEVER] = time.perf_counter() - start - contexts[CompType.RETRIEVER] = retri_res - - start = time.perf_counter() - if pl.postprocessor: - for processor in pl.postprocessor: - if ( - isinstance(processor, RerankProcessor) - and chat_request.top_n != ChatCompletionRequest.model_fields["top_n"].default - ): - processor.top_n = chat_request.top_n - retri_res = processor.run(retri_res=retri_res, query_bundle=query_bundle) - contexts[CompType.POSTPROCESSOR] = retri_res - benchmark_data[CompType.POSTPROCESSOR] = time.perf_counter() - start + sub_questionss_result = None + experience_status = True if chat_request.tool_choice == "auto" else False + if enable_rag_retrieval: + start = 0 + if pl.enable_benchmark: + start = time.perf_counter() + if pl.generator.inference_type == InferenceType.VLLM and experience_status: + query, sub_questionss_result = await run_query_search(pl, chat_request) + if pl.enable_benchmark: + benchmark_data[CompType.QUERYSEARCH] = time.perf_counter() - start + start = time.perf_counter() + top_k = ( + None + if chat_request.k == pl.retriever.topk or chat_request.k != 0 or chat_request.k is None + else chat_request.k + ) + retri_res = pl.retriever.run(query=query, top_k=top_k) + if pl.enable_benchmark: + benchmark_data[CompType.RETRIEVER] = time.perf_counter() - start + contexts[CompType.RETRIEVER] = retri_res + query_bundle = QueryBundle(query) + if pl.enable_benchmark: + start = time.perf_counter() + if pl.postprocessor: + for processor in pl.postprocessor: + if ( + isinstance(processor, RerankProcessor) + and chat_request.top_n != processor.top_n + and chat_request.top_n != 0 + and chat_request.top_n is not None + ): + processor.top_n = chat_request.top_n + retri_res = processor.run(retri_res=retri_res, query_bundle=query_bundle) + contexts[CompType.POSTPROCESSOR] = retri_res + if pl.enable_benchmark: + benchmark_data[CompType.POSTPROCESSOR] = time.perf_counter() - start if pl.generator is None: raise ValueError("No Generator Specified") - text_gen_context, prompt_str = pl.generator.query_transform(chat_request, retri_res) - input_token_size = pl.benchmark.cal_input_token_size(prompt_str) + if pl.enable_benchmark: + _, prompt_str = pl.generator.query_transform(chat_request, retri_res) + input_token_size = pl.benchmark.cal_input_token_size(prompt_str) np_type = pl.node_parser.comp_subtype - start = time.perf_counter() + if pl.enable_benchmark: + start = time.perf_counter() if pl.generator.inference_type == InferenceType.LOCAL: - ret = pl.generator.run(chat_request, retri_res, np_type) + ret = await 
pl.generator.run(chat_request, retri_res, np_type) elif pl.generator.inference_type == InferenceType.VLLM: - ret = pl.generator.run_vllm(chat_request, retri_res, np_type, sub_questions=sub_questionss_result) + ret = await pl.generator.run_vllm(chat_request, retri_res, np_type, sub_questions=sub_questionss_result) else: raise ValueError("LLM inference_type not supported") - end = time.perf_counter() - - if isinstance(ret, StreamingResponse): - ret = benchmark_response(ret, pl.benchmark, benchmark_index, benchmark_data, input_token_size, start) - else: - benchmark_data[CompType.GENERATOR] = end - start - pl.benchmark.insert_llm_data(benchmark_index, input_token_size) - pl.benchmark.insert_benchmark_data(benchmark_data) + if pl.enable_benchmark: + end = time.perf_counter() + if isinstance(ret, StreamingResponse): + ret = benchmark_response(ret, pl.benchmark, benchmark_index, benchmark_data, input_token_size, start) + else: + benchmark_data[CompType.GENERATOR] = end - start + pl.benchmark.insert_llm_data(benchmark_index, input_token_size) + pl.benchmark.insert_benchmark_data(benchmark_data) return ret, contexts -def run_generator(pl: Pipeline, chat_request: ChatCompletionRequest) -> Any: - query = chat_request.messages - contexts = {} - if pl.generator.inference_type == InferenceType.VLLM: - UI_DIRECTORY = os.getenv("TMPFILE_PATH", "/home/user/ui_cache") - search_config_path = os.path.join(UI_DIRECTORY, "configs/search_config.yaml") - search_dir = os.path.join(UI_DIRECTORY, "configs/search_dir") - - def run_async_query_search(): - loop = asyncio.new_event_loop() - asyncio.set_event_loop(loop) - try: - return loop.run_until_complete(query_search(query, search_config_path, search_dir, pl)) - finally: - loop.close() - - with ThreadPoolExecutor(max_workers=1) as executor: - future = executor.submit(run_async_query_search) - top1_issue, sub_questionss_result = future.result() - if sub_questionss_result: - query = query + sub_questionss_result - retri_res = pl.retriever.run(query=query) - contexts[CompType.RETRIEVER] = retri_res - query_bundle = QueryBundle(query) - - if pl.postprocessor: - for processor in pl.postprocessor: - if ( - isinstance(processor, RerankProcessor) - and chat_request.top_n != ChatCompletionRequest.model_fields["top_n"].default - ): - processor.top_n = chat_request.top_n - retri_res = processor.run(retri_res=retri_res, query_bundle=query_bundle) - contexts[CompType.POSTPROCESSOR] = retri_res - - if pl.generator is None: - raise ValueError("No Generator Specified") +async def run_generator(pl: Pipeline, chat_request: ChatCompletionRequest) -> Any: np_type = pl.node_parser.comp_subtype if pl.generator.inference_type == InferenceType.LOCAL: - ret = pl.generator.run(chat_request, retri_res, np_type) + ret = await pl.generator.run(chat_request, [], np_type) elif pl.generator.inference_type == InferenceType.VLLM: - ret = pl.generator.run_vllm(chat_request, retri_res, np_type, sub_questions=sub_questionss_result) + ret = await pl.generator.run_vllm(chat_request, [], np_type) else: raise ValueError("LLM inference_type not supported") - return ret, contexts + return ret diff --git a/EdgeCraftRAG/edgecraftrag/components/postprocessor.py b/EdgeCraftRAG/edgecraftrag/components/postprocessor.py index bb59cc3d21..cbd387f59e 100644 --- a/EdgeCraftRAG/edgecraftrag/components/postprocessor.py +++ b/EdgeCraftRAG/edgecraftrag/components/postprocessor.py @@ -60,5 +60,5 @@ def run(self, **kwargs) -> Any: @model_serializer def ser_model(self): - set = {"idx": self.idx, "processor_type": 
self.comp_subtype, "model": None, "top_n": None} + set = {"idx": self.idx, "processor_type": self.comp_subtype, "top_n": None} return set diff --git a/EdgeCraftRAG/edgecraftrag/components/query_preprocess.py b/EdgeCraftRAG/edgecraftrag/components/query_preprocess.py index 124014a038..e17ab9d724 100644 --- a/EdgeCraftRAG/edgecraftrag/components/query_preprocess.py +++ b/EdgeCraftRAG/edgecraftrag/components/query_preprocess.py @@ -8,6 +8,7 @@ import aiohttp import numpy +from edgecraftrag.config_repository import MilvusConfigRepository from omegaconf import OmegaConf @@ -85,6 +86,7 @@ def __init__( output_template="", json_key="relevance", json_levels=["Low", "High"], + scores_weight=None, temperature=1.0, API_BASE=None, **kwargs, @@ -107,6 +109,19 @@ def __init__( self.json_levels = json_levels self.API_BASE = API_BASE + # dynamically set scores_weight, use default if not provided + if scores_weight is None: + # generate default weights based on json_levels count + if len(json_levels) == 2: + self.scores_weight = [0.0, 1.0] # Low, High + elif len(json_levels) == 3: + self.scores_weight = [0.0, 0.5, 1.0] # Low, Medium, High + else: + # for other counts, generate evenly spaced weights + self.scores_weight = [i / (len(json_levels) - 1) for i in range(len(json_levels))] + else: + self.scores_weight = scores_weight + async def invoke_vllm(self, input_texts): headers = {"Content-Type": "application/json"} payload = { @@ -152,18 +167,22 @@ async def _calculate_logits_score(self, user_input, issue): def _calculate_token_score_vllm(self, outputs, output_index=1, transform="exp"): generated_scores = outputs[output_index] - three_scores = [ - generated_scores.get("Low", -9999.0), - generated_scores.get("Medium", -9999.0), - generated_scores.get("High", -9999.0), - ] - level_scores = [score / self.temperature for score in three_scores] + + # dynamically get scores for all levels + level_scores = [] + for level in self.json_levels: + level_scores.append(generated_scores.get(level, -9999.0)) + + # apply temperature scaling + level_scores = [score / self.temperature for score in level_scores] level_scores_np = numpy.array(level_scores) level_scores_np = numpy.where(level_scores_np < -1000, -1000, level_scores_np) level_scores_np_exp = numpy.exp(level_scores_np - numpy.max(level_scores_np)) scores_probs = level_scores_np_exp / level_scores_np_exp.sum() - scores_weight = numpy.array([0.0, 0.5, 1.0]) # Low=0, Medium=0.5, High=1 + + # using dynamic scores_weight + scores_weight = numpy.array(self.scores_weight) final_score = numpy.dot(scores_probs, scores_weight) return final_score @@ -172,40 +191,51 @@ async def compute_score(self, input_pair): return await self._calculate_logits_score(*input_pair) -def read_json_files(directory: str) -> dict: - result = {} - for filename in os.listdir(directory): - if filename.endswith(".json"): - file_path = os.path.join(directory, filename) - if os.path.isfile(file_path): - try: - with open(file_path, "r", encoding="utf-8") as file: - data = json.load(file) - result.update(data) - except Exception: - continue - return result +experience_repo = MilvusConfigRepository.create_connection("experience_data", 1) + +def read_json_files(file_path: str) -> dict: + experience_lists = [] + if experience_repo: + experience_lists = [] + for experience in experience_repo.get_configs(): + experience_lists.append(experience["config_json"]) + else: + if os.path.isfile(file_path): + with open(file_path, "r", encoding="utf-8") as f: + experience_lists = json.load(f) + return experience_lists 
-async def query_search(user_input, search_config_path, search_dir, pl): +async def query_search(user_input, SEARCH_CONFIG_PATH, SEARCH_DIR, pl): top1_issue = None - sub_questionss_result = None - if not os.path.exists(search_dir): - return top1_issue, sub_questionss_result + sub_questions_result = None model_id = pl.generator.model_id vllm_endpoint = pl.generator.vllm_endpoint - cfg = OmegaConf.load(search_config_path) - cfg.query_matcher.model_id = model_id - cfg.query_matcher.API_BASE = os.path.join(vllm_endpoint, "v1/completions") - query_matcher = LogitsEstimatorJSON(**cfg.query_matcher) - maintenance_data = read_json_files(search_dir) - issues = list(maintenance_data.keys()) + maintenance_data = read_json_files(SEARCH_DIR) + issues = [] + for i in range(len(maintenance_data)): + issues.append(maintenance_data[i]["question"]) if not issues: - return top1_issue, sub_questionss_result - + return top1_issue, sub_questions_result + + cfg = {} + if not os.path.exists(SEARCH_CONFIG_PATH): + cfg["query_matcher"] = { + "instructions": "You're a knowledgeable assistant. Your task is to judge if two queries ask for the same information about the same primary subject. Output only 'Yes' or 'No'. Yes = same subject entity AND same information need, with only wording or stylistic differences. No = different subject entity, different spec or numeric constraint, different attribute/metric, or scope changed by adding/removing a restricting condition. Entity changes MUST lead to No.", + "input_template": "Query 1: {}\nQuery 2: {}\n", + "output_template": "\nAre these queries equivalent? Answer 'Yes' or 'No':", + "json_key": "similarity", + "json_levels": ["No", "Yes"], + "temperature": 0.1, + } + else: + cfg = OmegaConf.load(SEARCH_CONFIG_PATH) + cfg["query_matcher"]["model_id"] = model_id + cfg["query_matcher"]["API_BASE"] = os.path.join(vllm_endpoint, "v1/completions") + query_matcher = LogitsEstimatorJSON(**cfg["query_matcher"]) semaphore = asyncio.Semaphore(200) async def limited_compute_score(query_matcher, user_input, issue): @@ -219,9 +249,9 @@ async def limited_compute_score(query_matcher, user_input, issue): # Maximum less than 0.6, we don't use query search. 
if match_scores[0][1] < 0.6: - return top1_issue, sub_questionss_result + return top1_issue, sub_questions_result top1_issue = match_scores[0][0] - for key, value in maintenance_data.items(): - if key == top1_issue: - sub_questionss_result = value - return top1_issue, sub_questionss_result + for i in range(len(maintenance_data)): + if maintenance_data[i]["question"] == top1_issue: + sub_questions_result = "\n".join(maintenance_data[i]["content"]) + return top1_issue, sub_questions_result diff --git a/EdgeCraftRAG/edgecraftrag/components/retriever.py b/EdgeCraftRAG/edgecraftrag/components/retriever.py index fa8553346a..cdd3fe0bc2 100644 --- a/EdgeCraftRAG/edgecraftrag/components/retriever.py +++ b/EdgeCraftRAG/edgecraftrag/components/retriever.py @@ -1,14 +1,19 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 -from typing import Any, List, cast +import warnings +from typing import Any, List, Optional, cast +import requests from edgecraftrag.base import BaseComponent, CompType, RetrieverType +from langchain_milvus import Milvus +from langchain_openai import OpenAIEmbeddings from llama_index.core.indices.vector_store.retrievers import VectorIndexRetriever from llama_index.core.retrievers import AutoMergingRetriever -from llama_index.core.schema import BaseNode +from llama_index.core.schema import BaseNode, Document, NodeWithScore from llama_index.retrievers.bm25 import BM25Retriever from pydantic import model_serializer +from pymilvus import Collection, MilvusException, connections, utility class VectorSimRetriever(BaseComponent, VectorIndexRetriever): @@ -39,6 +44,8 @@ def __init__(self, indexer, **kwargs): def run(self, **kwargs) -> Any: for k, v in kwargs.items(): if k == "query": + top_k = kwargs["top_k"] if kwargs["top_k"] else self.topk + self.similarity_top_k = top_k return self.retrieve(v) return None @@ -75,8 +82,9 @@ def __init__(self, indexer, **kwargs): def run(self, **kwargs) -> Any: for k, v in kwargs.items(): if k == "query": + top_k = kwargs["top_k"] if kwargs["top_k"] else self.topk # vector_retriever needs to be updated - self._vector_retriever = self._index.as_retriever(similarity_top_k=self.topk) + self._vector_retriever = self._index.as_retriever(similarity_top_k=top_k) return self.retrieve(v) return None @@ -108,8 +116,9 @@ def __init__(self, indexer, **kwargs): def run(self, **kwargs) -> Any: for k, v in kwargs.items(): if k == "query": + top_k = kwargs["top_k"] if kwargs["top_k"] else self.topk nodes = cast(List[BaseNode], list(self._docstore.docs.values())) - similarity_top_k = min(len(nodes), self.topk) + similarity_top_k = min(len(nodes), top_k) bm25_retr = BM25Retriever.from_defaults(nodes=nodes, similarity_top_k=similarity_top_k) return bm25_retr.retrieve(v) @@ -123,3 +132,139 @@ def ser_model(self): "retrieve_topk": self.topk, } return set + + +class KBadminRetriever(BaseComponent): + def __init__(self, indexer, **kwargs): + BaseComponent.__init__( + self, + comp_type=CompType.RETRIEVER, + comp_subtype=RetrieverType.KBADMIN_RETRIEVER, + ) + self.vector_db = None + self.collection_name = None + self.topk = kwargs.get("similarity_top_k", 30) + self.KBADMIN_MILVUS_URL = indexer.vector_url + self.CONNECTION_ARGS = {"uri": indexer.vector_url} + self.vector_field = "q_1024_vec" + self.text_field = "content_with_weight" + self.embedding_model_name = indexer.embed_model + self.embedding_url = indexer.kbadmin_embedding_url + "/v3" + self.embedding = OpenAIEmbeddings( + model=self.embedding_model_name, + api_key="unused", + 
base_url=self.embedding_url, + tiktoken_enabled=False, + embedding_ctx_length=510, + ) + + def config_kbadmin_milvus(self, knowledge_name): + collection_name = knowledge_name + if not kbs_rev_maps: + get_kbs_info(self.CONNECTION_ARGS) + collection_name = kbs_rev_maps[collection_name] + self.vector_db = Milvus( + self.embedding, + connection_args=self.CONNECTION_ARGS, + collection_name=collection_name, + vector_field=self.vector_field, + text_field=self.text_field, + enable_dynamic_field=True, + index_params={"index_type": "FLAT", "metric_type": "IP", "params": {}}, + ) + + def similarity_search_with_embedding(self, query: str, k) -> list[tuple[Document, float]]: + url = self.embedding_url + "/embeddings" + embedding_info = {"model": self.embedding_model_name, "input": query} + # Get embedding result from embedding service + response = requests.post(url, headers={"Content-Type": "application/json"}, json=embedding_info) + embedding_json = response.json() + embedding = embedding_json["data"][0]["embedding"] + docs_and_scores = self.vector_db.similarity_search_with_score_by_vector(embedding=embedding, k=k) + relevance_score_fn = self.vector_db._select_relevance_score_fn() + return [(doc, relevance_score_fn(score)) for doc, score in docs_and_scores] + + def run(self, **kwargs) -> Any: + query = kwargs["query"] + top_k = kwargs["top_k"] if kwargs["top_k"] else self.topk + # langchain retrieval + docs_and_similarities = self.similarity_search_with_embedding(query=query, k=top_k) + node_with_scores: List[NodeWithScore] = [] + for doc, similarity in docs_and_similarities: + score: Optional[float] = None + if similarity is not None: + score = similarity + # convert langchain store format into llamaindex + node = Document.from_langchain_format(doc) + node_with_scores.append(NodeWithScore(node=node, score=score)) + return node_with_scores + + @model_serializer + def ser_model(self): + set = {"idx": self.idx, "retriever_type": self.comp_subtype, "CONNECTION_ARGS": self.CONNECTION_ARGS} + return set + + +# global kbs maps. 
+global kbs_rev_maps +kbs_rev_maps = {} + + +def get_kbs_info(CONNECTION_ARGS): + alias = "default" + try: + connections.connect("default", **CONNECTION_ARGS) + collections = utility.list_collections() + all_kb_infos = {} + new_infos = {} + for kb in collections: + collection = Collection(kb) + collection.load() + try: + if any(field.name == "kb_id" for field in collection.schema.fields): + docs = collection.query( + expr="pk != 0", + output_fields=["kb_name", "kb_id", "docnm_kwd"], + timeout=10, + ) + else: + docs = collection.query( + expr="pk != 0", + output_fields=["filename"], + timeout=10, + ) + collection.release() + except MilvusException as e: + continue + this_kbinfo = {} + for doc in docs: + try: + if "kb_name" in doc: + if not this_kbinfo: + this_kbinfo["name"] = doc["kb_name"] + this_kbinfo["uuid"] = doc["kb_id"] + this_kbinfo["files"] = set([doc["docnm_kwd"]]) + else: + this_kbinfo["files"].add(doc["docnm_kwd"]) + else: + if not this_kbinfo: + this_kbinfo["name"] = kb + this_kbinfo["uuid"] = "" + this_kbinfo["files"] = set([doc["filename"]]) + else: + this_kbinfo["files"].add(doc["filename"]) + except KeyError: + this_kbinfo = None + break + if this_kbinfo: + unique_files = list(this_kbinfo["files"]) + this_kbinfo["files"] = unique_files + new_infos[kb] = this_kbinfo + all_kb_infos.update(new_infos) + kbs_rev_maps.clear() + for kb_id in all_kb_infos: + kbs_rev_maps[all_kb_infos[kb_id]["name"]] = kb_id + return kbs_rev_maps + finally: + if connections.has_connection(alias): + connections.disconnect(alias) diff --git a/EdgeCraftRAG/edgecraftrag/components/session.py b/EdgeCraftRAG/edgecraftrag/components/session.py new file mode 100644 index 0000000000..65b1aeb4fd --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/components/session.py @@ -0,0 +1,75 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +from datetime import datetime +from typing import Any, Dict, List, Optional + +from edgecraftrag.base import BaseComponent, CompType +from pydantic import model_serializer + + +class Session(BaseComponent): + def __init__(self, session_id: str): + super().__init__(comp_type=CompType.SESSION) + self.session_id = session_id + self.messages: List[Dict[str, str]] = [] + self.created_at: datetime = datetime.now() + self.current_messages: Optional[Dict[str, str]] = None + + def add_message(self, role: str, content: str) -> None: + if role not in ("user", "assistant"): + raise ValueError("Role should be 'user' or 'assistant'") + self.messages.append({"role": role, "content": content}) + self.current_messages = None + + def get_messages(self) -> List[Dict[str, str]]: + return self.messages.copy() + + def clear_messages(self) -> None: + self.messages = [] + + def get_user_message_titel(self) -> Optional[str]: + for msg in self.messages: + if msg["role"] == "user": + return msg["content"] + return None + + def to_dict(self) -> Dict[str, Any]: + concat_messages = self.messages.copy() + if self.current_messages: + concat_messages.append(self.current_messages) + return { + "session_id": self.session_id, + "created_at": self.created_at.isoformat(), + "messages": concat_messages, + "idx": self.idx, + } + + def update_current_message(self, role: str, content: str) -> None: + self.current_messages = {"role": role, "content": content} + + @classmethod + def from_dict(cls, data: Dict[str, Any]) -> "Session": + session_id = data.get("session_id", f"session_{data.get('idx', 'unknown')}") + session = cls(session_id) + session.idx = data.get("idx", session.idx) + 
created_at_str = data.get("created_at") + session.created_at = datetime.fromisoformat(created_at_str) if created_at_str else datetime.now() + for item in data.get("messages", []): + if isinstance(item, dict) and "role" in item and "content" in item: + role = item["role"] + content = item["content"] + if role in ("user", "assistant") and isinstance(content, str): + session.add_message(role, content) + return session + + def run(self, **kwargs) -> Any: + pass + + @model_serializer + def ser_model(self): + return { + "session_id": self.session_id, + "created_at": self.created_at.isoformat(), + "messages": self.messages, + } diff --git a/EdgeCraftRAG/edgecraftrag/config_repository.py b/EdgeCraftRAG/edgecraftrag/config_repository.py new file mode 100644 index 0000000000..761297f4f7 --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/config_repository.py @@ -0,0 +1,420 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +import json +import os +import time +from typing import Dict, List, Optional + +from edgecraftrag.env import AGENT_FILE, KNOWLEDGEBASE_FILE, PIPELINE_FILE +from pymilvus import ( + Collection, + CollectionSchema, + DataType, + FieldSchema, + connections, + utility, +) + + +class MilvusConfigRepository: + def __init__( + self, + Repo_config_name: Optional[str] = "pipeline_config", + vector_url: Optional[str] = None, + ): + self.vector_url = vector_url or os.getenv("METADATA_DATABASE_URL") + self.host, self.port = None, None + if self.vector_url: + host_port = self.vector_url.replace("http://", "").replace("https://", "") + if ":" in host_port: + self.host, self.port = host_port.split(":", 1) + self.collection_name = Repo_config_name + self.alias = Repo_config_name + self.collection = None + self.connected = False + + def _connect(self) -> None: + try: + connections.connect(host=self.host, port=self.port, alias=self.alias) + except Exception as e: + raise RuntimeError(f"Connect Milvus failed: {str(e)}") + + def _init_collection(self) -> Collection: + if not utility.has_collection(self.collection_name, using=self.alias): + fields = [ + FieldSchema( + name="idx", + dtype=DataType.VARCHAR, + max_length=100, + is_primary=True, + auto_id=False, + ), + FieldSchema(name="config_json", dtype=DataType.JSON), + FieldSchema(name="dummy_vector", dtype=DataType.FLOAT_VECTOR, dim=2), + ] + schema = CollectionSchema(fields, description="Config storage (idx as primary key)") + collection = Collection(self.collection_name, schema, using=self.alias) + collection.create_index("dummy_vector", {"index_type": "FLAT", "metric_type": "L2"}) + return collection + return Collection(self.collection_name, using=self.alias) + + @classmethod + def create_connection( + cls, + Repo_config_name: Optional[str] = "pipeline_config", + max_retries: Optional[int] = 10, + vector_url: Optional[str] = None, + ): + instance = cls(Repo_config_name, vector_url) + retry_interval = 6 + if instance.host: + for retry in range(max_retries): + try: + instance._connect() + instance.collection = instance._init_collection() + instance.collection.load() + instance.connected = True + return instance + except Exception as e: + print(f"Attempt {retry + 1} failed: {str(e)}") + if retry < max_retries - 1: + time.sleep(retry_interval) + raise ConnectionError(f"Max retries ({max_retries}) reached") + return None + + def save_configs(self, configs: List[Dict]) -> None: + self.collection.delete("idx != ''") + insert_data = [] + for config in configs: + insert_data.append( + { + "idx": config["idx"], + "config_json": 
config, + "dummy_vector": [0.0, 0.0], + } + ) + if insert_data: + idx_list = [i["idx"] for i in insert_data] + configs_list = [i["config_json"] for i in insert_data] + vectors = [i["dummy_vector"] for i in insert_data] + self.collection.insert([idx_list, configs_list, vectors]) + self.collection.flush() + else: + print("No data to insert") + + def get_configs(self, idx: Optional[str] = None, output_fields: Optional[list] = None) -> List[Dict]: + try: + self.collection.load() + output_fields = output_fields or ["idx", "config_json"] + if idx: + expr = f'idx == "{idx}"' + else: + expr = "idx != ''" + results = self.collection.query(expr=expr, output_fields=output_fields) + return results + except Exception as e: + print(f"Read error: {e}") + return [] + + def add_config_by_idx(self, idx: str, config_json: Dict) -> bool: + if not self.connected or not self.collection: + raise RuntimeError("Not connected to Milvus") + try: + self.collection.load() + self.collection.insert([[idx], [config_json], [[0.0, 0.0]]]) + return True + except Exception as e: + print(f"Add failed: {e}") + return False + + def delete_config_by_idx(self, idx: str) -> int: + if not self.connected or not self.collection: + raise RuntimeError("Not connected to Milvus") + try: + self.collection.load() + res = self.collection.delete(f'idx == "{idx}"') + self.collection.flush() + return True + except Exception as e: + print(f"Delete failed: {e}") + return 0 + + def update_config_by_idx(self, idx: str, new_config_json: Dict) -> bool: + if not self.connected or not self.collection: + raise RuntimeError("Not connected to Milvus") + try: + self.collection.load() + upsert_data = [[idx], [new_config_json], [[0.0, 0.0]]] + self.collection.upsert(upsert_data) + return True + except Exception as e: + print(f"Upsert failed: {str(e)}") + return False + + def clear_all_config(self): + try: + self.collection.load() + res = self.collection.delete("idx != ''") + self.collection.flush() + return True + except Exception as e: + print(f"Clear all configs failed: {e}") + return False + + +class MilvusDocumentRecordRepository: + def __init__( + self, + repo_name: Optional[str] = "document_records", + vector_url: Optional[str] = None, + ): + if vector_url: + self.vector_url = vector_url + else: + self.vector_url = os.getenv("METADATA_DATABASE_URL") + self.host, self.port = None, None + if self.vector_url: + if self.vector_url.startswith(("http://", "https://")): + host_port = self.vector_url.replace("http://", "").replace("https://", "") + else: + host_port = self.vector_url + if ":" in host_port: + self.host, self.port = host_port.split(":", 1) + + self.collection_name = repo_name + self.alias = repo_name + self.collection = None + self.connected = False + + def _connect(self) -> None: + try: + connections.connect(host=self.host, port=self.port, alias=self.alias) + except Exception as e: + raise RuntimeError(f"Unable to connect to Milvus server: {str(e)}") + + def _init_collection(self) -> Collection: + if not utility.has_collection(self.collection_name, using=self.alias): + fields = [ + FieldSchema(name="id", dtype=DataType.INT64, is_primary=True, auto_id=True), + FieldSchema(name="file_id", dtype=DataType.VARCHAR, max_length=100), + FieldSchema(name="file_path", dtype=DataType.VARCHAR, max_length=512), + FieldSchema(name="doc_id", dtype=DataType.VARCHAR, max_length=100), + FieldSchema(name="metadata", dtype=DataType.JSON), + FieldSchema(name="dummy_vector", dtype=DataType.FLOAT_VECTOR, dim=2), + ] + schema = CollectionSchema(fields, 
description="File-Document association records (with metadata)") + collection = Collection(name=self.collection_name, schema=schema, using=self.alias) + index_params = {"index_type": "FLAT", "metric_type": "L2"} + collection.create_index(field_name="dummy_vector", index_params=index_params) + return collection + else: + return Collection(self.collection_name, using=self.alias) + + @classmethod + def create_connection( + cls, + repo_name: Optional[str] = "document_records", + max_retries: Optional[int] = 10, + vector_url: Optional[str] = None, + ): + instance = cls(repo_name, vector_url) + retry_interval = 6 + if instance.host: + for retry in range(max_retries): + try: + instance._connect() + instance.collection = instance._init_collection() + instance.collection.load() + instance.connected = True + return instance + except Exception as e: + print(f"Attempt {retry + 1} failed: {str(e)}") + if retry < max_retries - 1: + print(f"Retrying in {retry_interval}s...") + time.sleep(retry_interval) + raise ConnectionError(f"Max retries ({max_retries}) reached. Failed to connect to Milvus") + else: + return None + + def save_records(self, records: List[Dict[str, str]]) -> None: + if not records: + print("No records to save") + return + insert_data = [ + [rec["file_id"] for rec in records], + [rec["file_path"] for rec in records], + [rec["doc_id"] for rec in records], + [rec.get("metadata", {}) for rec in records], + [[0.0, 0.0] for _ in records], + ] + self.collection.insert(insert_data) + + def delete_records_by_file_id(self, file_id: str) -> List[str]: + expr = f'file_id == "{file_id}"' + results = self.collection.query(expr=expr, output_fields=["doc_id"]) + deleted_doc_ids = [res["doc_id"] for res in results] + + if deleted_doc_ids: + self.collection.delete(expr=expr) + return deleted_doc_ids + + def get_records_by_file_id(self, file_id: str) -> List[Dict]: + expr = f'file_id == "{file_id}"' + results = self.collection.query( + expr=expr, + output_fields=["id", "file_id", "file_path", "doc_id", "metadata"], + ) + return results + + +# Configuration of the persistence pipeline +pipeline_milvus_repo = MilvusConfigRepository.create_connection("pipeline_config", 20) + + +async def save_pipeline_configurations(operation: str = None, pipeline=None): + try: + json_str = pipeline.get_pipeline_json + target_data = json.loads(json_str) + target_data["idx"] = pipeline.idx + target_idx = target_data.get("idx") + if "generator" in target_data and operation != "delete": + target_data["generator"]["prompt_content"] = pipeline.generator.prompt_content + target_data["documents_cache"] = pipeline.documents_cache + target_data["active"] = pipeline.status.active + + if pipeline_milvus_repo: + if operation == "add": + success = pipeline_milvus_repo.add_config_by_idx(target_idx, target_data) + elif operation == "delete": + success = pipeline_milvus_repo.delete_config_by_idx(target_idx) + elif operation == "update": + success = pipeline_milvus_repo.update_config_by_idx(target_idx, target_data) + if not success: + return False + return True + else: + existing_pipelines = [] + if os.path.exists(PIPELINE_FILE): + with open(PIPELINE_FILE, "r", encoding="utf-8") as f: + existing_pipelines = json.load(f) + if not isinstance(existing_pipelines, list): + existing_pipelines = [] + + if operation == "add": + if any(p.get("idx") == target_idx for p in existing_pipelines): + return {"message": "Pipeline already exists"} + existing_pipelines.append(target_data) + elif operation == "delete": + existing_pipelines = [p for p in 
existing_pipelines if p.get("idx") != target_idx] + elif operation == "update": + for i in range(len(existing_pipelines)): + if existing_pipelines[i].get("idx") == target_idx: + existing_pipelines[i] = target_data + else: + return {"message": f"Invalid operation: {operation}"} + with open(PIPELINE_FILE, "w", encoding="utf-8") as f: + json.dump(existing_pipelines, f, indent=2, ensure_ascii=False) + return True + except Exception as e: + print(f"Error saving pipelines: {e}") + + +# Configuration of knowledge base for persistence +knowledgebase_config_repo = MilvusConfigRepository.create_connection("knowledgebase_config", 1) + + +async def save_knowledge_configurations(operation: str = None, kb=None): + try: + if not kb: + return {"message": "Missing knowledgebase data"} + target_kb = { + "idx": kb.idx, + "name": kb.name, + "description": kb.description, + "active": kb.active, + "file_paths": kb.file_paths, + "comp_type": kb.comp_type, + "comp_subtype": kb.comp_subtype, + "experience_active": kb.experience_active, + "all_document_maps": kb.all_document_maps, + } + target_idx = target_kb.get("idx") + if not target_idx: + return {"message": "Missing 'idx' in knowledgebase data"} + + if knowledgebase_config_repo: + if operation == "add": + success = knowledgebase_config_repo.add_config_by_idx(target_idx, target_kb) + elif operation == "delete": + success = knowledgebase_config_repo.delete_config_by_idx(target_idx) + elif operation == "update": + success = knowledgebase_config_repo.update_config_by_idx(target_idx, target_kb) + else: + return {"message": f"Invalid operation: {operation}"} + return success + else: + existing_kbs = [] + if os.path.exists(KNOWLEDGEBASE_FILE): + with open(KNOWLEDGEBASE_FILE, "r", encoding="utf-8") as f: + existing_kbs = json.load(f) + if not isinstance(existing_kbs, list): + existing_kbs = [] + if operation == "add": + existing_kbs.append(target_kb) + elif operation == "delete": + existing_kbs = [item for item in existing_kbs if item.get("idx") != target_idx] + elif operation == "update": + for i in range(len(existing_kbs)): + if existing_kbs[i].get("idx") == target_idx: + existing_kbs[i] = target_kb + else: + return {"message": f"Invalid operation: {operation}"} + with open(KNOWLEDGEBASE_FILE, "w", encoding="utf-8") as f: + json.dump(existing_kbs, f, indent=2, ensure_ascii=False) + return True + except Exception as e: + print(f"Error saving Knowledge base: {e}") + + +# Configuration of the persistence agent +agent_milvus_repo = MilvusConfigRepository.create_connection("agent_config", 1) + + +async def save_agent_configurations(operation: str = None, agents=None): + try: + if agent_milvus_repo: + if not agents: + return False + for agent in agents.values(): + target_data = agent.model_dump(mode="json") + if operation == "delete": + success = agent_milvus_repo.delete_config_by_idx(agent.idx) + if not success: + return False + continue + + target_idx = target_data.get("idx") + if not target_idx: + return {"message": "Missing 'idx' in data"} + + if operation == "add": + success = agent_milvus_repo.add_config_by_idx(target_idx, target_data) + + elif operation == "update": + success = agent_milvus_repo.update_config_by_idx(target_idx, target_data) + + if not success: + return False + return True + else: + if not agents: + return False + agent_list = [] + for agent in agents.values(): + agent_list.append(agent.model_dump(mode="json")) + json_str = json.dumps(agent_list, indent=2, ensure_ascii=False) + with open(AGENT_FILE, "w", encoding="utf-8") as f: + f.write(json_str) + 
except Exception as e: + print(f"Error saving agents: {e}") diff --git a/EdgeCraftRAG/edgecraftrag/context.py b/EdgeCraftRAG/edgecraftrag/context.py index 4d013b9bd2..94a5d91c40 100644 --- a/EdgeCraftRAG/edgecraftrag/context.py +++ b/EdgeCraftRAG/edgecraftrag/context.py @@ -1,12 +1,20 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 -from edgecraftrag.controllers.compmgr import GeneratorMgr, IndexerMgr, NodeParserMgr, PostProcessorMgr, RetrieverMgr +from edgecraftrag.controllers.agentmgr import AgentManager +from edgecraftrag.controllers.compmgr import ( + GeneratorMgr, + IndexerMgr, + NodeParserMgr, + PostProcessorMgr, + RetrieverMgr, +) from edgecraftrag.controllers.filemgr import FilelMgr from edgecraftrag.controllers.knowledge_basemgr import KnowledgeManager from edgecraftrag.controllers.modelmgr import ModelMgr from edgecraftrag.controllers.nodemgr import NodeMgr from edgecraftrag.controllers.pipelinemgr import PipelineMgr +from edgecraftrag.controllers.sessionmgr import SessionManager class Context: @@ -22,6 +30,8 @@ def __init__(self): self.genmgr = GeneratorMgr() self.filemgr = FilelMgr() self.knowledgemgr = KnowledgeManager() + self.agentmgr = AgentManager(self.plmgr) + self.sessionmgr = SessionManager() def get_pipeline_mgr(self): return self.plmgr @@ -53,5 +63,11 @@ def get_file_mgr(self): def get_knowledge_mgr(self): return self.knowledgemgr + def get_agent_mgr(self): + return self.agentmgr + + def get_session_mgr(self): + return self.sessionmgr + ctx = Context() diff --git a/EdgeCraftRAG/edgecraftrag/controllers/agentmgr.py b/EdgeCraftRAG/edgecraftrag/controllers/agentmgr.py new file mode 100644 index 0000000000..db03dab3fd --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/controllers/agentmgr.py @@ -0,0 +1,117 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +from typing import Any, Dict, Optional + +from comps.cores.proto.api_protocol import ChatCompletionRequest +from edgecraftrag.api_schema import AgentCreateIn +from edgecraftrag.base import AgentType, BaseMgr, CallbackType +from edgecraftrag.components.agent import Agent +from edgecraftrag.components.agents.deep_search.deep_search import DeepSearchAgent +from edgecraftrag.components.agents.simple import SimpleRAGAgent + + +class AgentManager(BaseMgr): + + active_agent_idx: Optional[str] = None + + def __init__(self, pipeline_mgr): + super().__init__() + self.active_agent_idx = None + self.agents = {} + self.pipeline_mgr = pipeline_mgr + + def set_manager(self, agent: Agent): + agent.manager = self + + def get_pipeline_by_name_or_id(self, name_or_id): + return self.pipeline_mgr.get_pipeline_by_name_or_id(name_or_id) + + def get_agents(self) -> Dict[str, Any]: + return self.agents + + def get_agent_by_id(self, idx): + return self.agents.get(idx, None) + + def get_agent_by_name(self, name): + for k, a in self.agents.items(): + if a.name == name: + return a + return None + + def get_agent_id_by_name(self, name): + for k, a in self.agents.items(): + if a.name == name: + return k + return None + + def create_agent(self, cfgs: AgentCreateIn): + new_agent = None + if not self.get_pipeline_by_name_or_id(cfgs.pipeline_idx): + return "Create Agent failed. Pipeline id not found." 
+ if cfgs.type == AgentType.SIMPLE: + new_agent = SimpleRAGAgent(cfgs.idx, cfgs.name, cfgs.pipeline_idx, cfgs.configs) + elif cfgs.type == AgentType.DEEPSEARCH: + new_agent = DeepSearchAgent(cfgs.idx, cfgs.name, cfgs.pipeline_idx, cfgs.configs) + if new_agent is not None: + self.set_manager(new_agent) + self.agents[new_agent.idx] = new_agent + if cfgs.active: + self.active_agent_idx = new_agent.idx + return new_agent + else: + return "Create Agent failed." + + def update_agent(self, name, cfgs: AgentCreateIn): + idx = self.get_agent_id_by_name(name) + if idx: + agent = self.get_agent_by_id(idx) + if cfgs.configs: + agent.update(cfgs.configs) + if cfgs.active: + return self.activate_agent(idx) + else: + return self.deactivate_agent(idx) + return True + else: + return False + + def remove_agent(self, name): + idx = self.get_agent_id_by_name(name) + if self.agents.pop(idx, None): + return True + return False + + def activate_agent(self, idx): + if idx in self.agents: + self.active_agent_idx = idx + return True + else: + return False + + def deactivate_agent(self, idx): + if idx in self.agents: + self.active_agent_idx = None + return True + else: + return False + + def get_active_agent_id(self): + return self.active_agent_idx + + def get_active_agent(self): + if self.active_agent_idx: + return self.agents[self.active_agent_idx] + else: + return None + + def get_agent_default_configs(self, agent_type): + if agent_type == AgentType.SIMPLE: + return SimpleRAGAgent.get_default_configs() + if agent_type == AgentType.DEEPSEARCH: + return DeepSearchAgent.get_default_configs() + + async def run_agent(self, chat_request: ChatCompletionRequest) -> Any: + active_agent = self.get_active_agent() + if active_agent is not None: + return await active_agent.run(cbtype=CallbackType.RUNAGENT, chat_request=chat_request) diff --git a/EdgeCraftRAG/edgecraftrag/controllers/compmgr.py b/EdgeCraftRAG/edgecraftrag/controllers/compmgr.py index b8dd82ab7b..4e5d93896a 100644 --- a/EdgeCraftRAG/edgecraftrag/controllers/compmgr.py +++ b/EdgeCraftRAG/edgecraftrag/controllers/compmgr.py @@ -43,6 +43,7 @@ def search_indexer(self, indin: IndexerIn) -> BaseComponent: (v.model.model_id_or_path == indin.embedding_model.model_id) or (v.model.model_id_or_path == indin.embedding_model.model_path) ) + and v.model.device == indin.embedding_model.device ): return v return None diff --git a/EdgeCraftRAG/edgecraftrag/controllers/knowledge_basemgr.py b/EdgeCraftRAG/edgecraftrag/controllers/knowledge_basemgr.py index dc69943eb2..233a2bd5bd 100644 --- a/EdgeCraftRAG/edgecraftrag/controllers/knowledge_basemgr.py +++ b/EdgeCraftRAG/edgecraftrag/controllers/knowledge_basemgr.py @@ -13,6 +13,7 @@ class KnowledgeManager(BaseMgr): def __init__(self): super().__init__() self.active_knowledge_idx: Optional[str] = None + self.active_experience_idx: Optional[str] = None def get_knowledge_base_by_name_or_id(self, name: str): for _, kb in self.components.items(): @@ -26,8 +27,17 @@ def get_active_knowledge_base(self) -> Optional[Knowledge]: else: return None + def get_active_experience(self): + if self.active_experience_idx: + return self.get_knowledge_base_by_name_or_id(self.active_experience_idx) + else: + return None + def active_knowledge(self, knowledge: KnowledgeBaseCreateIn): kb = self.get_knowledge_base_by_name_or_id(knowledge.name) + if kb.comp_type != "knowledge": + raise HTTPException(status_code=status.HTTP_409_CONFLICT, detail="Experience type cannot be active") + kb = self.get_knowledge_base_by_name_or_id(knowledge.name) 
self.active_knowledge_idx = kb.idx if knowledge.active else None for idx, comp in self.components.items(): @@ -35,16 +45,47 @@ def active_knowledge(self, knowledge: KnowledgeBaseCreateIn): comp.active = idx == self.active_knowledge_idx return kb + def active_experience(self, knowledge: KnowledgeBaseCreateIn): + kb = self.get_knowledge_base_by_name_or_id(knowledge.name) + if kb.comp_type != "experience": + raise HTTPException(status_code=status.HTTP_409_CONFLICT, detail="Knowledge type cannot be active") + self.active_experience_idx = kb.idx if knowledge.experience_active else None + if kb.experience_active != knowledge.experience_active: + for idx, comp in self.components.items(): + if isinstance(comp, Knowledge): + comp.experience_active = idx == self.active_experience_idx + return kb + def create_knowledge_base(self, knowledge: KnowledgeBaseCreateIn) -> Knowledge: for _, kb in self.components.items(): if kb.name == knowledge.name: raise HTTPException(status_code=status.HTTP_409_CONFLICT, detail="The knowledge base already exists.") + if knowledge.comp_type == "experience": + for idx, kb in self.components.items(): + if kb.comp_type == "experience": + raise HTTPException( + status_code=status.HTTP_409_CONFLICT, detail="Only one experience class can be created." + ) + if knowledge.comp_type == "experience": + knowledge.active = False if knowledge.active is None: knowledge.active = False - kb = Knowledge(name=knowledge.name, description=knowledge.description, active=knowledge.active) + kb = Knowledge( + idx=knowledge.idx, + name=knowledge.name, + description=knowledge.description, + active=knowledge.active, + comp_type=knowledge.comp_type, + comp_subtype=knowledge.comp_subtype, + experience_active=knowledge.experience_active, + all_document_maps=knowledge.all_document_maps, + file_paths=knowledge.file_paths, + ) self.add(kb) if knowledge.active: self.active_knowledge(knowledge) + if knowledge.experience_active: + self.active_experience(knowledge) return kb def delete_knowledge_base(self, name: str): @@ -54,12 +95,16 @@ def delete_knowledge_base(self, name: str): def update_knowledge_base(self, knowledge) -> Knowledge: kb = self.get_knowledge_base_by_name_or_id(knowledge.name) - - if knowledge.description is not None: - kb.description = knowledge.description - - if knowledge.active is not None and kb.active != knowledge.active: - kb = self.active_knowledge(knowledge) + if kb.comp_type == "knowledge": + if knowledge.description is not None: + kb.description = knowledge.description + if knowledge.active is not None and kb.active != knowledge.active: + kb = self.active_knowledge(knowledge) + if kb.comp_type == "experience": + if knowledge.description is not None: + kb.description = knowledge.description + if knowledge.experience_active is not None and kb.experience_active != knowledge.experience_active: + kb = self.active_experience(knowledge) return "Knowledge base update successfully" def get_all_knowledge_bases(self) -> List[Dict[str, Any]]: @@ -67,3 +112,8 @@ def get_all_knowledge_bases(self) -> List[Dict[str, Any]]: for idx, kb in self.components.items(): kb_list.append(kb) return kb_list + + def get_experience_kb(self): + for idx, kb in self.components.items(): + if kb.comp_type == "experience": + return kb diff --git a/EdgeCraftRAG/edgecraftrag/controllers/modelmgr.py b/EdgeCraftRAG/edgecraftrag/controllers/modelmgr.py index b2715c27fa..966632705e 100644 --- a/EdgeCraftRAG/edgecraftrag/controllers/modelmgr.py +++ b/EdgeCraftRAG/edgecraftrag/controllers/modelmgr.py @@ -7,6 +7,7 @@ from 
edgecraftrag.base import BaseComponent, BaseMgr, CompType, ModelType from edgecraftrag.components.model import ( BaseModelComponent, + OpenAIEmbeddingModel, OpenVINOEmbeddingModel, OpenVINOLLMModel, OpenVINORerankModel, @@ -92,6 +93,8 @@ def load_model(model_para: ModelIn): device=model_para.device, weight=model_para.weight, ) + case ModelType.VLLM_EMBEDDING: + model = OpenAIEmbeddingModel(model_id=model_para.model_id, api_base=model_para.api_base) case ModelType.LLM: model = OpenVINOLLMModel( model_id=model_para.model_id, diff --git a/EdgeCraftRAG/edgecraftrag/controllers/pipelinemgr.py b/EdgeCraftRAG/edgecraftrag/controllers/pipelinemgr.py index 81524a3754..d44a227325 100644 --- a/EdgeCraftRAG/edgecraftrag/controllers/pipelinemgr.py +++ b/EdgeCraftRAG/edgecraftrag/controllers/pipelinemgr.py @@ -19,8 +19,15 @@ def __init__(self): self._lock = asyncio.Lock() super().__init__() - def create_pipeline(self, name: str, origin_json: str): - pl = Pipeline(name, origin_json) + def create_pipeline(self, request, origin_json: str): + if isinstance(request, str): + name = request + idx, documents_cache = None, None + else: + name = request.name + idx = request.idx + documents_cache = request.documents_cache + pl = Pipeline(name, origin_json, idx, documents_cache) self.add(pl) return pl @@ -66,8 +73,8 @@ def activate_pipeline(self, name: str, active: bool, nm: NodeMgr, kb_name: None) return nodelist = None - if pl.node_changed: - nodelist = nm.get_nodes(pl.node_parser.idx) + # if pl.node_changed: + # nodelist = nm.get_nodes(pl.node_parser.idx) pl.check_active(nodelist, kb_name) prevactive = self._active_pipeline if prevactive: @@ -83,24 +90,38 @@ def notify_node_change(self): for _, pl in self.components.items(): pl.set_node_change() - def run_pipeline(self, chat_request: ChatCompletionRequest) -> Any: + async def run_pipeline(self, chat_request: ChatCompletionRequest) -> Any: + ap = self.get_active_pipeline() + if ap is not None: + return await ap.run(cbtype=CallbackType.PIPELINE, chat_request=chat_request) + return -1 + + async def run_retrieve_postprocess(self, chat_request: ChatCompletionRequest) -> Any: + ap = self.get_active_pipeline() + out = None + if ap is not None: + out = await ap.run(cbtype=CallbackType.RETRIEVE_POSTPROCESS, chat_request=chat_request) + return out + return -1 + + async def run_retrieve(self, chat_request: ChatCompletionRequest) -> Any: ap = self.get_active_pipeline() out = None if ap is not None: - out = ap.run(cbtype=CallbackType.PIPELINE, chat_request=chat_request) + out = await ap.run(cbtype=CallbackType.RETRIEVE, chat_request=chat_request) return out return -1 - def run_retrieve(self, chat_request: ChatCompletionRequest) -> Any: + async def run_postprocess(self, chat_request: ChatCompletionRequest, contexts) -> Any: ap = self.get_active_pipeline() out = None if ap is not None: - out = ap.run(cbtype=CallbackType.RETRIEVE, chat_request=chat_request) + out = await ap.run(cbtype=CallbackType.POSTPROCESS, chat_request=chat_request, contexts=contexts) return out return -1 - def run_data_prepare(self, docs: List[Document]) -> Any: + async def run_data_prepare(self, docs: List[Document]) -> Any: ap = self.get_active_pipeline() if ap is not None: - return ap.run(cbtype=CallbackType.DATAPREP, docs=docs) + return await ap.run(cbtype=CallbackType.DATAPREP, docs=docs) return -1 diff --git a/EdgeCraftRAG/edgecraftrag/controllers/sessionmgr.py b/EdgeCraftRAG/edgecraftrag/controllers/sessionmgr.py new file mode 100644 index 0000000000..53dac2bc04 --- /dev/null +++ 
b/EdgeCraftRAG/edgecraftrag/controllers/sessionmgr.py @@ -0,0 +1,180 @@ +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +import json +import os +from typing import Any, Dict, List, Optional + +from edgecraftrag.api_schema import SessionIn +from edgecraftrag.base import BaseMgr, InferenceType +from edgecraftrag.components.session import Session +from edgecraftrag.config_repository import MilvusConfigRepository +from edgecraftrag.env import SESSION_FILE + + +class SessionManager(BaseMgr): + def __init__(self): + super().__init__() + self._current_session_id: Optional[str] = None + self.session_file = SESSION_FILE + + self.milvus_repo = MilvusConfigRepository.create_connection(Repo_config_name="session_storage", max_retries=1) + self.components: Dict[str, Session] = {} + + if self.milvus_repo and self.milvus_repo.connected: + self._load_from_milvus() + else: + self.load_from_file() + + def set_current_session(self, session_id: str) -> None: + self._current_session_id = session_id if session_id and session_id not in ("None", "") else "default_session" + if self._current_session_id not in self.components: + new_session = Session(self._current_session_id) + self.add(new_session, name=self._current_session_id) + + def get_current_session(self) -> Optional[Session]: + if not self._current_session_id: + return None + return self.components.get(self._current_session_id) + + def create_session(self, session: SessionIn) -> str: + session_id = session.idx if session and session.idx else None + + if not session_id or session_id in ("", "None"): + # keep incrementing the suffix so the loop always terminates even if an id is already taken + next_id = len(self.components) + 1 + session_id = f"session_{next_id}" + while session_id in self.components: + next_id += 1 + session_id = f"session_{next_id}" + + if session_id in self.components: + raise ValueError(f"Session ID {session_id} already exists") + + new_session = Session(session_id) + self.add(new_session, name=session_id) + return session_id + + def add(self, session: Session, name: str) -> None: + self.components[name] = session + if self.milvus_repo and self.milvus_repo.connected: + self.milvus_repo.add_config_by_idx(name, session.to_dict()) + else: + self.save_to_file() + + def clear_current_history(self) -> None: + current_session = self.get_current_session() + if current_session: + current_session.clear_messages() + self._persist_session(current_session.idx) + + def save_current_message(self, sessionid: str, role: str, content: str) -> str: + current_session = self.get(sessionid) + if not current_session: + return "No current session set" + + try: + current_session.add_message(role, content) + self._persist_session(sessionid) + return "Message added successfully" + except ValueError as e: + return f"Failed to add message: {str(e)}" + + def update_current_message(self, sessionid: str, role: str, content: str) -> str: + current_session = self.get(sessionid) + if not current_session: + return "No current session set" + try: + current_session.update_current_message(role, content) + return "Message updated successfully" + except ValueError as e: + return f"Failed to update message: {str(e)}" + + def concat_history(self, sessionid: str, inference_type: str, user_message: str) -> str: + max_token = 6000 + if inference_type == InferenceType.VLLM: + vllm_max_len = int(os.getenv("MAX_MODEL_LEN", "10240")) + if vllm_max_len > 5000: + max_token = vllm_max_len - 1024 + + current_session = self.get(sessionid) + if not current_session: + return "" + history_messages = current_session.get_messages() + recent_str =
self.get_recent_chat_rounds(history_messages) + + self.save_current_message(sessionid, "user", user_message) + return recent_str[-max_token:] if len(recent_str) > max_token else recent_str + + def get_recent_chat_rounds(self, messages: List[Dict[str, str]]) -> str: + history_num = int(os.getenv("CHAT_HISTORY_ROUND", "0")) + if history_num <= 0: + return "" + total = len(messages) + start_idx = max(0, total - (history_num * 2)) + return str(messages[start_idx:]) + + def get_all_sessions(self): + return { + sid: session.get_user_message_titel() + for sid, session in reversed(self.components.items()) + if isinstance(session, Session) + } + + def get_session_by_id(self, session_id: str) -> Dict[str, Any]: + session = self.get(session_id) + if not session or not isinstance(session, Session): + return {"session_id": session_id, "exists": False} + return session.to_dict() + + def _persist_session(self, session_id: str): + session = self.components.get(session_id) + if not session: + return + + if self.milvus_repo and self.milvus_repo.connected: + self.milvus_repo.update_config_by_idx(session_id, session.to_dict()) + else: + self.save_to_file() + + def save_to_file(self) -> Dict[str, str]: + try: + os.makedirs(os.path.dirname(self.session_file), exist_ok=True) + data = {sid: session.to_dict() for sid, session in self.components.items() if isinstance(session, Session)} + with open(self.session_file, "w", encoding="utf-8") as f: + json.dump(data, f, indent=2, ensure_ascii=False) + return {"status": "success", "message": f"Saved to {self.session_file}"} + except Exception as e: + return {"status": "error", "message": f"Save failed: {str(e)}"} + + def load_from_file(self) -> Dict[str, str]: + try: + if not os.path.exists(self.session_file): + return {"status": "warning", "message": "Session file does not exist"} + with open(self.session_file, "r", encoding="utf-8") as f: + loaded_data = json.load(f) + if not isinstance(loaded_data, dict): + raise ValueError("Invalid session file format: expected dict") + + self.components.clear() + for session_id, session_data in loaded_data.items(): + session = Session.from_dict(session_data) + self.components[session_id] = session + return { + "status": "success", + "message": f"Loaded {len(self.components)} sessions from {self.session_file}", + } + except Exception as e: + return {"status": "error", "message": f"Load failed: {str(e)}"} + + def _load_from_milvus(self): + try: + milvus_sessions = self.milvus_repo.get_configs() + for item in milvus_sessions: + session_id = item.get("idx") + config_json = item.get("config_json", {}) + if session_id and isinstance(config_json, dict): + session = Session.from_dict(config_json) + self.components[session_id] = session + print(f"Loaded {len(self.components)} sessions from Milvus.") + except Exception as e: + print(f"Error loading sessions from Milvus: {str(e)}") diff --git a/EdgeCraftRAG/edgecraftrag/env.py b/EdgeCraftRAG/edgecraftrag/env.py new file mode 100644 index 0000000000..b5371278b1 --- /dev/null +++ b/EdgeCraftRAG/edgecraftrag/env.py @@ -0,0 +1,24 @@ +# Copyright (C) 2025 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +import os + +UI_DIRECTORY = os.getenv("TMPFILE_PATH", "/home/user/ui_cache") +# Define the root directory for knowledge base files +CONFIG_DIRECTORY = os.path.join(UI_DIRECTORY, "configs") +if not os.path.exists(CONFIG_DIRECTORY): + os.makedirs(CONFIG_DIRECTORY, exist_ok=True) + +IMG_OUTPUT_DIR = os.path.join(UI_DIRECTORY, "pic") +os.makedirs(IMG_OUTPUT_DIR, exist_ok=True) + 
+KNOWLEDGEBASE_FILE = os.path.join(CONFIG_DIRECTORY, "knowledgebase.json") +PIPELINE_FILE = os.path.join(CONFIG_DIRECTORY, "pipeline.json") +AGENT_FILE = os.path.join(CONFIG_DIRECTORY, "agent.json") + +EXPERIENCE_FILE = os.path.join(UI_DIRECTORY, "experience_dir/experience.json") +DOCUMENT_DATA_FILE = os.path.join(UI_DIRECTORY, "document_data.json") +SESSION_FILE = os.path.join(UI_DIRECTORY, "session.json") + +SEARCH_CONFIG_PATH = os.path.join(UI_DIRECTORY, "configs/search_config.yaml") +SEARCH_DIR = os.path.join(UI_DIRECTORY, "configs/experience_dir/experience.json") diff --git a/EdgeCraftRAG/edgecraftrag/requirements.txt b/EdgeCraftRAG/edgecraftrag/requirements.txt index 94cbef7b6c..6c4b7e4451 100644 --- a/EdgeCraftRAG/edgecraftrag/requirements.txt +++ b/EdgeCraftRAG/edgecraftrag/requirements.txt @@ -2,8 +2,12 @@ docx2txt EbookLib>=0.18 faiss-cpu>=1.8.0.post1 html2text>=2025.4.15 -langchain-core==0.3.60 -llama-index==0.12.41 +json-repair==0.52.0 +langchain-core==0.3.80 +langchain-milvus +langchain-openai +langgraph==0.6.10 +llama-index==0.12.36 llama-index-core==0.12.37 llama-index-embeddings-openvino==0.5.2 llama-index-llms-openai==0.3.44 @@ -20,6 +24,10 @@ pillow>=10.4.0 py-cpuinfo>=9.0.0 pymilvus==2.5.10 python-docx==1.1.2 -unstructured==0.16.11 +torch==2.8.0+cpu +torchvision==0.23.0+cpu +transformers==4.53.3 +unstructured +unstructured[all-docs] unstructured[pdf] werkzeug==3.1.3 diff --git a/EdgeCraftRAG/edgecraftrag/server.py b/EdgeCraftRAG/edgecraftrag/server.py index a8117cf014..44b63c4d32 100644 --- a/EdgeCraftRAG/edgecraftrag/server.py +++ b/EdgeCraftRAG/edgecraftrag/server.py @@ -4,14 +4,16 @@ import os import uvicorn +from edgecraftrag.api.v1.agent import agent_app, restore_agent_configurations from edgecraftrag.api.v1.chatqna import chatqna_app from edgecraftrag.api.v1.data import data_app -from edgecraftrag.api.v1.knowledge_base import kb_app, load_knowledge_from_file +from edgecraftrag.api.v1.knowledge_base import kb_app, restore_knowledge_configurations from edgecraftrag.api.v1.model import model_app -from edgecraftrag.api.v1.pipeline import load_pipeline_from_file, pipeline_app +from edgecraftrag.api.v1.pipeline import pipeline_app, restore_pipeline_configurations from edgecraftrag.api.v1.prompt import prompt_app +from edgecraftrag.api.v1.session import session_app from edgecraftrag.api.v1.system import system_app -from edgecraftrag.utils import UI_DIRECTORY +from edgecraftrag.env import UI_DIRECTORY from fastapi import FastAPI from fastapi.middleware.cors import CORSMiddleware from fastapi.staticfiles import StaticFiles @@ -19,10 +21,14 @@ async def lifespan(app: FastAPI): - print("Restore pipeline configuration and knowledge base configuration...") - load_pipeline_from_file() - await load_knowledge_from_file() - yield + try: + print("Restore pipeline configuration and knowledge base configuration...") + await restore_pipeline_configurations() + await restore_knowledge_configurations() + await restore_agent_configurations() + yield + except Exception as e: + raise app = FastAPI(lifespan=lifespan) @@ -36,7 +42,17 @@ async def lifespan(app: FastAPI): ) -sub_apps = [data_app, model_app, pipeline_app, chatqna_app, system_app, prompt_app, kb_app] +sub_apps = [ + data_app, + model_app, + pipeline_app, + chatqna_app, + system_app, + prompt_app, + kb_app, + agent_app, + session_app, +] for sub_app in sub_apps: for route in sub_app.routes: app.router.routes.append(route) diff --git a/EdgeCraftRAG/edgecraftrag/utils.py b/EdgeCraftRAG/edgecraftrag/utils.py old mode 100755 new mode 
100644 index 18a43e5879..a4b06ebf97 --- a/EdgeCraftRAG/edgecraftrag/utils.py +++ b/EdgeCraftRAG/edgecraftrag/utils.py @@ -1,6 +1,7 @@ # Copyright (C) 2024 Intel Corporation # SPDX-License-Identifier: Apache-2.0 +import asyncio import io import os from pathlib import Path @@ -8,16 +9,12 @@ from docx.text.paragraph import Paragraph from edgecraftrag.base import InferenceType -from edgecraftrag.context import ctx +from edgecraftrag.env import IMG_OUTPUT_DIR from PIL import Image as Img from transformers import AutoTokenizer from unstructured.documents.elements import ElementMetadata, Image from unstructured.partition.docx import DocxPartitionerOptions -UI_DIRECTORY = os.getenv("TMPFILE_PATH", "/home/user/ui_cache") -IMG_OUTPUT_DIR = os.path.join(UI_DIRECTORY, "pic") -os.makedirs(IMG_OUTPUT_DIR, exist_ok=True) - DEFAULT_TEMPLATE = """You are an AI assistant. Your task is to learn from the following context. Then answer the user's question based on what you learned from the context but not your own knowledge. {context} @@ -44,15 +41,21 @@ def iter_elements(cls, paragraph: Paragraph, opts: DocxPartitionerOptions) -> It yield Image(text="IMAGE", metadata=element_metadata) -def get_prompt_template(model_id, prompt_content=None, template_path=None, enable_think=False): +def get_prompt_template(model_path, prompt_content=None, template_path=None, enable_think=False): if prompt_content is not None: template = prompt_content elif template_path is not None: - template = Path(template_path).read_text(encoding=None) + # Safely load the template only if it is inside /templates (or other safe root) + safe_root = "/templates" + normalized_path = os.path.normpath(os.path.join(safe_root, template_path)) + if not normalized_path.startswith(safe_root): + raise ValueError("Template path is outside of the allowed directory.") + if not os.path.exists(normalized_path): + raise FileNotFoundError("Template file does not exist.") + template = Path(normalized_path).read_text(encoding=None) else: template = DEFAULT_TEMPLATE - tokenizer = AutoTokenizer.from_pretrained(model_id) - model_id = model_id.split("/")[-1] + tokenizer = AutoTokenizer.from_pretrained(model_path) messages = [{"role": "system", "content": template}, {"role": "user", "content": "\n{input}\n"}] prompt_template = tokenizer.apply_chat_template( messages, @@ -60,10 +63,13 @@ def get_prompt_template(model_id, prompt_content=None, template_path=None, enabl add_generation_prompt=True, enable_thinking=enable_think, # Switches between thinking and non-thinking modes. Default is True. 
) - return prompt_template + return template, prompt_template def serialize_node_with_score(node_with_score): + # relationships is not serializable + # No need for this information right now + node_with_score.node.relationships = {} return { "node": node_with_score.node.__dict__, "score": node_with_score.score.item() if hasattr(node_with_score.score, "item") else node_with_score.score, @@ -74,74 +80,13 @@ def serialize_contexts(contexts): return {key: [serialize_node_with_score(node) for node in nodes] for key, nodes in contexts.items()} -def compare_mappings(new_dict, old_dict): - added_files = {} - deleted_files = {} - for key in set(new_dict) - set(old_dict): - added_files[key] = new_dict[key] - for key in set(old_dict) - set(new_dict): - deleted_files[key] = old_dict[key] - for key in set(new_dict) & set(old_dict): - new_files = new_dict[key] - old_files = old_dict[key] - added = {name: new_files[name] for name in set(new_files) - set(old_files)} - if added: - added_files[key] = added - deleted = {name: old_files[name] for name in set(old_files) - set(new_files)} - if deleted: - deleted_files[key] = deleted - - for key in list(added_files.keys()): - if key in deleted_files: - del added_files[key] - return added_files, deleted_files - - -_history_map = {} -_current_session_id: Optional[str] = None - - -def set_current_session(session_id: str) -> None: - global _current_session_id - _current_session_id = session_id if session_id not in (None, "", "None") else "default_session" - - -def get_current_session() -> Optional[str]: - return _current_session_id - - -def clear_history() -> None: - session_id = get_current_session() - if session_id in _history_map: - _history_map[session_id] = [] - - -def save_history(message: str) -> str: - session_id = get_current_session() - _history_map.setdefault(session_id, []).append(f"content: {message}") - return "History appended successfully" - - -def concat_history(message: str) -> str: - max_token = 6000 - active_pl = ctx.get_pipeline_mgr().get_active_pipeline() - if active_pl.generator.inference_type == InferenceType.VLLM: - vllm_max_len = int(os.getenv("MAX_MODEL_LEN", "5000")) - if vllm_max_len > 5000: - max_token = vllm_max_len - 1024 - - history_id = get_current_session() - history_id_list = _history_map.get(history_id, []) - str_message = get_recent_chat_rounds(history_id_list) - _history_map.setdefault(history_id, []).append(f"user: {message}") - return str_message[-max_token:] if len(str_message) > max_token else str_message +async def stream_generator(string: str): + for token in iter(string): + yield token + await asyncio.sleep(0) -def get_recent_chat_rounds(history_id_list: List[str]) -> str: - history_num = int(os.getenv("CHAT_HISTORY_ROUND", "0")) - actual_rounds = min(history_num, len(history_id_list) // 2) - if actual_rounds <= 0: - return "" - start_index = max(0, len(history_id_list) - (actual_rounds * 2 + 1)) - recent_history = history_id_list[start_index:] - return "".join(recent_history) +async def chain_async_generators(gen_list: List): + for stream in gen_list: + async for token in stream: + yield token diff --git a/EdgeCraftRAG/nginx/nginx-conf-generator.sh b/EdgeCraftRAG/nginx/nginx-conf-generator.sh deleted file mode 100644 index bd8e5b194c..0000000000 --- a/EdgeCraftRAG/nginx/nginx-conf-generator.sh +++ /dev/null @@ -1,68 +0,0 @@ -#!/bin/bash -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -# Check if the correct number of arguments is provided -if [ "$#" -ne 2 ]; then - echo "Usage: $0 DP_NUM 
output-file-path" - exit 1 -fi - -# Get the port number from the command line argument -PORT_NUM=$1 - -# Start generating the Nginx configuration -cat < $2 -worker_processes auto; -events { - worker_connections 1024; -} -http { - - upstream multi-arc-serving-container { -EOL - -# Generate the server lines -for ((i=0; i> $2 -done - -# Close the upstream block and the http block -cat <> $2 - } - include /etc/nginx/mime.types; - default_type application/octet-stream; - client_max_body_size 50M; - sendfile on; - - keepalive_timeout 65; - keepalive_requests 1000; - server { - listen 8086; - server_name _; - location / { - root /usr/share/nginx/html; - index index.html index.htm; - add_header Cache-Control "no-cache"; - try_files $uri $uri/ /index.html; - } - location /v1/completions { - proxy_pass http://multi-arc-serving-container/v1/completions; - proxy_http_version 1.1; - proxy_set_header Connection ""; - } - location /metrics { - proxy_pass http://multi-arc-serving-container/metrics; - proxy_http_version 1.1; - proxy_set_header Connection ""; - } - - location ~ /\. { - deny all; - } - } -} -EOL - -echo "Nginx configuration generated in nginx.conf" diff --git a/EdgeCraftRAG/tests/configs/test_pipeline_ipex_vllm.json b/EdgeCraftRAG/tests/configs/test_pipeline_ipex_vllm.json index 097309d7e2..cac241ec73 100644 --- a/EdgeCraftRAG/tests/configs/test_pipeline_ipex_vllm.json +++ b/EdgeCraftRAG/tests/configs/test_pipeline_ipex_vllm.json @@ -38,6 +38,7 @@ "device": "", "weight": "" }, + "generator_type": "chatqna", "prompt_path": "./default_prompt.txt", "vllm_endpoint": "" }, diff --git a/EdgeCraftRAG/tests/configs/test_pipeline_local_llm.json b/EdgeCraftRAG/tests/configs/test_pipeline_local_llm.json index 39ee2ef0f1..811e119690 100644 --- a/EdgeCraftRAG/tests/configs/test_pipeline_local_llm.json +++ b/EdgeCraftRAG/tests/configs/test_pipeline_local_llm.json @@ -37,6 +37,7 @@ "device": "auto", "weight": "INT4" }, + "generator_type": "chatqna", "prompt_path": "./default_prompt.txt", "inference_type": "local" }, diff --git a/EdgeCraftRAG/tests/test_compose_on_arc.sh b/EdgeCraftRAG/tests/test_compose_on_arc.sh index d8d0fbd0da..0e2148dc28 100755 --- a/EdgeCraftRAG/tests/test_compose_on_arc.sh +++ b/EdgeCraftRAG/tests/test_compose_on_arc.sh @@ -21,10 +21,11 @@ HOST_IP=$ip_address COMPOSE_FILE="compose.yaml" EC_RAG_SERVICE_PORT=16010 -MODEL_PATH="${HOME}/models" +export MODEL_PATH="${HOME}/models" # MODEL_PATH="$WORKPATH/models" DOC_PATH="$WORKPATH/tests" UI_UPLOAD_PATH="$WORKPATH/tests" +MAX_MODEL_LEN=5000 HF_ENDPOINT=https://hf-mirror.com diff --git a/EdgeCraftRAG/tests/test_compose_vllm_on_arc.sh b/EdgeCraftRAG/tests/test_compose_vllm_on_arc.sh index 192e18b67c..50f458ae8a 100755 --- a/EdgeCraftRAG/tests/test_compose_vllm_on_arc.sh +++ b/EdgeCraftRAG/tests/test_compose_vllm_on_arc.sh @@ -18,7 +18,7 @@ LOG_PATH="$WORKPATH/tests" ip_address=$(hostname -I | awk '{print $1}') HOST_IP=$ip_address -COMPOSE_FILE="compose_vllm.yaml" +COMPOSE_FILE="compose.yaml" EC_RAG_SERVICE_PORT=16010 MODEL_PATH="${HOME}/models" @@ -27,18 +27,12 @@ DOC_PATH="$WORKPATH/tests" UI_UPLOAD_PATH="$WORKPATH/tests" HF_ENDPOINT=https://hf-mirror.com -NGINX_PORT=8086 -NGINX_PORT_0=8100 -NGINX_PORT_1=8100 -VLLM_SERVICE_PORT_0=8100 +VLLM_SERVICE_PORT_A770=8086 TENSOR_PARALLEL_SIZE=1 -SELECTED_XPU_0=0 -vLLM_ENDPOINT="http://${HOST_IP}:${NGINX_PORT}" +vLLM_ENDPOINT="http://${HOST_IP}:${VLLM_SERVICE_PORT_A770}" LLM_MODEL="Qwen/Qwen3-8B" -LLM_MODEL_PATH="${HOME}/qwen/" -NGINX_CONFIG_PATH="$WORKPATH/nginx/nginx.conf" 
+LLM_MODEL_PATH="${MODEL_PATH}/${LLM_MODEL}" VLLM_IMAGE_TAG="0.8.3-b20" -DP_NUM=1 function build_docker_images() { opea_branch=${opea_branch:-"main"} @@ -61,17 +55,13 @@ function build_docker_images() { function start_services() { cd $WORKPATH/docker_compose/intel/gpu/arc source set_env.sh - # generate nginx config file according to container count - bash $WORKPATH/nginx/nginx-conf-generator.sh $DP_NUM $WORKPATH/nginx/nginx.conf - # generate yaml file according to container count - bash multi-arc-yaml-generator.sh $DP_NUM $COMPOSE_FILE # Start Docker Containers - docker compose -f $COMPOSE_FILE up -d > ${LOG_PATH}/start_services_with_compose.log + docker compose --profile a770 -f $COMPOSE_FILE up -d > ${LOG_PATH}/start_services_with_compose.log echo "ipex-llm-serving-xpu is booting, please wait." sleep 30s n=0 until [[ "$n" -ge 100 ]]; do - docker logs ipex-llm-serving-xpu-container-0 > ${LOG_PATH}/ipex-llm-serving-xpu-container.log 2>&1 + docker logs ipex-llm-serving-xpu-770 > ${LOG_PATH}/ipex-llm-serving-xpu-container.log 2>&1 if grep -q "Starting vLLM API server on http://0.0.0.0:" ${LOG_PATH}/ipex-llm-serving-xpu-container.log; then break fi @@ -129,7 +119,7 @@ function validate_rag() { "${HOST_IP}:${EC_RAG_SERVICE_PORT}/v1/chatqna" \ "1234567890" \ "query" \ - "ipex-llm-serving-xpu-container-0" \ + "ipex-llm-serving-xpu-770" \ '{"messages":"What is the test id?","max_tokens":5}' } @@ -139,12 +129,13 @@ function validate_megaservice() { "${HOST_IP}:16011/v1/chatqna" \ "1234567890" \ "query" \ - "ipex-llm-serving-xpu-container-0" \ + "ipex-llm-serving-xpu-770" \ '{"messages":"What is the test id?","max_tokens":5}' } function stop_docker() { cd $WORKPATH/docker_compose/intel/gpu/arc + export MODEL_PATH="${HOME}/models" docker compose -f $COMPOSE_FILE down } diff --git a/EdgeCraftRAG/tests/test_compose_vllm_on_arc_b60.sh b/EdgeCraftRAG/tests/test_compose_vllm_on_arc_b60.sh new file mode 100755 index 0000000000..0d443b391e --- /dev/null +++ b/EdgeCraftRAG/tests/test_compose_vllm_on_arc_b60.sh @@ -0,0 +1,174 @@ +#!/bin/bash +# Copyright (C) 2024 Intel Corporation +# SPDX-License-Identifier: Apache-2.0 + +set -e +source ./common.sh + +IMAGE_REPO=${IMAGE_REPO:-"opea"} +IMAGE_TAG=${IMAGE_TAG:-"latest"} +echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" +echo "TAG=IMAGE_TAG=${IMAGE_TAG}" +export REGISTRY=${IMAGE_REPO} +export TAG=${IMAGE_TAG} + +WORKPATH=$(dirname "$PWD") +LOG_PATH="$WORKPATH/tests" + +ip_address=$(hostname -I | awk '{print $1}') +HOST_IP=$ip_address + +COMPOSE_FILE="compose.yaml" +EC_RAG_SERVICE_PORT=16010 + +MODEL_PATH="${HOME}/models" +# MODEL_PATH="$WORKPATH/models" +DOC_PATH="$WORKPATH/tests" +UI_UPLOAD_PATH="$WORKPATH/tests" + +HF_ENDPOINT=https://hf-mirror.com +VLLM_SERVICE_PORT_B60=8086 +TP=1 +vLLM_ENDPOINT="http://${HOST_IP}:${VLLM_SERVICE_PORT_B60}" +LLM_MODEL="Qwen/Qwen3-8B" +VLLM_IMAGE_TAG="1.1-preview" +DP=1 +ZE_AFFINITY_MASK=1 + +function build_docker_images() { + opea_branch=${opea_branch:-"main"} + cd $WORKPATH/docker_image_build + git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git + pushd GenAIComps + echo "GenAIComps test commit is $(git rev-parse HEAD)" + docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . + popd && sleep 1s + + echo "Pull intel/llm-scaler-vllm image" + docker pull intel/llm-scaler-vllm:${VLLM_IMAGE_TAG} + + echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
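With the nginx balancer and its generator script removed, the A770 and B60 compose tests point vLLM_ENDPOINT straight at the serving container's port (8086). The sketch below is an illustrative smoke check against the OpenAI-compatible /v1/completions route that the deleted nginx config used to proxy; the host, model name, and request fields are assumptions drawn from the test scripts, not something this diff adds.

# Illustrative smoke check (not part of the diff): verify the vLLM serving
# container answers on the direct endpoint that replaces the nginx balancer.
# Host, port, and model name are assumptions; adjust to your deployment.
import json
import urllib.request

VLLM_ENDPOINT = "http://localhost:8086"   # ${HOST_IP}:${VLLM_SERVICE_PORT_A770}
MODEL = "Qwen/Qwen3-8B"                   # LLM_MODEL from the test script

payload = {
    "model": MODEL,
    "prompt": "What is the test id?",
    "max_tokens": 5,
}
req = urllib.request.Request(
    f"{VLLM_ENDPOINT}/v1/completions",
    data=json.dumps(payload).encode("utf-8"),
    headers={"Content-Type": "application/json"},
)
with urllib.request.urlopen(req, timeout=30) as resp:
    body = json.loads(resp.read())
    # An OpenAI-compatible server returns a "choices" list with the completion text.
    print(resp.status, body.get("choices", [{}])[0].get("text", ""))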
+ docker compose -f build.yaml build --no-cache > ${LOG_PATH}/docker_image_build.log + + docker images && sleep 1s +} + +function start_services() { + cd $WORKPATH/docker_compose/intel/gpu/arc + source set_env.sh + # Start Docker Containers + docker compose --profile b60 -f $COMPOSE_FILE up -d > ${LOG_PATH}/start_services_with_compose.log + echo "ipex-serving-xpu is booting, please wait." + sleep 30s + n=0 + until [[ "$n" -ge 100 ]]; do + docker logs ipex-serving-xpu-container > ${LOG_PATH}/ipex-serving-xpu-container.log 2>&1 + if grep -q "Starting vLLM API server" ${LOG_PATH}/ipex-serving-xpu-container.log; then + break + fi + sleep 6s + n=$((n+1)) + done +} + +function validate_services() { + local URL="$1" + local EXPECTED_RESULT="$2" + local SERVICE_NAME="$3" + local DOCKER_NAME="$4" + local INPUT_DATA="$5" + + echo "[ $SERVICE_NAME ] Validating $SERVICE_NAME service..." + local RESPONSE=$(curl -s -w "%{http_code}" -o ${LOG_PATH}/${SERVICE_NAME}.log -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") + while [ ! -f ${LOG_PATH}/${SERVICE_NAME}.log ]; do + sleep 1 + done + local HTTP_STATUS="${RESPONSE: -3}" + local CONTENT=$(cat ${LOG_PATH}/${SERVICE_NAME}.log) + + if [ "$HTTP_STATUS" -eq 200 ]; then + echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." + else + echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS" + docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log + exit 1 + fi + sleep 1s +} + +function validate_rag() { + cd $WORKPATH/tests + + # setup pipeline + validate_services \ + "${HOST_IP}:${EC_RAG_SERVICE_PORT}/v1/settings/pipelines" \ + "active" \ + "pipeline" \ + "edgecraftrag-server" \ + '@configs/test_pipeline_ipex_vllm.json' + + # add data + validate_services \ + "${HOST_IP}:${EC_RAG_SERVICE_PORT}/v1/data" \ + "Done" \ + "data" \ + "edgecraftrag-server" \ + '@configs/test_data.json' + + # query + validate_services \ + "${HOST_IP}:${EC_RAG_SERVICE_PORT}/v1/chatqna" \ + "1234567890" \ + "query" \ + "ipex-serving-xpu-container" \ + '{"messages":"What is the test id?","max_tokens":5}' +} + +function validate_megaservice() { + # Curl the Mega Service + validate_services \ + "${HOST_IP}:16011/v1/chatqna" \ + "1234567890" \ + "query" \ + "ipex-serving-xpu-container" \ + '{"messages":"What is the test id?","max_tokens":5}' +} + +function stop_docker() { + cd $WORKPATH/docker_compose/intel/gpu/arc + export MODEL_PATH="${HOME}/models" + docker compose -f $COMPOSE_FILE down +} + + +function main() { + mkdir -p $LOG_PATH + + echo "::group::stop_docker" + stop_docker + echo "::endgroup::" + + echo "::group::build_docker_images" + if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi + echo "::endgroup::" + + echo "::group::start_services" + start_services + echo "::endgroup::" + + echo "::group::validate_rag" + validate_rag + echo "::endgroup::" + + echo "::group::validate_megaservice" + validate_megaservice + echo "::endgroup::" + + echo "::group::stop_docker" + stop_docker + echo y | docker system prune + echo "::endgroup::" + +} + +main diff --git a/EdgeCraftRAG/tests/test_pipeline_ipex_vllm.json b/EdgeCraftRAG/tests/test_pipeline_ipex_vllm.json index 097309d7e2..cac241ec73 100644 --- a/EdgeCraftRAG/tests/test_pipeline_ipex_vllm.json +++ b/EdgeCraftRAG/tests/test_pipeline_ipex_vllm.json @@ -38,6 +38,7 @@ "device": "", "weight": "" }, + "generator_type": "chatqna", "prompt_path": "./default_prompt.txt", "vllm_endpoint": "" }, diff --git a/EdgeCraftRAG/tests/test_pipeline_local_llm.json 
b/EdgeCraftRAG/tests/test_pipeline_local_llm.json index 39ee2ef0f1..811e119690 100644 --- a/EdgeCraftRAG/tests/test_pipeline_local_llm.json +++ b/EdgeCraftRAG/tests/test_pipeline_local_llm.json @@ -37,6 +37,7 @@ "device": "auto", "weight": "INT4" }, + "generator_type": "chatqna", "prompt_path": "./default_prompt.txt", "inference_type": "local" }, diff --git a/EdgeCraftRAG/tools/quick_start.sh b/EdgeCraftRAG/tools/quick_start.sh index fdefa797f0..909e34dd43 100755 --- a/EdgeCraftRAG/tools/quick_start.sh +++ b/EdgeCraftRAG/tools/quick_start.sh @@ -5,6 +5,8 @@ set -e WORKPATH=$(dirname "$(pwd)") +ip_address=$(hostname -I | awk '{print $1}') +HOST_IP=$ip_address get_user_input() { local var_name=$1 @@ -21,7 +23,7 @@ get_enable_function() { } function start_vllm_services() { - COMPOSE_FILE="compose_vllm.yaml" + COMPOSE_FILE="compose.yaml" echo "stop former service..." docker compose -f $WORKPATH/docker_compose/intel/gpu/arc/$COMPOSE_FILE down @@ -32,7 +34,7 @@ function start_vllm_services() { MILVUS_ENABLED=$(get_enable_function "MILVUS DB(Enter 1 for enable)" "0") CHAT_HISTORY_ROUND=$(get_user_input "chat history round" "0") LLM_MODEL=$(get_user_input "your LLM model" "Qwen/Qwen3-8B") - MODEL_PATH=$(get_user_input "your model path" "${HOME}/models") + MODEL_PATH=$(get_user_input "your model path" "${PWD}/models") read -p "Have you prepare models in ${MODEL_PATH}:(yes/no) [yes]" user_input user_input=${user_input:-"yes"} @@ -61,18 +63,11 @@ function start_vllm_services() { sudo chown -R 1000:1000 ${HF_CACHE} HF_ENDPOINT=https://hf-mirror.com # vllm ENV - export NGINX_PORT=8086 - export vLLM_ENDPOINT="http://${HOST_IP}:${NGINX_PORT}" - TENSOR_PARALLEL_SIZE=$(get_user_input "your tp size" 1) - read -p "selected GPU [$(seq -s, 0 $((TENSOR_PARALLEL_SIZE - 1)))] " SELECTED_XPU_0; SELECTED_XPU_0=${SELECTED_XPU_0:-$(seq -s, 0 $((TENSOR_PARALLEL_SIZE - 1)))} - DP_NUM=$(get_user_input "DP number(how many containers to run vLLM)" 1) - for (( x=0; x ipex-llm-serving-xpu-container.log 2>&1 + if grep -q "Starting vLLM API server on http://0.0.0.0:" ipex-llm-serving-xpu-container.log; then + break + fi + sleep 6s + n=$((n+1)) + done + rm -rf ipex-llm-serving-xpu-container.log + echo "service launched, please visit UI at ${HOST_IP}:8082" +} + + +function quick_start_ov_services() { + COMPOSE_FILE="compose.yaml" + echo "stop former service..." + docker compose -f $WORKPATH/docker_compose/intel/gpu/arc/$COMPOSE_FILE down + + ip_address=$(hostname -I | awk '{print $1}') + export HOST_IP=${HOST_IP:-"${ip_address}"} + export DOC_PATH=${DOC_PATH:-"$WORKPATH/tests"} + export TMPFILE_PATH=${TMPFILE_PATH:-"$WORKPATH/tests"} + export MILVUS_ENABLED=${MILVUS_ENABLED:-1} + export CHAT_HISTORY_ROUND=${CHAT_HISTORY_ROUND:-"0"} + export LLM_MODEL=${LLM_MODEL:-"Qwen/Qwen3-8B"} + export MODEL_PATH=${MODEL_PATH:-"${PWD}/models"} + export VIDEOGROUPID=$(getent group video | cut -d: -f3) + export RENDERGROUPID=$(getent group render | cut -d: -f3) + export MAX_MODEL_LEN=5000 + + check_baai_folder + export HF_CACHE=${HF_CACHE:-"${HOME}/.cache"} + if [ ! -d "${HF_CACHE}" ]; then + mkdir -p "${HF_CACHE}" + echo "Created directory: ${HF_CACHE}" + fi + + sudo chown 1000:1000 "${MODEL_PATH}" "${DOC_PATH}" "${TMPFILE_PATH}" + sudo chown -R 1000:1000 "${HF_CACHE}" + export HF_ENDPOINT=${HF_ENDPOINT:-"https://hf-mirror.com"} + export no_proxy="localhost, 127.0.0.1, 192.168.1.1, ${HOST_IP}" + export CCL_DG2_USM=${CCL_DG2_USM:-0} + + echo "Starting service..." 
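Both the compose tests and quick_start.sh gate validation on the same readiness signal: poll docker logs until the serving container prints "Starting vLLM API server". A hedged Python equivalent of that wait loop is sketched below; the container name is taken from the A770 profile and the retry budget mirrors the scripts' 100 x 6-second loop, but the function itself is illustrative rather than part of the diff.

# Illustrative readiness wait (not part of the diff): poll docker logs until
# the vLLM API server reports that it is listening, as the test scripts do.
import subprocess
import sys
import time

CONTAINER = "ipex-llm-serving-xpu-770"   # container name from the A770 profile
MARKER = "Starting vLLM API server"


def wait_for_vllm(container: str, marker: str, retries: int = 100, delay: float = 6.0) -> bool:
    for _ in range(retries):
        logs = subprocess.run(
            ["docker", "logs", container],
            capture_output=True,
            text=True,
        )
        if marker in logs.stdout or marker in logs.stderr:
            return True
        time.sleep(delay)
    return False


if __name__ == "__main__":
    if not wait_for_vllm(CONTAINER, MARKER):
        sys.exit(f"{CONTAINER} did not report '{MARKER}' in time")
    print(f"{CONTAINER} is ready")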
+ docker compose -f "$WORKPATH/docker_compose/intel/gpu/arc/$COMPOSE_FILE" up -d +} + + +function start_vLLM_B60_services() { + COMPOSE_FILE="compose.yaml" + echo "stop former service..." + export MODEL_PATH=${MODEL_PATH:-"${PWD}/models"} + docker compose -f $WORKPATH/docker_compose/intel/gpu/arc/$COMPOSE_FILE down + + ip_address=$(hostname -I | awk '{print $1}') + HOST_IP=$(get_user_input "host ip" "${ip_address}") + DOC_PATH=$(get_user_input "DOC_PATH" "$WORKPATH/tests") + TMPFILE_PATH=$(get_user_input "TMPFILE_PATH" "$WORKPATH/tests") + MILVUS_ENABLED=$(get_enable_function "MILVUS DB(Enter 1 for enable)" "0") + CHAT_HISTORY_ROUND=$(get_user_input "chat history round" "0") + LLM_MODEL=$(get_user_input "your LLM model" "Qwen/Qwen3-8B") + MODEL_PATH=$(get_user_input "your model path" "${PWD}/models") + read -p "Have you prepare models in ${MODEL_PATH}:(yes/no) [yes]" user_input + user_input=${user_input:-"yes"} + + if [ "$user_input" == "yes" ]; then + # 模型文件路径请参考以下形式存放, llm为huggingface + # Indexer: ${MODEL_PATH}/BAAI/bge-small-en-v1.5 + # Reranker: ${MODEL_PATH}/BAAI/bge-reranker-large + # llm :${MODEL_PATH}/${LLM_MODEL} (从huggingface或modelscope下载的原始模型,而不是经过OpenVINO转换的模型!) + echo "you skipped model downloading, please make sure you have prepared all models under ${MODEL_PATH}" + else + echo "you have not prepare models, starting to download models into ${MODEL_PATH}..." + mkdir -p $MODEL_PATH + pip install --upgrade --upgrade-strategy eager "optimum[openvino]" + optimum-cli export openvino -m BAAI/bge-small-en-v1.5 ${MODEL_PATH}/BAAI/bge-small-en-v1.5 --task sentence-similarity + optimum-cli export openvino -m BAAI/bge-reranker-large ${MODEL_PATH}/BAAI/bge-reranker-large --task text-classification + pip install -U huggingface_hub + huggingface-cli download $LLM_MODEL --local-dir "${MODEL_PATH}/${LLM_MODEL}" + fi + echo "give permission to related path..." + sudo chown 1000:1000 ${MODEL_PATH} ${DOC_PATH} ${TMPFILE_PATH} + # vllm ENV + export VLLM_SERVICE_PORT_B60=8086 + export vLLM_ENDPOINT="http://${HOST_IP}:${VLLM_SERVICE_PORT_B60}" + read -p "DP number(how many containers to run B60_vLLM) [4] , press Enter to confirm, or type a new value:" DP; DP=${DP:-4} + read -p "Tensor parallel size(your tp size [1]), press Enter to confirm, or type a new value:" TP; TP=${TP:-1} + DTYPE=$(get_user_input "DTYPE (vLLM data type, e.g. float16/bfloat16)" "float16") + ZE_AFFINITY_MASK=$(get_user_input "ZE_AFFINITY_MASK (GPU affinity mask, multi-GPU use 0,1,2...)" "0,1,2,3") + ENFORCE_EAGER=$(get_user_input "ENFORCE_EAGER (enable eager execution, 1=enable/0=disable)" "1") + TRUST_REMOTE_CODE=$(get_user_input "TRUST_REMOTE_CODE (trust remote code for custom models, 1=enable/0=disable)" "1") + DISABLE_SLIDING_WINDOW=$(get_user_input "DISABLE_SLIDING_WINDOW (disable sliding window attention, 1=disable/0=enable)" "1") + GPU_MEMORY_UTIL=$(get_user_input "GPU_MEMORY_UTIL (GPU memory utilization, range 0.1-1.0)" "0.8") + NO_ENABLE_PREFIX_CACHING=$(get_user_input "NO_ENABLE_PREFIX_CACHING (disable prefix caching, 1=disable/0=enable)" "1") + MAX_NUM_BATCHED_TOKENS=$(get_user_input "MAX_NUM_BATCHED_TOKENS (max number of batched tokens)" "8192") + DISABLE_LOG_REQUESTS=$(get_user_input "DISABLE_LOG_REQUESTS (disable request logs, 1=disable/0=enable)" "1") + MAX_MODEL_LEN=$(get_user_input "MAX_MODEL_LEN (max model context length, e.g. 40000/10240)" "40000") + BLOCK_SIZE=$(get_user_input "BLOCK_SIZE (vLLM block size)" "64") + QUANTIZATION=$(get_user_input "QUANTIZATION (model quantization method, e.g. 
fp8/int4)" "fp8") + # export ENV + export HOST_IP=${HOST_IP:-"${ip_address}"} + export MODEL_PATH=${MODEL_PATH} + export DOC_PATH=${DOC_PATH} + export TMPFILE_PATH=${TMPFILE_PATH} + export LLM_MODEL=${LLM_MODEL} + export no_proxy="localhost, 127.0.0.1, 192.168.1.1, ${HOST_IP}" + export MILVUS_ENABLED=${MILVUS_ENABLED} + export CHAT_HISTORY_ROUND=${CHAT_HISTORY_ROUND} + export SELECTED_XPU_0=${SELECTED_XPU_0} + export VIDEOGROUPID=$(getent group video | cut -d: -f3) + export RENDERGROUPID=$(getent group render | cut -d: -f3) + # export vllm ENV + export DP=${DP} + export TP=${TP} + export DTYPE=${DTYPE} + export ZE_AFFINITY_MASK=${ZE_AFFINITY_MASK} + export ENFORCE_EAGER=${ENFORCE_EAGER} + export TRUST_REMOTE_CODE=${TRUST_REMOTE_CODE} + export DISABLE_SLIDING_WINDOW=${DISABLE_SLIDING_WINDOW} + export GPU_MEMORY_UTIL=${GPU_MEMORY_UTIL} + export NO_ENABLE_PREFIX_CACHING=${NO_ENABLE_PREFIX_CACHING} + export MAX_NUM_BATCHED_TOKENS=${MAX_NUM_BATCHED_TOKENS} + export DISABLE_LOG_REQUESTS=${DISABLE_LOG_REQUESTS} + export MAX_MODEL_LEN=${MAX_MODEL_LEN} + export BLOCK_SIZE=${BLOCK_SIZE} + export QUANTIZATION=${QUANTIZATION} + + # Start Docker Containers + docker compose --profile b60 -f $WORKPATH/docker_compose/intel/gpu/arc/$COMPOSE_FILE up -d + echo "ipex-llm-serving-xpu is booting, please wait..." + n=0 + until [[ "$n" -ge 100 ]]; do + docker logs ipex-llm-serving-xpu-container-0 > ipex-llm-serving-xpu-container.log 2>&1 + if grep -q "Starting vLLM API server on http://0.0.0.0:" ipex-llm-serving-xpu-container.log; then + break + fi + sleep 6s + n=$((n+1)) + done + rm -rf ipex-llm-serving-xpu-container.log + echo "service launched, please visit UI at ${HOST_IP}:8082" +} + + +function quick_start_vllm_B60_services() { + WORKPATH=$(dirname "$PWD") + COMPOSE_FILE="compose.yaml" + EC_RAG_SERVICE_PORT=16010 + docker compose -f $WORKPATH/docker_compose/intel/gpu/arc/$COMPOSE_FILE down + + ip_address=$(hostname -I | awk '{print $1}') + export HOST_IP=${HOST_IP:-"${ip_address}"} + export MODEL_PATH=${MODEL_PATH:-"${PWD}/models"} + export DOC_PATH=${DOC_PATH:-"$WORKPATH/tests"} + export TMPFILE_PATH=${TMPFILE_PATH:-"$WORKPATH/tests"} + export MILVUS_ENABLED=${MILVUS_ENABLED:-1} + export CHAT_HISTORY_ROUND=${CHAT_HISTORY_ROUND:-2} + export LLM_MODEL=${LLM_MODEL:-Qwen/Qwen3-8B} + export VIDEOGROUPID=$(getent group video | cut -d: -f3) + export RENDERGROUPID=$(getent group render | cut -d: -f3) + # export vllm ENV + export DP=${DP:-1} + export TP=${TP:-1} + export DTYPE=${DTYPE:-float16} + export ZE_AFFINITY_MASK=${ZE_AFFINITY_MASK:-0} + export ENFORCE_EAGER=${ENFORCE_EAGER:-1} + export TRUST_REMOTE_CODE=${TRUST_REMOTE_CODE:-1} + export DISABLE_SLIDING_WINDOW=${DISABLE_SLIDING_WINDOW:-1} + export GPU_MEMORY_UTIL=${GPU_MEMORY_UTIL:-0.8} + export NO_ENABLE_PREFIX_CACHING=${NO_ENABLE_PREFIX_CACHING:-1} + export MAX_NUM_BATCHED_TOKENS=${MAX_NUM_BATCHED_TOKENS:-8192} + export DISABLE_LOG_REQUESTS=${disable_LOG_REQUESTS:-1} + export MAX_MODEL_LEN=${MAX_MODEL_LEN:-40000} + export BLOCK_SIZE=${BLOCK_SIZE:-64} + export QUANTIZATION=${QUANTIZATION:-fp8} + + + check_baai_folder + export no_proxy="localhost, 127.0.0.1, 192.168.1.1, ${HOST_IP}" + sudo chown -R 1000:1000 ${MODEL_PATH} ${DOC_PATH} ${TMPFILE_PATH} + docker compose --profile b60 -f $WORKPATH/docker_compose/intel/gpu/arc/$COMPOSE_FILE up -d + echo "ipex-llm-serving-xpu is booting, please wait..." 
+ n=0 + until [[ "$n" -ge 100 ]]; do + docker logs ipex-llm-serving-xpu-container-0 > ipex-llm-serving-xpu-container.log 2>&1 + if grep -q "Starting vLLM API server on http://0.0.0.0:" ipex-llm-serving-xpu-container.log; then + break + fi + sleep 6s + n=$((n+1)) + done + rm -rf ipex-llm-serving-xpu-container.log + echo "service launched, please visit UI at ${HOST_IP}:8082" +} + + +function main { + if [[ $- == *i* ]]; then + read -p "Do you want to start vLLM or local OpenVINO services? (vLLM_A770/vLLM_B60/ov) [vLLM_A770]: " user_input + user_input=${user_input:-"vLLM_A770"} + if [[ "$user_input" == "vLLM_A770" ]]; then + start_vllm_services + elif [[ "$user_input" == "vLLM_B60" ]]; then + start_vLLM_B60_services + else + start_services + fi else - start_services + export COMPOSE_PROFILES=${COMPOSE_PROFILES:-""} + if [[ "$COMPOSE_PROFILES" == "vLLM_A770" || "$COMPOSE_PROFILES" == "vLLM" || "$COMPOSE_PROFILES" == "vllm_on_a770" ]]; then + quick_start_vllm_services + elif [[ "$COMPOSE_PROFILES" == "vLLM_B60" || "$COMPOSE_PROFILES" == "vLLM_b60" || "$COMPOSE_PROFILES" == "vllm_on_b60" ]]; then + quick_start_vllm_B60_services + else + quick_start_ov_services + fi fi } diff --git a/EdgeCraftRAG/ui/vue/.env.development b/EdgeCraftRAG/ui/vue/.env.development index d7ef344a8a..ea6834f8a0 100644 --- a/EdgeCraftRAG/ui/vue/.env.development +++ b/EdgeCraftRAG/ui/vue/.env.development @@ -2,5 +2,5 @@ ENV = development # Local Api -VITE_API_URL = http://10.67.106.238:16010/ -VITE_CHATBOT_URL = http://10.67.106.238:16011/ +VITE_API_URL = / +VITE_CHATBOT_URL = / diff --git a/EdgeCraftRAG/ui/vue/components.d.ts b/EdgeCraftRAG/ui/vue/components.d.ts index 7959bda79a..5103652b37 100644 --- a/EdgeCraftRAG/ui/vue/components.d.ts +++ b/EdgeCraftRAG/ui/vue/components.d.ts @@ -10,7 +10,7 @@ export {}; /* prettier-ignore */ declare module 'vue' { export interface GlobalComponents { - AAffix: typeof import('ant-design-vue/es')['Affix'] + AAutoComplete: typeof import('ant-design-vue/es')['AutoComplete'] AButton: typeof import('ant-design-vue/es')['Button'] ACheckbox: typeof import('ant-design-vue/es')['Checkbox'] ACheckboxGroup: typeof import('ant-design-vue/es')['CheckboxGroup'] @@ -29,6 +29,7 @@ declare module 'vue' { AImage: typeof import('ant-design-vue/es')['Image'] AInput: typeof import('ant-design-vue/es')['Input'] AInputNumber: typeof import('ant-design-vue/es')['InputNumber'] + AInputSearch: typeof import('ant-design-vue/es')['InputSearch'] ALayout: typeof import('ant-design-vue/es')['Layout'] ALayoutContent: typeof import('ant-design-vue/es')['LayoutContent'] ALayoutHeader: typeof import('ant-design-vue/es')['LayoutHeader'] @@ -45,13 +46,18 @@ declare module 'vue' { ASelectOption: typeof import('ant-design-vue/es')['SelectOption'] ASlider: typeof import('ant-design-vue/es')['Slider'] ASpace: typeof import('ant-design-vue/es')['Space'] + ASpin: typeof import('ant-design-vue/es')['Spin'] ASteps: typeof import('ant-design-vue/es')['Steps'] + ASwitch: typeof import('ant-design-vue/es')['Switch'] ATable: typeof import('ant-design-vue/es')['Table'] + ATabPane: typeof import('ant-design-vue/es')['TabPane'] + ATabs: typeof import('ant-design-vue/es')['Tabs'] ATag: typeof import('ant-design-vue/es')['Tag'] ATextarea: typeof import('ant-design-vue/es')['Textarea'] ATooltip: typeof import('ant-design-vue/es')['Tooltip'] AUploadDragger: typeof import('ant-design-vue/es')['UploadDragger'] FormTooltip: typeof import('./src/components/FormTooltip.vue')['default'] + PartialLoading: typeof 
import('./src/components/PartialLoading.vue')['default'] RouterLink: typeof import('vue-router')['RouterLink'] RouterView: typeof import('vue-router')['RouterView'] SvgIcon: typeof import('./src/components/SvgIcon.vue')['default'] diff --git a/EdgeCraftRAG/ui/vue/index.html b/EdgeCraftRAG/ui/vue/index.html index df137679ef..c871332d3c 100644 --- a/EdgeCraftRAG/ui/vue/index.html +++ b/EdgeCraftRAG/ui/vue/index.html @@ -9,6 +9,7 @@ + Edge Craft RAG based Q&A Chatbot diff --git a/EdgeCraftRAG/ui/vue/nginx.conf b/EdgeCraftRAG/ui/vue/nginx.conf index 6d9a233bf8..8b6701e78a 100644 --- a/EdgeCraftRAG/ui/vue/nginx.conf +++ b/EdgeCraftRAG/ui/vue/nginx.conf @@ -28,7 +28,7 @@ http { proxy_pass http://edgecraftrag-server:16010; proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for; proxy_http_version 1.1; - proxy_read_timeout 180s; + proxy_read_timeout 600s; proxy_set_header Connection ""; } diff --git a/EdgeCraftRAG/ui/vue/package.json b/EdgeCraftRAG/ui/vue/package.json index 516e870406..b11bf4d991 100644 --- a/EdgeCraftRAG/ui/vue/package.json +++ b/EdgeCraftRAG/ui/vue/package.json @@ -9,7 +9,6 @@ "preview": "vite preview" }, "dependencies": { - "@vueuse/i18n": "^4.0.0-beta.12", "ant-design-vue": "^4.0.0-rc.6", "axios": "^1.7.9", "clipboard": "^2.0.11", @@ -19,6 +18,7 @@ "highlight.js": "^11.11.1", "http": "^0.0.1-security", "js-cookie": "^3.0.5", + "jszip": "^3.10.1", "lodash": "^4.17.21", "marked": "^15.0.6", "mitt": "^3.0.1", diff --git a/EdgeCraftRAG/ui/vue/src/api/agent/index.ts b/EdgeCraftRAG/ui/vue/src/api/agent/index.ts new file mode 100644 index 0000000000..f4b27ed609 --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/api/agent/index.ts @@ -0,0 +1,55 @@ +// Copyright (C) 2025 Intel Corporation +// SPDX-License-Identifier: Apache-2.0 + +import request from "../request"; + +export const getAgentList = () => { + return request({ + url: "/v1/settings/agents", + method: "get", + }); +}; + +export const getAgentDetailByName = (name: String) => { + return request({ + url: `/v1/settings/agents/${name}`, + method: "get", + }); +}; +export const requestAgentCreate = (data: Object) => { + return request({ + url: "/v1/settings/agents", + method: "post", + data, + showLoading: true, + showSuccessMsg: true, + successMsg: "request.agent.createSucc", + }); +}; +export const requestAgentUpdate = (name: String, data: Object) => { + return request({ + url: `/v1/settings/agents/${name}`, + method: "patch", + data, + showLoading: true, + showSuccessMsg: true, + successMsg: "request.agent.updateSucc", + }); +}; + +export const requestAgentDelete = (name: String) => { + return request({ + url: `/v1/settings/agents/${name}`, + method: "delete", + showLoading: true, + showSuccessMsg: true, + successMsg: "request.agent.deleteSucc", + }); +}; + +export const getAgentConfigs = (type: String) => { + return request({ + url: `/v1/settings/agents/configs/${type}`, + method: "get", + }); +}; diff --git a/EdgeCraftRAG/ui/vue/src/api/chatbot/index.ts b/EdgeCraftRAG/ui/vue/src/api/chatbot/index.ts index f7946ad72d..0182bd6c16 100644 --- a/EdgeCraftRAG/ui/vue/src/api/chatbot/index.ts +++ b/EdgeCraftRAG/ui/vue/src/api/chatbot/index.ts @@ -21,9 +21,33 @@ export const requestChatbotConfig = (data: Object) => { }); }; -export const getBenchmark = (name: String) => { +export const getBenchmark = () => { return request({ - url: `/v1/settings/pipelines/${name}/benchmark`, + url: `/v1/settings/pipeline/benchmark`, method: "get", }); }; + +export const getHistorySessionList = () => { + return request({ + url: "/v1/sessions", + method: 
"get", + }); +}; + +export const getSessionDetailById = (SessionId: String) => { + return request({ + url: `v1/session/${SessionId}`, + method: "get", + }); +}; + +export const requestSessionDelete = (SessionId: String) => { + return request({ + url: `/v1/session/${SessionId}`, + method: "delete", + showLoading: true, + showSuccessMsg: true, + successMsg: "request.knowledge.deleteSucc", + }); +}; diff --git a/EdgeCraftRAG/ui/vue/src/api/knowledgeBase/index.ts b/EdgeCraftRAG/ui/vue/src/api/knowledgeBase/index.ts index bb7bc9a494..fe300d6b33 100644 --- a/EdgeCraftRAG/ui/vue/src/api/knowledgeBase/index.ts +++ b/EdgeCraftRAG/ui/vue/src/api/knowledgeBase/index.ts @@ -10,7 +10,7 @@ export const getKnowledgeBaseList = () => { }); }; -export const getKnowledgeBaseDetialByName = (kbName: String) => { +export const getKnowledgeBaseDetailByName = (kbName: String) => { return request({ url: `/v1/knowledge/${kbName}`, method: "get", @@ -54,15 +54,14 @@ export const requestKnowledgeBaseRelation = (kbName: String, data: Object) => { url: `/v1/knowledge/${kbName}/files`, method: "post", data, - showLoading: true, showSuccessMsg: true, successMsg: "request.knowledge.uploadSucc", }); }; -export const requestFileDelete = (kbName: String, data: Object) => { +export const requestFileDelete = (name: String, data: Object) => { return request({ - url: `/v1/knowledge/${kbName}/files`, + url: `/v1/knowledge/${name}/files`, method: "delete", data, showLoading: true, @@ -71,4 +70,86 @@ export const requestFileDelete = (kbName: String, data: Object) => { }); }; +export const getExperienceList = () => { + return request({ + url: "/v1/experiences", + method: "get", + }); +}; + +export const requestExperienceCreate = (data: EmptyArrayType) => { + return request({ + url: "/v1/multiple_experiences/check", + method: "post", + data, + showLoading: true, + }); +}; +export const requestExperienceConfirm = (flag: Boolean, data: EmptyArrayType) => { + return request({ + url: `/v1/multiple_experiences/confirm?flag=${flag}`, + method: "post", + data, + showLoading: true, + showSuccessMsg: true, + successMsg: "request.experience.createSucc", + }); +}; +export const getExperienceDetailByName = (data: Object) => { + return request({ + url: `/v1/experience`, + method: "post", + data, + }); +}; + +export const requestExperienceUpdate = (data: Object) => { + return request({ + url: `/v1/experiences`, + method: "patch", + data, + showLoading: true, + showSuccessMsg: true, + successMsg: "request.experience.updateSucc", + }); +}; + +export const requestExperienceDelete = (data: Object) => { + return request({ + url: `/v1/experiences`, + method: "delete", + data, + showLoading: true, + showSuccessMsg: true, + successMsg: "request.experience.deleteSucc", + }); +}; + +export const requestExperienceRelation = (data: Object) => { + return request({ + url: "/v1/experiences/files", + method: "post", + data, + showLoading: true, + showSuccessMsg: true, + successMsg: "experience.importSuccTip", + }); +}; + +export const getkbadminList = () => { + return request({ + url: "/v1/kbadmin/kbs_list", + method: "get", + }); +}; + +export const requestUploadFileUrl = (kbName: String, data: Object) => { + return request({ + url: `v1/data/file/${kbName}`, + method: "post", + data, + type: "files", + }); +}; + export const uploadFileUrl = `${import.meta.env.VITE_API_URL}v1/data/file/`; diff --git a/EdgeCraftRAG/ui/vue/src/api/pipeline/index.ts b/EdgeCraftRAG/ui/vue/src/api/pipeline/index.ts index fd06d1d3d8..0da1fc3015 100644 --- 
a/EdgeCraftRAG/ui/vue/src/api/pipeline/index.ts +++ b/EdgeCraftRAG/ui/vue/src/api/pipeline/index.ts @@ -14,7 +14,6 @@ export const getPipelineList = () => { return request({ url: "/v1/settings/pipelines", method: "get", - showLoading: true, }); }; @@ -75,10 +74,11 @@ export const getRunDevice = () => { }); }; -export const getModelList = (type: string) => { +export const getModelList = (type: string, params?: Object) => { return request({ url: `/v1/settings/avail-models/${type}`, method: "get", + params, }); }; diff --git a/EdgeCraftRAG/ui/vue/src/api/request.ts b/EdgeCraftRAG/ui/vue/src/api/request.ts index 91805dbab5..44f6cf2051 100644 --- a/EdgeCraftRAG/ui/vue/src/api/request.ts +++ b/EdgeCraftRAG/ui/vue/src/api/request.ts @@ -7,8 +7,6 @@ import axios, { AxiosInstance } from "axios"; import qs from "qs"; import i18n from "@/i18n"; -const antNotification = serviceManager.getService("antNotification"); - const service: AxiosInstance = axios.create({ baseURL: import.meta.env.VITE_API_URL, timeout: 600000, @@ -39,6 +37,8 @@ service.interceptors.response.use( if (NextLoading) NextLoading.done(); const res = response.data; if (config.showSuccessMsg) { + const antNotification = serviceManager.getService("antNotification"); + if (antNotification) antNotification("success", i18n.global.t("common.success"), i18n.global.t(config.successMsg)); } @@ -55,6 +55,7 @@ service.interceptors.response.use( } else { errorMessage = error.message; } + const antNotification = serviceManager.getService("antNotification"); if (antNotification) antNotification("error", i18n.global.t("common.error"), errorMessage); return Promise.reject(error); diff --git a/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.css b/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.css index dedd20b357..d5a513f8c4 100644 --- a/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.css +++ b/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.css @@ -1,9 +1,9 @@ @font-face { font-family: "iconfont"; /* Project id 4784207 */ src: - url("iconfont.woff2?t=1754038546130") format("woff2"), - url("iconfont.woff?t=1754038546130") format("woff"), - url("iconfont.ttf?t=1754038546130") format("truetype"); + url("iconfont.woff2?t=1762502048420") format("woff2"), + url("iconfont.woff?t=1762502048420") format("woff"), + url("iconfont.ttf?t=1762502048420") format("truetype"); } .iconfont { @@ -14,6 +14,58 @@ -moz-osx-font-smoothing: grayscale; } +.icon-simple-robot:before { + content: "\e604"; +} + +.icon-deep_search:before { + content: "\e620"; +} + +.icon-jiqiren-05:before { + content: "\ec1e"; +} + +.icon-recursive:before { + content: "\e61e"; +} + +.icon-simple:before { + content: "\e61f"; +} + +.icon-lujing:before { + content: "\e61d"; +} + +.icon-agent:before { + content: "\e62c"; +} + +.icon-pipeline:before { + content: "\e650"; +} + +.icon-skip1:before { + content: "\e67f"; +} + +.icon-annotation:before { + content: "\e62e"; +} + +.icon-groundtruth:before { + content: "\e9b7"; +} + +.icon-kb:before { + content: "\e639"; +} + +.icon-experience:before { + content: "\e68e"; +} + .icon-deep-think:before { content: "\e772"; } diff --git a/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.js b/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.js index f6731b5c1a..6c670f647f 100644 --- a/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.js +++ b/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.js @@ -2,12 +2,12 @@ // SPDX-License-Identifier: Apache-2.0 (window._iconfont_svg_string_4784207 = - ''), - ((h) => { + ''), + ((c) => { var l = (a = (a = 
document.getElementsByTagName("script"))[a.length - 1]).getAttribute("data-injectcss"), a = a.getAttribute("data-disable-injectsvg"); if (!a) { - var c, + var h, t, i, o, @@ -15,8 +15,8 @@ m = function (l, a) { a.parentNode.insertBefore(l, a); }; - if (l && !h.__iconfont__svg__cssinject__) { - h.__iconfont__svg__cssinject__ = !0; + if (l && !c.__iconfont__svg__cssinject__) { + c.__iconfont__svg__cssinject__ = !0; try { document.write( "", @@ -25,10 +25,10 @@ console && console.log(l); } } - (c = function () { + (h = function () { var l, a = document.createElement("div"); - (a.innerHTML = h._iconfont_svg_string_4784207), + (a.innerHTML = c._iconfont_svg_string_4784207), (a = a.getElementsByTagName("svg")[0]) && (a.setAttribute("aria-hidden", "true"), (a.style.position = "absolute"), @@ -40,29 +40,29 @@ }), document.addEventListener ? ~["complete", "loaded", "interactive"].indexOf(document.readyState) - ? setTimeout(c, 0) + ? setTimeout(h, 0) : ((t = function () { - document.removeEventListener("DOMContentLoaded", t, !1), c(); + document.removeEventListener("DOMContentLoaded", t, !1), h(); }), document.addEventListener("DOMContentLoaded", t, !1)) : document.attachEvent && - ((i = c), - (o = h.document), + ((i = h), + (o = c.document), (v = !1), - s(), + p(), (o.onreadystatechange = function () { - "complete" == o.readyState && ((o.onreadystatechange = null), e()); + "complete" == o.readyState && ((o.onreadystatechange = null), z()); })); } - function e() { + function z() { v || ((v = !0), i()); } - function s() { + function p() { try { o.documentElement.doScroll("left"); } catch (l) { - return void setTimeout(s, 50); + return void setTimeout(p, 50); } - e(); + z(); } })(window); diff --git a/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.json b/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.json index a8fea13f43..54eab718fe 100644 --- a/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.json +++ b/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.json @@ -5,6 +5,97 @@ "css_prefix_text": "icon-", "description": "", "glyphs": [ + { + "icon_id": "13542590", + "name": "simple-robot", + "font_class": "simple-robot", + "unicode": "e604", + "unicode_decimal": 58884 + }, + { + "icon_id": "14551080", + "name": "deep_search", + "font_class": "deep_search", + "unicode": "e620", + "unicode_decimal": 58912 + }, + { + "icon_id": "38847045", + "name": "机器人-05", + "font_class": "jiqiren-05", + "unicode": "ec1e", + "unicode_decimal": 60446 + }, + { + "icon_id": "46000445", + "name": "recursive", + "font_class": "recursive", + "unicode": "e61e", + "unicode_decimal": 58910 + }, + { + "icon_id": "46000444", + "name": "simple", + "font_class": "simple", + "unicode": "e61f", + "unicode_decimal": 58911 + }, + { + "icon_id": "45982435", + "name": "路径", + "font_class": "lujing", + "unicode": "e61d", + "unicode_decimal": 58909 + }, + { + "icon_id": "3638339", + "name": "agent", + "font_class": "agent", + "unicode": "e62c", + "unicode_decimal": 58924 + }, + { + "icon_id": "4772844", + "name": "Pipeline", + "font_class": "pipeline", + "unicode": "e650", + "unicode_decimal": 58960 + }, + { + "icon_id": "15838538", + "name": "skip", + "font_class": "skip1", + "unicode": "e67f", + "unicode_decimal": 59007 + }, + { + "icon_id": "12753474", + "name": "annotation", + "font_class": "annotation", + "unicode": "e62e", + "unicode_decimal": 58926 + }, + { + "icon_id": "33279726", + "name": "groundtruth", + "font_class": "groundtruth", + "unicode": "e9b7", + "unicode_decimal": 59831 + }, + { + "icon_id": "687788", + "name": 
"知识库", + "font_class": "kb", + "unicode": "e639", + "unicode_decimal": 58937 + }, + { + "icon_id": "5299955", + "name": "experience", + "font_class": "experience", + "unicode": "e68e", + "unicode_decimal": 59022 + }, { "icon_id": "44419262", "name": "deep-think", diff --git a/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.ttf b/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.ttf index d49803ef9c..8c90a44513 100644 Binary files a/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.ttf and b/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.ttf differ diff --git a/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.woff b/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.woff index e9b153a7f5..b18a749da0 100644 Binary files a/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.woff and b/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.woff differ diff --git a/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.woff2 b/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.woff2 index 1f66b46dff..75fdccb56d 100644 Binary files a/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.woff2 and b/EdgeCraftRAG/ui/vue/src/assets/iconFont/iconfont.woff2 differ diff --git a/EdgeCraftRAG/ui/vue/src/components.d.ts b/EdgeCraftRAG/ui/vue/src/components.d.ts index f79d1e1d69..35e756d199 100644 --- a/EdgeCraftRAG/ui/vue/src/components.d.ts +++ b/EdgeCraftRAG/ui/vue/src/components.d.ts @@ -10,11 +10,51 @@ export {}; /* prettier-ignore */ declare module 'vue' { export interface GlobalComponents { + AAffix: typeof import('ant-design-vue/es')['Affix'] AButton: typeof import('ant-design-vue/es')['Button'] + ACheckbox: typeof import('ant-design-vue/es')['Checkbox'] + ACheckboxGroup: typeof import('ant-design-vue/es')['CheckboxGroup'] + ACol: typeof import('ant-design-vue/es')['Col'] + ACollapse: typeof import('ant-design-vue/es')['Collapse'] + ACollapsePanel: typeof import('ant-design-vue/es')['CollapsePanel'] + AConfigProvider: typeof import('ant-design-vue/es')['ConfigProvider'] + ADescriptions: typeof import('ant-design-vue/es')['Descriptions'] + ADescriptionsItem: typeof import('ant-design-vue/es')['DescriptionsItem'] + ADivider: typeof import('ant-design-vue/es')['Divider'] + ADrawer: typeof import('ant-design-vue/es')['Drawer'] + ADropdown: typeof import('ant-design-vue/es')['Dropdown'] + AEmpty: typeof import('ant-design-vue/es')['Empty'] + AForm: typeof import('ant-design-vue/es')['Form'] + AFormItem: typeof import('ant-design-vue/es')['FormItem'] + AImage: typeof import('ant-design-vue/es')['Image'] AInput: typeof import('ant-design-vue/es')['Input'] + AInputNumber: typeof import('ant-design-vue/es')['InputNumber'] ALayout: typeof import('ant-design-vue/es')['Layout'] ALayoutContent: typeof import('ant-design-vue/es')['LayoutContent'] + ALayoutHeader: typeof import('ant-design-vue/es')['LayoutHeader'] + ALayoutSider: typeof import('ant-design-vue/es')['LayoutSider'] + AMenu: typeof import('ant-design-vue/es')['Menu'] + AMenuItem: typeof import('ant-design-vue/es')['MenuItem'] + AModal: typeof import('ant-design-vue/es')['Modal'] + APagination: typeof import('ant-design-vue/es')['Pagination'] + APopover: typeof import('ant-design-vue/es')['Popover'] + ARadio: typeof import('ant-design-vue/es')['Radio'] + ARadioGroup: typeof import('ant-design-vue/es')['RadioGroup'] + ARow: typeof import('ant-design-vue/es')['Row'] + ASelect: typeof import('ant-design-vue/es')['Select'] + ASelectOption: typeof import('ant-design-vue/es')['SelectOption'] + ASlider: typeof import('ant-design-vue/es')['Slider'] + ASpace: typeof 
import('ant-design-vue/es')['Space'] + ASteps: typeof import('ant-design-vue/es')['Steps'] + ATable: typeof import('ant-design-vue/es')['Table'] + ATag: typeof import('ant-design-vue/es')['Tag'] + ATextarea: typeof import('ant-design-vue/es')['Textarea'] + ATooltip: typeof import('ant-design-vue/es')['Tooltip'] + AUploadDragger: typeof import('ant-design-vue/es')['UploadDragger'] + FormTooltip: typeof import('./components/FormTooltip.vue')['default'] RouterLink: typeof import('vue-router')['RouterLink'] RouterView: typeof import('vue-router')['RouterView'] + SvgIcon: typeof import('./components/SvgIcon.vue')['default'] + TableColumns: typeof import('./components/TableColumns.vue')['default'] } } diff --git a/EdgeCraftRAG/ui/vue/src/components/PartialLoading.vue b/EdgeCraftRAG/ui/vue/src/components/PartialLoading.vue new file mode 100644 index 0000000000..b744f43e11 --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/components/PartialLoading.vue @@ -0,0 +1,70 @@ + + + + + diff --git a/EdgeCraftRAG/ui/vue/src/i18n/en.ts b/EdgeCraftRAG/ui/vue/src/i18n/en.ts index 39d3cf0fa8..9f267a1cf0 100644 --- a/EdgeCraftRAG/ui/vue/src/i18n/en.ts +++ b/EdgeCraftRAG/ui/vue/src/i18n/en.ts @@ -26,7 +26,21 @@ export default { clear: "Clear", all: "All", reset: "Reset", + export: "Export", uploadTip: "Click or drag file to this area to upload", + loading: "Loading", + waitTip: "Please wait patiently and do not refresh the page during this period.", + copy: "Copy", + send: "Send", + regenerate: "Regenerate", + copySucc: "Copy successful !", + copyError: "Copy failed !", + emptyText: "The content is empty !", + yes: "Yes", + no: "No", + manual: "Create Now", + inputTip: "Please enter ", + connect: "Connect", }, system: { title: "System Status", @@ -38,7 +52,7 @@ export default { notUsed: "Not Used", info: "System Information", kernel: "Kernel", - processor: "KerProcessornel", + processor: "Processor", os: "OS", time: "Current time", }, @@ -85,10 +99,12 @@ export default { indexer: "Indexer", indexerType: "Indexer Type", embedding: "Embedding Model", + embeddingUrl: "Embedding URL", embeddingDevice: "Embedding run device", retriever: "Retriever", retrieverType: "Retriever Type", topk: "Search top k", + topn: "Rerank top n", postProcessor: "PostProcessor", postProcessorType: "PostProcessor Type", rerank: "Rerank Model", @@ -99,15 +115,17 @@ export default { language: "Large Language Model", llmDevice: "LLM run device", weights: "Weights", - local: "Local", - vllm: "Vllm", - vector_uri: "Vector Uri", + local: "Local (OpenVINO)", + vllm: "Remote (vLLM)", + vector_url: "Vector Database URL", modelName: "Model Name", - vllm_url: "Vllm Url", + vllm_url: "vLLM URL", + kbadmin: "kbadmin", }, valid: { nameValid1: "Please input name", nameValid2: "Name should be between 2 and 30 characters", + nameValid3: "The name only supports letters, numbers, and underscores.", nodeParserType: "Please select Node Parser Type", chunkSizeValid1: "Please select Chunk Size", chunkSizeValid2: "The value of Chunk Size cannot be less than Chunk Overlap", @@ -115,25 +133,43 @@ export default { chunkOverlapValid2: "The value of Chunk Overlap cannot be greater than Chunk Size", windowSize: "Please select Chunk Window Size", indexerType: "Please select Indexer Type", - embedding: "Please select Embedding Model", + embedding: "Please select embedding Model", + embeddingUrl: "IP : Port, (e.g. 
192.168.1.1:13020)", embeddingDevice: "Please select Embedding run device", retrieverType: "Please select Retriever Type", + retrieverTypeFormat: "Retriever type can only select kbadmin", topk: "Please select Top k", + topn: "Please select Top n", postProcessorType: "Please select PostProcessor Type", rerank: "Please select Rerank Model", rerankDevice: "Please select Rerank run device", generatorType: "Please select Generator Type", - language: "Please select Large Language Model", + language: "Please select or enter Large Language Model", llmDevice: "Please select LLM run device", weights: "Please select Weights", - vector_uri: "IP : Port, (e.g. 192.168.1.1:19530)", + kb_vector_url: "IP : Port, (e.g. 192.168.1.1:29530)", + vector_url: "IP : Port, (e.g. 192.168.1.1:19530)", vllm_url: "IP : Port, (e.g. 192.168.1.1:8086)", - urlValid1: "Please enter url", + urlValid1: "Please enter vector url", urlValid2: "Please enter the correct url", urlValid3: "URL cannot be accessed", urlValid4: "Test passed !", urlValid5: "The URL has not passed verification yet", modelName: "Please enter model name", + vllmUrlValid1: "Please enter vLLM url", + vllmUrlValid2: "Please enter the correct url", + vllmUrlValid3: "URL cannot be accessed", + vllmUrlValid4: "Test passed !", + vllmUrlValid5: "The URL has not passed verification yet", + nodeParserTypeTip: "Both Indexer Type and Retriever Type will be set to kbadmin at the same time", + indexerTypeTip: "Both Node Parser Type and Retriever Type will be set to kbadmin at the same time", + retrieverTypeTip: "Both Node Parser Type and Indexer Type will be set to kbadmin at the same time", + retrieverChangeTip: "Please go to the Indexer stage to complete the data", + indexerTypeValid1: "Indexer type can only select kbadmin", + modelRequired: "Please enter embedding model url", + modelFormat: "Please enter the correct url", + retrieverValid: "Please return to the Indexer stage to supplement information.", + modelTip: "Please connect to vLLM service", }, desc: { name: "The name identifier of the pipeline", @@ -143,14 +179,15 @@ export default { windowSize: "The number of sentences on each side of a sentence to capture", indexerType: "The type of index structure responsible for building based on the parsed nodes", embedding: "Embed the text data to represent it and build a vector index", - embeddingDevice: "The device used by the Embedding Model", + embeddingUrl: "Connecting embedding model url", + embeddingDevice: "The device used by the embedding model", retrieverType: - "The retrieval type used when retrieving relevant nodes from the index according to the user's query", + "The retrieval type used when retrieving relevant nodes from the index according to the user's experience", topk: "The number of top k results to return", postProcessorType: "Select postprocessors for post-processing of the context", rerank: "Rerank Model", rerankDevice: "Rerank run device", - generatorType: "Local inference generator or vllm generator", + generatorType: "Local inference generator or vLLM generator", language: "The large model used for generating dialogues", llmDevice: "The device used by the LLM", weights: "Model weight", @@ -167,15 +204,17 @@ export default { "Sentence window node parser. Splits a document into Nodes, with each node being a sentence. 
Each node contains a window from the surrounding sentences in the metadata.", unstructured: "UnstructedNodeParser is a component that processes unstructured data.", milvusVector: "Embedding vectors stored in milvus", - vector_uri: "Connecting milvus uri", + vector_url: "Connecting milvus vector url", test: "Test", - modelName: "Vllm model name", - vllm_url: " Test if Vllm url is available ", + modelName: "vLLM model name", + vllm_url: " Test if vLLM url is available ", + kbadmin: "Third party knowledge base engine", }, }, generation: { title: "Generation Configuration", retriever: "Retriever Configuration", + tips: "Setting the parameter to 0 will inherit the default value from the currently active Pipeline.", config: { top_n: "Rerank top n", temperature: "Temperature", @@ -203,12 +242,14 @@ export default { tip4: "Please enter your question...", new: "New Chat", rag: "EC RAG", - setting: "Pipeline Setting", + setting: "Settings", clear: "Clear Message", think: "Think", reason: "Think", thinkStart: "Thinking...", thinkEnd: "Thoughts", + history: "Chat History", + notExist: "Session not found.", }, knowledge: { title: "Knowledge Base", @@ -218,18 +259,36 @@ export default { edit: "Edit Knowledge Base", deleteTip: "Are you sure delete this knowledge base?", activeTip: "Are you sure activate this knowledge base?", - uploadTip: "Supports PDF, Word, TXT,Doc,Html,PPT formats, with a single file size not exceeding 200M", + uploadTip: "Supports PDF, Word, TXT,Doc,Html,PPT,ZIP formats, with a single file size not exceeding 200M", notFileTip: "The knowledge base is empty. Go upload your files.", name: "Name", des: "Description", activated: "Activated", nameValid1: "Please input knowledge base name", nameValid2: "Name should be between 2 and 30 characters", - nameValid3: "The name cannot start with a number", + nameValid3: "Alphanumeric and underscore only, starting with a letter or underscore.", desValid: "Please input knowledge base description", activeValid: "Please select whether to activate", - uploadValid: "Single file size not exceeding 50M.", + uploadValid: "Single file size not exceeding 200M.", + zipNoFiles: "The ZIP file is empty.", deleteFileTip: "Are you sure delete this file?", + selectTitle: "Create Type Select", + selectDes: "Please select the type you want to create", + experience: "Experience", + experienceDes: + "Experience refers to the knowledge and skills acquired through practical involvement, trial, and reflection, serving as a key foundation for solving real-world problems.", + kbDes: + "A Knowledge Base is a centralized repository for storing organized information such as documents, FAQs, and guides, enabling teams or users to quickly access and share knowledge.", + type: "Type", + original: "Original", + kbadmin: "kbadmin", + typeValid: "Please select knowledge base type", + nameRequired: "Please select kbadmin name", + waitTip: "Please be patient and wait for the file upload to complete.", + done: "Finished", + successfully: "Successfully ", + failed: "Failed", + totalTip: "files", }, request: { pipeline: { @@ -237,6 +296,7 @@ export default { updateSucc: "Pipeline update successfully !", deleteSucc: "Pipeline deleted successfully !", switchSucc: "Pipeline state switch successful !", + connectSucc: "vLLM service connection successful!", }, chatbot: { updateSucc: "Configuration update successful !", @@ -248,9 +308,97 @@ export default { updateSucc: "Knowledge Base update successfully !", deleteSucc: "Knowledge Base deleted successfully !", }, + experience: { + createSucc: 
"Experience created successfully!", + updateSucc: "Experience update successful!", + deleteSucc: "Experience deleted successfully!", + }, + agent: { + createSucc: "Agent created successfully!", + updateSucc: "Agent update successful!", + deleteSucc: "Agent deleted successfully!", + }, }, error: { notFoundTip: "Uh oh! It seems like you're lost", back: "Go Home", }, + experience: { + create: "Create Experience", + edit: "Edit Experience", + import: "Import Experience", + fileFormatTip: "Supports JSON format, with file size not exceeding 100M.", + importSuccTip: "Files upload successful!", + importErrTip: "Files upload failed!", + uploadValid: "Single file size not exceeding 100M.", + experience: "Experience", + detail: "Detail", + operation: "Operation", + deleteTip: "Are you sure delete this experience?", + addExperience: "Add Experience", + delExperience: "Delete Experience", + addContent: "Add Content", + delContent: "Delete Content", + total: "Total experience: ", + unique: "Unique", + selectTip: "Please choose an appropriate method for data update", + cover: "Cover", + increase: "Append", + deactivateTip: "Are you sure deactivate this experience?", + activeTip: "Are you sure activate this experience?", + label: { + experience: "Experience", + contents: "Experience Content", + content: "Content", + }, + placeholder: { + experience: "Please enter Experience", + content: "Please enter content", + }, + valid: { + experience: "Experience cannot be empty", + content: "Content cannot be empty", + }, + }, + agent: { + agent: "Agent", + create: "Create Agent", + edit: "Edit Agent", + detail: "Agent Details", + import: "Import Agent", + activated: "Activated", + inactive: "Inactive", + isActive: "Activated", + importSuccTip: "Files upload successful!", + importErrTip: "Files upload failed!", + name: "Name", + id: "ID", + status: "Status", + operation: "Operation", + configs: "Configs", + deactivateTip: "Are you sure deactivate this agent?", + activeTip: "Are you sure activate this agent?", + deleteTip: "Are you sure you want to delete this conversation record ?", + addConfigs: "Add Configs", + delConfigs: "Delete Config", + noData: "No settings configured", + think: "Agent Thinking", + pipeline: "Pipeline ID", + label: { + name: "Agent Name", + type: "Agent Type ", + pipeline: "Pipeline Name", + configs: "Agent Configs", + key: "Config Key", + value: "Config Value", + }, + valid: { + name: "Please enter name", + type: "Please select agent type", + pipeline: "Please select pipeline name", + configs: "Please enter agent configs", + key: "Please enter config key", + value: "Please enter config value", + }, + }, }; diff --git a/EdgeCraftRAG/ui/vue/src/i18n/zh.ts b/EdgeCraftRAG/ui/vue/src/i18n/zh.ts index 2a1a318851..f374633a1a 100644 --- a/EdgeCraftRAG/ui/vue/src/i18n/zh.ts +++ b/EdgeCraftRAG/ui/vue/src/i18n/zh.ts @@ -26,7 +26,21 @@ export default { clear: "清除", all: "全选", reset: "重置", + export: "导出", uploadTip: "点击或将文件拖到此区域进行上传", + loading: "加载中", + waitTip: "请耐心等待,在此期间不要刷新页面。", + copy: "复制", + send: "发送", + regenerate: "重新生成", + copySucc: "复制成功!", + copyError: "复制失败!", + emptyText: "内容为空!", + yes: "是", + no: "否", + manual: "去创建", + inputTip: "请输入 ", + connect: "连接", }, system: { title: "系统状态", @@ -84,10 +98,12 @@ export default { indexer: "索引器", indexerType: "索引器类型", embedding: "嵌入模型", + embeddingUrl: "嵌入模型地址", embeddingDevice: "模型运行设备", retriever: "检索器", retrieverType: "检索器类型", topk: "检索 top k", + topn: "Top n", postProcessor: "节点后处理器", postProcessorType: "节点后处理器类型", rerank: "重排模型", @@ -98,15 
+114,17 @@ export default { language: "语言大模型", llmDevice: "运行设备", weights: "权重", - local: "本地", - vllm: "Vllm", - vector_uri: "Vector Uri", + local: "本地(OpenVINO)", + vllm: "远程(vLLM)", + vector_url: "向量数据库地址", modelName: "模型名称", - vllm_url: "Vllm 地址", + vllm_url: "vLLM 地址", + kbadmin: "kbadmin", }, valid: { nameValid1: "请输入名称", nameValid2: "请输入 2 到 30 个字符的名称", + nameValid3: "名称仅支持字母、数字和下划线", nodeParserType: "请选择节点解析器类型", chunkSizeValid1: "请选择分块大小", chunkSizeValid2: "分块大小的值不能小于分块重叠值", @@ -115,24 +133,42 @@ export default { windowSize: "请选择句子上下文窗口大小", indexerType: "请选择索引器类型", embedding: "请选择嵌入模型", + embeddingUrl: "IP : 端口,(例如 192.168.1.1:13020)", embeddingDevice: "请选择嵌入模型运行设备", retrieverType: "请选择检索器类型", + retrieverTypeFormat: "检索器类型只能选择kbadmin", topk: "请选择Top k", + topn: "请选择Top n", postProcessorType: "请选择后处理器类型", rerank: "请选择重排模型", rerankDevice: "请选择重排模型运行设备", generatorType: "请选择生成器类型", - language: "请选择大语言模型", + language: "请选择或输入大语言模型", llmDevice: "请选择大语言模型运行设备", weights: "请选择模型权重", - vector_uri: "IP : 端口,(例如 192.168.1.1:19530)", + kb_vector_url: "IP : 端口,(例如 192.168.1.1:29530)", + vector_url: "IP : 端口,(例如 192.168.1.1:19530)", vllm_url: "IP : 端口,(例如 192.168.1.1:8086)", - urlValid1: "URL 不能为空", - urlValid2: "请输入正确的URL", - urlValid3: "URL无法访问", + urlValid1: "向量数据库地址不能为空", + urlValid2: "请输入正确的向量数据库地址", + urlValid3: "向量数据库地址无法访问", urlValid4: "测试通过!", - urlValid5: "URL还未通过校验", + urlValid5: "向量数据库地址还未通过校验", modelName: "请输入模型名称", + vllmUrlValid1: "vLLM地址不能为空", + vllmUrlValid2: "请输入正确的vLLM地址", + vllmUrlValid3: "vLLM地址无法访问", + vllmUrlValid4: "测试通过!", + vllmUrlValid5: "vLLM地址还未通过校验", + nodeParserTypeTip: "索引器类型和检索器类型将同时设置为kbadmin", + indexerTypeTip: "节点解析器类型和检索器类型将同时设置为kbadmin", + retrieverTypeTip: "索引器类型和节点解析器类型将同时设置为kbadmin", + retrieverChangeTip: "请前往索引器阶段补全数据", + indexerTypeValid1: "索引器类型只能选择kbadmin", + modelRequired: "请输入嵌入模型地址", + modelFormat: "请输入正确的模型地址", + retrieverValid: "请回到Indexer阶段补充信息", + modelTip: "请先连接vLLM服务", }, desc: { name: "Pipeline的名称标识,用于区分不同工作流", @@ -142,13 +178,14 @@ export default { windowSize: "每个节点捕获的上下文句子窗口大小,用于增强语义完整性", indexerType: "基于解析节点构建的索引结构类型", embedding: "将文本转换为向量表示的过程", + embeddingUrl: "嵌入模型地址", embeddingDevice: "执行嵌入模型推理的硬件设备(CPU/GPU)", retrieverType: "根据用户查询从索引中检索节点的算法类型", topk: "检索时返回的最相关结果数量", postProcessorType: "对检索结果进行后处理的组件类型", rerank: "对检索结果进行二次排序的模型,提升答案相关性", rerankDevice: "执行重排模型推理的硬件设备(CPU/GPU)", - generatorType: "回答生成方式的类型(本地部署模型或 vllm 高效推理框架)", + generatorType: "回答生成方式的类型(本地部署模型或 vLLM 高效推理框架)", language: "用于生成自然语言回答的大模型(如 LLaMA、ChatGLM)", llmDevice: "大语言模型推理的硬件设备(需匹配模型规模要求)", weights: "大模型的权重", @@ -157,22 +194,24 @@ export default { vectorsimilarity: "根据向量相似性进行检索", autoMerge: "该检索器会尝试将上下文合并到父级上下文中", bm25: "使用BM25算法检索节点的BM25检索器", - faissVector: "嵌入存储在Faiss索引中。", + faissVector: "矢量索引存储在Faiss中。", vector: "矢量存储索引", simple: "解析文本,优先选择完整的句子。", - hierarchical: "使用借点解析将文档分割成递归层次节点", + hierarchical: "使用NodeParser将文档拆分为递归层次结构的节点。", sentencewindow: "将文档分割成节点,每个节点代表一个句子。每个节点包含一个来自元数据中周围句子的窗口", unstructured: "一个处理非结构化数据的组件", - milvusVector: "嵌入存储在Milvus索引中", - vector_uri: "测试Milvus地址是否可用", + milvusVector: "矢量索引存储在Milvus中", + vector_url: "测试Milvus地址是否可用", test: "测 试", - modelName: "Vllm 模型名称", - vllm_url: "测试Vllm地址是否可用", + modelName: "vLLM 模型名称", + vllm_url: "测试vLLM地址是否可用", + kbadmin: "第三方知识库系统", }, }, generation: { title: "生成器配置", retriever: "检索器配置", + tips: "参数为 0 时,将继承当前激活 Pipeline 的默认值。", config: { top_n: "Rerank top n", temperature: "Temperature", @@ -199,12 +238,14 @@ export default { tip4: "有什么问题?请在这里输入...", new: "开启新对话", rag: "EC RAG", - setting: 
"Pipeline 配置", + setting: "配置", clear: "清除消息", think: "思考", reason: "思考", thinkStart: "思考中...", thinkEnd: "思考过程", + history: "历史会话", + notExist: "会话不存在!", }, knowledge: { title: "知识库", @@ -214,18 +255,36 @@ export default { edit: "编辑知识库", deleteTip: "您确定要删除此知识库吗?此操作不可恢复。", activeTip: "您确定要激活此知识库吗?", - uploadTip: "支持 PDF、Word、TXT、Doc、HTML、PPT 格式,单个文件大小不超过 200M。", + uploadTip: "支持 PDF、Word、TXT、Doc、HTML、PPT、ZIP 格式,单个文件大小不超过 200M。", notFileTip: "您还没有上传任何文件,点击“上传”按钮开始添加内容吧~", name: "名称", des: "描述", activated: "激活状态", nameValid1: "请输入知识库名称", nameValid2: "请输入 2 到 30 个字符的名称", - nameValid3: "名称不能以数字开头", + nameValid3: "仅支持字母、数字和下划线,必须以字母或下划线开头。", desValid: "请输入知识库描述", activeValid: "请选择是否启用该功能。", - uploadValid: "单个文件大小不得超过 50MB", + uploadValid: "单个文件大小不得超过 200MB", + zipNoFiles: "上传的 ZIP 压缩包为空", deleteFileTip: "您确定要删除此文档吗?此操作不可恢复。", + selectTitle: "创建类型选择", + selectDes: "请选择要创建的数据类型", + experience: "经验注入", + experienceDes: + "Experience是指个人或团队在实践过程中积累的知识和技能,通常通过实际操作、试错和反思获得,是解决实际问题的重要依据", + kbDes: + "知识库是系统化存储信息的集合,用于集中管理文档、常见问题、操作指南等知识内容,便于团队或用户快速查找和共享信息。", + type: "类型", + original: "原始的", + kbadmin: "kbadmin", + typeValid: "请选择知识库类型", + nameRequired: "请选择kbadmin名称", + waitTip: "请耐心等待所有文件上传完成!", + done: "已完成", + successfully: "成功", + failed: "失败", + totalTip: "个文件", }, request: { pipeline: { @@ -233,6 +292,7 @@ export default { updateSucc: "Pipeline 更新成功!", deleteSucc: "Pipeline 删除成功!", switchSucc: "Pipeline 状态切换成功!", + connectSucc: "vLLM 服务连接成功!", }, chatbot: { updateSucc: "配置更新成功!", @@ -242,11 +302,100 @@ export default { deleteFileSucc: "文档删除成功!", createSucc: "知识库创建成功!", updateSucc: "知识库更新成功!", - deleteSucc: " 知识库删除成功!", + deleteSucc: "知识库删除成功!", + }, + experience: { + createSucc: "经验创建成功!", + updateSucc: "经验更新成功!", + deleteSucc: "经验删除成功!", + }, + agent: { + createSucc: "智能体创建成功!", + updateSucc: "智能体更新成功!", + deleteSucc: "智能体删除成功!", }, }, error: { notFoundTip: "Oops 好像走错地方啦~", back: "首页", }, + experience: { + create: "新建经验", + edit: "编辑经验", + import: "导入经验", + fileFormatTip: "仅支持JSON格式,文件大小不超过100M", + importSuccTip: "文件上传成功!", + importErrTip: "文件上传失败!", + uploadValid: "单个文件大小不得超过 200MB", + experience: "经验", + detail: "详情", + operation: "操作", + deleteTip: "确定要删除这个经验?此操作不可恢复。", + addExperience: "新增经验", + delExperience: "删除经验", + addContent: "新增内容", + delContent: "删除内容", + total: "经验总数: ", + unique: "唯一", + selectTip: "请选择合适的方式进行数据更新", + cover: "覆盖", + increase: "追加", + deactivateTip: "您确定要停用该经验库吗?", + activeTip: "您确定要启用该经验库吗?", + label: { + experience: "经验", + contents: "经验内容", + content: "内容", + }, + placeholder: { + experience: "请输入经验", + content: "请输入内容", + }, + valid: { + experience: "经验不能为空", + content: "内容不能为空", + }, + }, + agent: { + agent: "智能体", + create: "创建智能体", + edit: "编辑智能体", + detail: "智能体详情", + import: "导入智能体", + isActive: "状态", + activated: "已启用", + inactive: "已停用", + pipelineFormatTip: "仅支持JSON格式,文件大小不超过10M", + importSuccTip: "智能体配置导入成功!", + importErrTip: "智能体配置导入失败!", + name: "名称", + id: "ID", + status: "状态", + operation: "操作", + configs: "配置", + deactivateTip: "您确定要停用该智能体吗?", + activeTip: "您确定要启用该智能体吗?", + deleteTip: "确认删除这条对话记录吗?此操作不可恢复。", + addConfigs: "新增配置", + delConfigs: "删除配置", + noData: "暂无配置", + think: "智能体思考", + pipeline: "Pipeline ID", + label: { + name: "智能体名称", + type: "智能体类型 ", + pipeline: "Pipeline 名称", + configs: "智能体配置", + key: "配置名称", + value: "配置内容", + }, + valid: { + name: "请输入名称", + type: "请选择智能体类型", + pipeline: "请选择Pipeline名称", + configs: "请录入智能体配置", + key: "请输入配置名称", + value: "请输入配置内容", + }, + }, }; diff --git a/EdgeCraftRAG/ui/vue/src/layout/Header.vue 
b/EdgeCraftRAG/ui/vue/src/layout/Header.vue index 33d0038d62..0de80ece3d 100644 --- a/EdgeCraftRAG/ui/vue/src/layout/Header.vue +++ b/EdgeCraftRAG/ui/vue/src/layout/Header.vue @@ -2,7 +2,7 @@
[Header.vue template hunk: element markup lost in extraction; only the changed-line markers remain]
+ diff --git a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/ChatHistory.vue b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/ChatHistory.vue new file mode 100644 index 0000000000..9816964249 --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/ChatHistory.vue @@ -0,0 +1,436 @@ + + + + + diff --git a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/ConfigDrawer.vue b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/ConfigDrawer.vue index 16258dd73e..8e1aaa2ba6 100644 --- a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/ConfigDrawer.vue +++ b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/ConfigDrawer.vue @@ -18,7 +18,13 @@ class="form-wrap" >
[ConfigDrawer.vue template hunk, element markup lost in extraction: the {{ $t("generation.retriever") }} heading is re-wrapped, a {{ $t("generation.tips") }} note is added, the existing {{ $t("generation.desc.top_n") }} description is kept, and a new control described by {{ $t("pipeline.desc.topk") }} is added ahead of the {{ $t("generation.title") }} section.]
@@ -128,7 +149,10 @@ diff --git a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/SseService.ts b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/SseService.ts index 1f57ce25b1..4c7b47138f 100644 --- a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/SseService.ts +++ b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/SseService.ts @@ -1,49 +1,97 @@ // Copyright (C) 2025 Intel Corporation // SPDX-License-Identifier: Apache-2.0 + import { getChatSessionId } from "@/utils/common"; +import { message } from "ant-design-vue"; + +export interface StreamController { + cancel: () => void; +} -export const handleMessageSend = async ( +export const handleMessageSend = ( url: string, postData: any, - onDisplay: (data: any) => void, + onDisplay: (data: string) => void, onEnd?: () => void, -): Promise => { - try { - const response = await fetch(url, { - method: "POST", - headers: { - "Content-Type": "application/json", - Accept: "text/event-stream", - sessionid: getChatSessionId(), - }, - body: JSON.stringify(postData), - }); - - if (!response.ok) { - throw new Error(`Network response was not ok: ${response.statusText}`); - } - - const reader = response.body?.getReader(); - const decoder = new TextDecoder("utf-8"); - let buffer = ""; +): StreamController => { + let reader: ReadableStreamDefaultReader | undefined; + const controller = new AbortController(); + const execute = async () => { try { + const response = await fetch(url, { + method: "POST", + headers: { + "Content-Type": "application/json", + Accept: "text/event-stream", + sessionid: getChatSessionId(), + }, + body: JSON.stringify(postData), + signal: controller.signal, + }); + + if (!response.ok) { + let errorMessage = ""; + try { + const errorText = await response.text(); + if (errorText) { + errorMessage = errorText; + } + } catch (parseError) { + console.warn("Failed to read error response:", parseError); + } + message.error(errorMessage || "Request failed"); + onEnd?.(); + return; + } + + reader = response.body?.getReader(); + if (!reader) { + throw new Error("Readable stream is not available"); + } + + const decoder = new TextDecoder("utf-8"); + let buffer = ""; + while (true) { const { done, value } = await reader.read(); + if (done) { onEnd?.(); break; } - buffer += decoder.decode(value, { stream: true }); + buffer += decoder.decode(value, { stream: true }); onDisplay(buffer); } - } catch (error) { - console.error(error); + } catch (error: any) { + if (error.name === "AbortError") { + console.log("Stream was aborted by user."); + } else { + console.error("Request or stream error:", error); + if (error.message !== "Request failed") { + message.error(error.message || "Stream error"); + } + } onEnd?.(); + } finally { + if (reader) { + try { + await reader.cancel(); + } catch (cancelError) { + console.warn("Failed to cancel reader:", cancelError); + } + } } - } catch (error) { - console.error(error); - onEnd?.(); - } + }; + + execute().catch(console.error); + + return { + cancel: () => { + if (!controller.signal.aborted) { + controller.abort(); + } + }, + }; }; diff --git a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/index.vue b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/index.vue index 4d46a60654..4e03e048ae 100644 --- a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/index.vue +++ b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/Chatbot/index.vue @@ -22,7 +22,8 @@ import { Local } from "@/utils/storage"; const chatbotStore = chatbotAppStore(); let chatbotConfiguration 
= reactive({ - top_n: 25, + top_n: 0, + k: 0, temperature: 0.01, top_p: 0.95, top_k: 10, diff --git a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/DetailComponent.vue b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/DetailComponent.vue new file mode 100644 index 0000000000..5ba1d94094 --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/DetailComponent.vue @@ -0,0 +1,93 @@ + + + + + diff --git a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/Experience/ExperienceDetail.vue b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/Experience/ExperienceDetail.vue new file mode 100644 index 0000000000..c81057bb8e --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/Experience/ExperienceDetail.vue @@ -0,0 +1,225 @@ + + + + + diff --git a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/Experience/ImportDialog.vue b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/Experience/ImportDialog.vue new file mode 100644 index 0000000000..b558bac195 --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/Experience/ImportDialog.vue @@ -0,0 +1,100 @@ + + + + + diff --git a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/Experience/UpdateDialog.vue b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/Experience/UpdateDialog.vue new file mode 100644 index 0000000000..a379762400 --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/Experience/UpdateDialog.vue @@ -0,0 +1,399 @@ + + + + + diff --git a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/Experience/index.ts b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/Experience/index.ts new file mode 100644 index 0000000000..c9d1df62ed --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/Experience/index.ts @@ -0,0 +1,7 @@ +// Copyright (C) 2025 Intel Corporation +// SPDX-License-Identifier: Apache-2.0 + +import UpdateDialog from "./UpdateDialog.vue"; +import ImportDialog from "./ImportDialog.vue"; + +export { UpdateDialog, ImportDialog }; diff --git a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/KnowledgeDetail.vue b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/KnowledgeDetail.vue new file mode 100644 index 0000000000..956b2dbe2b --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/KnowledgeDetail.vue @@ -0,0 +1,398 @@ + + + + + diff --git a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/KnowledgeDetial.vue b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/KnowledgeDetial.vue deleted file mode 100644 index 290a85cd8e..0000000000 --- a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/KnowledgeDetial.vue +++ /dev/null @@ -1,302 +0,0 @@ - - - - - diff --git a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/SelectTypeDialog.vue b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/SelectTypeDialog.vue new file mode 100644 index 0000000000..8b9ab7978e --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/SelectTypeDialog.vue @@ -0,0 +1,134 @@ + + + + + diff --git a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/UpdateDialog.vue b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/UpdateDialog.vue index f987ff5cb4..e95e7436f6 100644 --- 
a/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/UpdateDialog.vue +++ b/EdgeCraftRAG/ui/vue/src/views/chatbot/components/KnowledgeBase/UpdateDialog.vue @@ -17,14 +17,45 @@ autocomplete="off" :label-col="{ style: { width: '100px' } }" > - + + + {{ $t("knowledge.original") }} + {{ $t("knowledge.kbadmin") }} + + + + + + {{ + item + }} + + - + {{ $t("pipeline.activated") }} {{ $t("pipeline.inactive") }} @@ -59,10 +90,11 @@ import { requestKnowledgeBaseCreate, requestKnowledgeBaseUpdate, + getkbadminList, } from "@/api/knowledgeBase"; import { isValidName } from "@/utils/validate"; import { FormInstance } from "ant-design-vue"; -import { computed, ref } from "vue"; +import { computed, ref, onMounted } from "vue"; import { useI18n } from "vue-i18n"; const props = defineProps({ @@ -74,11 +106,17 @@ const props = defineProps({ type: String, default: "create", }, + dialogFlag: { + type: String, + default: "knowledge", + }, }); interface FormType { - name: string; + name: string | undefined; description: string; + comp_type: string; active: boolean; + comp_subtype: string; } const validateName = async (rule: any, value: string) => { @@ -89,7 +127,6 @@ const validateName = async (rule: any, value: string) => { if (len < 2 || len > 30) { return Promise.reject(t("knowledge.nameValid2")); } - console.log(isValidName(value)); if (!isValidName(value)) { return Promise.reject(t("knowledge.nameValid3")); } @@ -98,9 +135,11 @@ const validateName = async (rule: any, value: string) => { const { t } = useI18n(); const emit = defineEmits(["close", "switch"]); +const { dialogFlag } = props; + const typeMap = { - create: t("knowledge.create"), - edit: t("knowledge.edit"), + create: t(`${dialogFlag}.create`), + edit: t(`${dialogFlag}.edit`), } as const; const dialogTitle = computed(() => { return typeMap[props.dialogType as keyof typeof typeMap]; @@ -108,20 +147,39 @@ const dialogTitle = computed(() => { const isEdit = computed(() => { return props.dialogType === "edit"; }); -const isActivated = computed(() => { - return props.dialogData?.active; +const isExperience = computed(() => { + return props.dialogFlag === "experience"; +}); + +const isOriginal = computed(() => { + return form.comp_subtype === "origin_kb"; }); const modelVisible = ref(true); const submitLoading = ref(false); const formRef = ref(); -const { name = "", description = "", active = false } = props.dialogData; +const { + comp_subtype = "origin_kb", + name = undefined, + description = "", + active = false, + experience_active = false, +} = props.dialogData; const form = reactive({ - name, + comp_subtype, + name: isExperience.value ? "Experience" : name, description, - active, + comp_type: dialogFlag, + active: isExperience.value ? 
experience_active : active, }); - -const rules = reactive({ +const kbList = ref([]); +const rules: FormRules = reactive({ + comp_subtype: [ + { + required: true, + message: t("knowledge.typeValid"), + trigger: "change", + }, + ], name: [ { required: true, @@ -129,6 +187,13 @@ const rules = reactive({ trigger: ["blur", "change"], }, ], + kbName: [ + { + required: true, + message: t("knowledge.nameRequired"), + trigger: "change", + }, + ], active: [ { required: true, @@ -137,17 +202,36 @@ const rules = reactive({ }, ], }); +const handleTypeChange = () => { + form.name = undefined; +}; +const queryKbadmin = async () => { + const data: any = await getkbadminList(); + kbList.value = [].concat(data); +}; +// Format parameter +const formatFormParam = () => { + const { name, description, comp_type, active, comp_subtype } = form; + return { + name, + description, + comp_type, + comp_subtype: !isExperience.value ? comp_subtype : undefined, + active: !isExperience.value ? active : undefined, + experience_active: isExperience.value ? active : undefined, + }; +}; // Submit const handleSubmit = () => { formRef.value?.validate().then(() => { submitLoading.value = true; const { name } = form; - const apiUrl = - props.dialogType === "edit" - ? requestKnowledgeBaseUpdate - : requestKnowledgeBaseCreate; - apiUrl(form) + const apiUrl = isEdit.value + ? requestKnowledgeBaseUpdate + : requestKnowledgeBaseCreate; + + apiUrl(formatFormParam()) .then(() => { emit("switch", name); handleCancel(); @@ -165,6 +249,9 @@ const handleSubmit = () => { const handleCancel = () => { emit("close"); }; +onMounted(() => { + queryKbadmin(); +}); diff --git a/EdgeCraftRAG/ui/vue/src/views/chatbot/type.ts b/EdgeCraftRAG/ui/vue/src/views/chatbot/type.ts index b426be5df8..044af6ad9f 100644 --- a/EdgeCraftRAG/ui/vue/src/views/chatbot/type.ts +++ b/EdgeCraftRAG/ui/vue/src/views/chatbot/type.ts @@ -9,13 +9,17 @@ export interface Benchmark { export interface IMessage { role: string; content: string; + query?: string; + errorMessage?: string; benchmark?: Benchmark | undefined; } export interface ThinkType { enable_thinking?: boolean; + enable_rag_retrieval?: boolean; } export interface ConfigType { top_n: number; + k: number; temperature: number; top_p: number; top_k: number; diff --git a/EdgeCraftRAG/ui/vue/src/views/error/404.vue b/EdgeCraftRAG/ui/vue/src/views/error/404.vue index 4683c892f2..ce18c7340a 100644 --- a/EdgeCraftRAG/ui/vue/src/views/error/404.vue +++ b/EdgeCraftRAG/ui/vue/src/views/error/404.vue @@ -2,12 +2,11 @@

{{ $t("error.notFoundTip") }}

- {{ $t("error.back") }} + + + {{ $t("error.back") }}
@@ -16,8 +15,6 @@ import notFound from "@/assets/svgs/404-icon.svg"; import router from "@/router"; import { HomeFilled } from "@ant-design/icons-vue"; -import { h } from "vue"; - const handleGoHome = () => { router.push("/"); }; diff --git a/EdgeCraftRAG/ui/vue/src/views/pipeline/components/QuickStart.vue b/EdgeCraftRAG/ui/vue/src/views/main/QuickStart.vue similarity index 98% rename from EdgeCraftRAG/ui/vue/src/views/pipeline/components/QuickStart.vue rename to EdgeCraftRAG/ui/vue/src/views/main/QuickStart.vue index a817fbba68..93c5abb1b9 100644 --- a/EdgeCraftRAG/ui/vue/src/views/pipeline/components/QuickStart.vue +++ b/EdgeCraftRAG/ui/vue/src/views/main/QuickStart.vue @@ -50,7 +50,7 @@ - - - diff --git a/EdgeCraftRAG/ui/vue/src/views/pipeline/components/UpdateDialog/Retriever.vue b/EdgeCraftRAG/ui/vue/src/views/pipeline/components/UpdateDialog/Retriever.vue deleted file mode 100644 index eb12bef097..0000000000 --- a/EdgeCraftRAG/ui/vue/src/views/pipeline/components/UpdateDialog/Retriever.vue +++ /dev/null @@ -1,135 +0,0 @@ - - - - - diff --git a/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/columnsList.ts b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/columnsList.ts new file mode 100644 index 0000000000..f508282abd --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/columnsList.ts @@ -0,0 +1,64 @@ +// Copyright (C) 2025 Intel Corporation +// SPDX-License-Identifier: Apache-2.0 + +const getTableColumns = (t: (key: string) => string): TableColumns[] => [ + { + title: t("agent.name"), + key: "name", + dataIndex: "name", + fixed: "left", + minWidth: 100, + visible: true, + disabled: true, + }, + { + title: t("agent.id"), + dataIndex: "idx", + key: "idx", + minWidth: 100, + ellipsis: true, + visible: true, + }, + { + title: t("agent.pipeline"), + dataIndex: "pipeline_idx", + key: "pipeline_idx", + minWidth: 100, + ellipsis: true, + visible: true, + }, + { + title: t("agent.label.type"), + dataIndex: "type", + key: "type", + minWidth: 60, + ellipsis: true, + visible: true, + }, + { + title: t("agent.configs"), + dataIndex: "configs", + key: "configs", + minWidth: 120, + ellipsis: true, + visible: true, + }, + { + title: t("agent.status"), + dataIndex: "active", + key: "active", + minWidth: 80, + ellipsis: true, + visible: true, + }, + { + title: t("pipeline.operation"), + key: "operation", + dataIndex: "operation", + fixed: "right", + visible: true, + disabled: true, + }, +]; + +export default getTableColumns; diff --git a/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/components/DynamicConfigs.vue b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/components/DynamicConfigs.vue new file mode 100644 index 0000000000..b767282194 --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/components/DynamicConfigs.vue @@ -0,0 +1,116 @@ + + + + + diff --git a/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/components/Table.vue b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/components/Table.vue new file mode 100644 index 0000000000..48764d1b53 --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/components/Table.vue @@ -0,0 +1,204 @@ + + + + + diff --git a/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/components/UpdateDialog.vue b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/components/UpdateDialog.vue new file mode 100644 index 0000000000..09f2dc9bd5 --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/components/UpdateDialog.vue @@ 
-0,0 +1,382 @@ + + + + + diff --git a/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/components/index.ts b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/components/index.ts new file mode 100644 index 0000000000..cc6876330d --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/components/index.ts @@ -0,0 +1,8 @@ +// Copyright (C) 2025 Intel Corporation +// SPDX-License-Identifier: Apache-2.0 + +import Table from "./Table.vue"; +import UpdateDialog from "./UpdateDialog.vue"; +import DynamicConfigs from "./DynamicConfigs.vue"; + +export { Table, UpdateDialog, DynamicConfigs }; diff --git a/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/enum.ts b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/enum.ts new file mode 100644 index 0000000000..b9f2afa271 --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/enum.ts @@ -0,0 +1,13 @@ +// Copyright (C) 2025 Intel Corporation +// SPDX-License-Identifier: Apache-2.0 + +export const AgentType = [ + { + name: "Simple", + value: "simple", + }, + { + name: "Deep Search", + value: "deep_search", + }, +] as const; diff --git a/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/index.vue b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/index.vue new file mode 100644 index 0000000000..47da93d7ed --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/index.vue @@ -0,0 +1,74 @@ + + + + + diff --git a/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/type.ts b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/type.ts new file mode 100644 index 0000000000..1ceaa77944 --- /dev/null +++ b/EdgeCraftRAG/ui/vue/src/views/settings/components/Agent/type.ts @@ -0,0 +1,10 @@ +// Copyright (C) 2025 Intel Corporation +// SPDX-License-Identifier: Apache-2.0 + +export interface ModelType { + model_id: string | undefined; + model_path: string; + model_url?: string; + device: string; + weight?: string; +} diff --git a/EdgeCraftRAG/ui/vue/src/views/pipeline/components/columnsList.ts b/EdgeCraftRAG/ui/vue/src/views/settings/components/Pipeline/columnsList.ts similarity index 100% rename from EdgeCraftRAG/ui/vue/src/views/pipeline/components/columnsList.ts rename to EdgeCraftRAG/ui/vue/src/views/settings/components/Pipeline/columnsList.ts diff --git a/EdgeCraftRAG/ui/vue/src/views/pipeline/components/DetailDrawer.vue b/EdgeCraftRAG/ui/vue/src/views/settings/components/Pipeline/components/DetailDrawer.vue similarity index 90% rename from EdgeCraftRAG/ui/vue/src/views/pipeline/components/DetailDrawer.vue rename to EdgeCraftRAG/ui/vue/src/views/settings/components/Pipeline/components/DetailDrawer.vue index 616ca925f2..a2aca72f05 100644 --- a/EdgeCraftRAG/ui/vue/src/views/pipeline/components/DetailDrawer.vue +++ b/EdgeCraftRAG/ui/vue/src/views/settings/components/Pipeline/components/DetailDrawer.vue @@ -83,6 +83,17 @@ formData.indexer.indexer_type }} +
  • + {{ + $t("pipeline.config.embeddingUrl") + }} + {{ + formData.indexer?.embedding_url + }} +
  • {{ $t("pipeline.config.embedding") @@ -101,13 +112,17 @@
  • {{ - $t("pipeline.config.vector_uri") + $t("pipeline.config.vector_url") }} {{ - formData.indexer.vector_uri + formData.indexer?.vector_url }}
  • @@ -165,6 +180,10 @@ {{ item.processor_type }}