diff --git a/MultimodalQnA/README.md b/MultimodalQnA/README.md index bda42ee285..6b92b19062 100644 --- a/MultimodalQnA/README.md +++ b/MultimodalQnA/README.md @@ -90,7 +90,7 @@ In the below, we provide a table that describes for each microservice component | MicroService | Open Source Project | HW | Port | Endpoint | | ------------ | --------------------- | ----- | ---- | ----------------------------------------------------------- | | Embedding | Langchain | Xeon | 6000 | /v1/embeddings | -| Retriever | Langchain, Redis | Xeon | 7000 | /v1/multimodal_retrieval | +| Retriever | Langchain, Redis | Xeon | 7000 | /v1/retrieval | | LVM | Langchain, TGI | Gaudi | 9399 | /v1/lvm | | Dataprep | Redis, Langchain, TGI | Gaudi | 6007 | /v1/generate_transcripts, /v1/generate_captions, /v1/ingest | diff --git a/MultimodalQnA/docker_compose/amd/gpu/rocm/README.md b/MultimodalQnA/docker_compose/amd/gpu/rocm/README.md index f49b9815f1..4e3a031da9 100644 --- a/MultimodalQnA/docker_compose/amd/gpu/rocm/README.md +++ b/MultimodalQnA/docker_compose/amd/gpu/rocm/README.md @@ -178,7 +178,7 @@ curl http://${host_ip}:$MM_EMBEDDING_PORT_MICROSERVICE/v1/embeddings \ ```bash export your_embedding=$(python3 -c "import random; embedding = [random.uniform(-1, 1) for _ in range(512)]; print(embedding)") -curl http://${host_ip}:7000/v1/multimodal_retrieval \ +curl http://${host_ip}:7000/v1/retrieval \ -X POST \ -H "Content-Type: application/json" \ -d "{\"text\":\"test\",\"embedding\":${your_embedding}}" diff --git a/MultimodalQnA/docker_compose/intel/cpu/xeon/README.md b/MultimodalQnA/docker_compose/intel/cpu/xeon/README.md index 7e4fa6894a..d3cff8e32c 100644 --- a/MultimodalQnA/docker_compose/intel/cpu/xeon/README.md +++ b/MultimodalQnA/docker_compose/intel/cpu/xeon/README.md @@ -10,116 +10,16 @@ For detailed information about these instance types, you can refer to this [link After launching your instance, you can connect to it using SSH (for Linux instances) or Remote Desktop Protocol (RDP) (for Windows instances). From there, you'll have full access to your Xeon server, allowing you to install, configure, and manage your applications as needed. -**Certain ports in the EC2 instance need to opened up in the security group, for the microservices to work with the curl commands** - -> See one example below. Please open up these ports in the EC2 instance based on the IP addresses you want to allow - -``` -redis-vector-db -=============== -Port 6379 - Open to 0.0.0.0/0 -Port 8001 - Open to 0.0.0.0/0 - -embedding-multimodal-bridgetower -===================== -Port 6006 - Open to 0.0.0.0/0 - -embedding -========= -Port 6000 - Open to 0.0.0.0/0 - -retriever-multimodal-redis -========= -Port 7000 - Open to 0.0.0.0/0 - -lvm-llava -================ -Port 8399 - Open to 0.0.0.0/0 - -lvm -=== -Port 9399 - Open to 0.0.0.0/0 - -whisper -=== -port 7066 - Open to 0.0.0.0/0 - -dataprep-multimodal-redis -=== -Port 6007 - Open to 0.0.0.0/0 - -multimodalqna -========================== -Port 8888 - Open to 0.0.0.0/0 - -multimodalqna-ui -===================== -Port 5173 - Open to 0.0.0.0/0 -``` - ## Setup Environment Variables Since the `compose.yaml` will consume some environment variables, you need to setup them in advance as below. 
-**Export the value of the public IP address of your Xeon server to the `host_ip` environment variable** - -> Change the External_Public_IP below with the actual IPV4 value - -``` -export host_ip="External_Public_IP" -``` - -**Append the value of the public IP address to the no_proxy list** - -```bash -export your_no_proxy=${your_no_proxy},"External_Public_IP" -``` - ```bash -export no_proxy=${your_no_proxy} -export http_proxy=${your_http_proxy} -export https_proxy=${your_http_proxy} -export MM_EMBEDDING_SERVICE_HOST_IP=${host_ip} -export MM_RETRIEVER_SERVICE_HOST_IP=${host_ip} -export LVM_SERVICE_HOST_IP=${host_ip} -export MEGA_SERVICE_HOST_IP=${host_ip} -export WHISPER_PORT=7066 -export WHISPER_SERVER_ENDPOINT="http://${host_ip}:${WHISPER_PORT}/v1/asr" -export WHISPER_MODEL="base" -export MAX_IMAGES=1 -export REDIS_DB_PORT=6379 -export REDIS_INSIGHTS_PORT=8001 -export REDIS_URL="redis://${host_ip}:${REDIS_DB_PORT}" -export REDIS_HOST=${host_ip} -export INDEX_NAME="mm-rag-redis" -export DATAPREP_MMR_PORT=6007 -export DATAPREP_INGEST_SERVICE_ENDPOINT="http://${host_ip}:${DATAPREP_MMR_PORT}/v1/dataprep/ingest" -export DATAPREP_GEN_TRANSCRIPT_SERVICE_ENDPOINT="http://${host_ip}:${DATAPREP_MMR_PORT}/v1/dataprep/generate_transcripts" -export DATAPREP_GEN_CAPTION_SERVICE_ENDPOINT="http://${host_ip}:${DATAPREP_MMR_PORT}/v1/dataprep/generate_captions" -export DATAPREP_GET_FILE_ENDPOINT="http://${host_ip}:${DATAPREP_MMR_PORT}/v1/dataprep/get" -export DATAPREP_DELETE_FILE_ENDPOINT="http://${host_ip}:${DATAPREP_MMR_PORT}/v1/dataprep/delete" -export EMM_BRIDGETOWER_PORT=6006 -export EMBEDDING_MODEL_ID="BridgeTower/bridgetower-large-itm-mlm-itc" -export BRIDGE_TOWER_EMBEDDING=true -export MMEI_EMBEDDING_ENDPOINT="http://${host_ip}:$EMM_BRIDGETOWER_PORT" -export MM_EMBEDDING_PORT_MICROSERVICE=6000 -export REDIS_RETRIEVER_PORT=7000 -export LVM_PORT=9399 -export LLAVA_SERVER_PORT=8399 -export LVM_MODEL_ID="llava-hf/llava-1.5-7b-hf" -export LVM_ENDPOINT="http://${host_ip}:$LLAVA_SERVER_PORT" -export MEGA_SERVICE_PORT=8888 -export BACKEND_SERVICE_ENDPOINT="http://${host_ip}:$MEGA_SERVICE_PORT/v1/multimodalqna" -export UI_PORT=5173 +source set_env.sh ``` Note: Please replace with `host_ip` with you external IP address, do not use localhost. -> Note: The `MAX_IMAGES` environment variable is used to specify the maximum number of images that will be sent from the LVM service to the LLaVA server. -> If an image list longer than `MAX_IMAGES` is sent to the LVM server, a shortened image list will be sent to the LLaVA service. If the image list -> needs to be shortened, the most recent images (the ones at the end of the list) are prioritized to send to the LLaVA service. Some LLaVA models have not -> been trained with multiple images and may lead to inaccurate results. If `MAX_IMAGES` is not set, it will default to `1`. - ## πŸš€ Build Docker Images ### 1. Build embedding-multimodal-bridgetower Image @@ -146,7 +46,13 @@ docker build --no-cache -t opea/retriever:latest --build-arg https_proxy=$https_ ### 3. Build LVM Images -Build lvm-llava image +Pull vllm image + +```bash +docker pull opea/vllm:latest +``` + +Build lvm-llava image (Optional) ```bash docker build --no-cache -t opea/lvm-llava:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/lvms/src/integrations/dependency/llava/Dockerfile . @@ -197,14 +103,15 @@ Then run the command `docker images`, you will have the following 11 Docker Imag 1. `opea/dataprep:latest` 2. `opea/lvm:latest` -3. `opea/lvm-llava:latest` -4. 
`opea/retriever:latest` -5. `opea/whisper:latest` -6. `opea/redis-vector-db` -7. `opea/embedding:latest` -8. `opea/embedding-multimodal-bridgetower:latest` -9. `opea/multimodalqna:latest` -10. `opea/multimodalqna-ui:latest` +3. `opea/vllm:latest` +4. `opea/lvm-llava:latest` (Optional) +5. `opea/retriever:latest` +6. `opea/whisper:latest` +7. `opea/redis-vector-db` +8. `opea/embedding:latest` +9. `opea/embedding-multimodal-bridgetower:latest` +10. `opea/multimodalqna:latest` +11. `opea/multimodalqna-ui:latest` ## πŸš€ Start Microservices @@ -264,7 +171,7 @@ curl http://${host_ip}:$MM_EMBEDDING_PORT_MICROSERVICE/v1/embeddings \ ```bash export your_embedding=$(python3 -c "import random; embedding = [random.uniform(-1, 1) for _ in range(512)]; print(embedding)") -curl http://${host_ip}:${REDIS_RETRIEVER_PORT}/v1/multimodal_retrieval \ +curl http://${host_ip}:${REDIS_RETRIEVER_PORT}/v1/retrieval \ -X POST \ -H "Content-Type: application/json" \ -d "{\"text\":\"test\",\"embedding\":${your_embedding}}" @@ -279,7 +186,7 @@ curl ${WHISPER_SERVER_ENDPOINT} \ -d '{"audio" : "UklGRigAAABXQVZFZm10IBIAAAABAAEARKwAAIhYAQACABAAAABkYXRhAgAAAAEA"}' ``` -5. lvm-llava +5. lvm-llava (Optional) ```bash curl http://${host_ip}:${LLAVA_SERVER_PORT}/generate \ diff --git a/MultimodalQnA/docker_compose/intel/cpu/xeon/compose.yaml b/MultimodalQnA/docker_compose/intel/cpu/xeon/compose.yaml index 31f543c755..328cdd43ee 100644 --- a/MultimodalQnA/docker_compose/intel/cpu/xeon/compose.yaml +++ b/MultimodalQnA/docker_compose/intel/cpu/xeon/compose.yaml @@ -24,7 +24,7 @@ services: container_name: dataprep-multimodal-redis depends_on: - redis-vector-db - - lvm-llava + - vllm-service ports: - "${DATAPREP_MMR_PORT}:5000" environment: @@ -97,24 +97,31 @@ services: LOGFLAG: ${LOGFLAG} RETRIEVER_COMPONENT_NAME: "OPEA_RETRIEVER_REDIS" restart: unless-stopped - lvm-llava: - image: ${REGISTRY:-opea}/lvm-llava:${TAG:-latest} - container_name: lvm-llava + vllm-service: + image: ${REGISTRY:-opea}/vllm:${TAG:-latest} + container_name: vllm-service ports: - - "${LLAVA_SERVER_PORT}:${LLAVA_SERVER_PORT}" + - ${VLLM_PORT:-8399}:80 + volumes: + - "${MODEL_CACHE:-./data}:/root/.cache/huggingface/hub" environment: no_proxy: ${no_proxy} http_proxy: ${http_proxy} https_proxy: ${https_proxy} - LLAVA_SERVER_PORT: ${LLAVA_SERVER_PORT} - LVM_PORT: ${LVM_PORT} - entrypoint: ["python", "llava_server.py", "--device", "cpu", "--model_name_or_path", $LVM_MODEL_ID] - restart: unless-stopped + HF_TOKEN: ${HUGGINGFACEHUB_API_TOKEN} + VLLM_TORCH_PROFILER_DIR: "/mnt" + healthcheck: + test: ["CMD-SHELL", "curl -f http://localhost:80/health || exit 1"] + interval: 10s + timeout: 10s + retries: 100 + command: --model $LVM_MODEL_ID --host 0.0.0.0 --port 80 --chat-template examples/template_llava.jinja # https://docs.vllm.ai/en/v0.5.0/models/vlm.html + lvm: image: ${REGISTRY:-opea}/lvm:${TAG:-latest} container_name: lvm depends_on: - - lvm-llava + - vllm-service ports: - "${LVM_PORT}:${LVM_PORT}" ipc: host @@ -122,11 +129,10 @@ services: no_proxy: ${no_proxy} http_proxy: ${http_proxy} https_proxy: ${https_proxy} - LVM_COMPONENT_NAME: "OPEA_LLAVA_LVM" + LVM_COMPONENT_NAME: "OPEA_VLLM_LVM" LVM_ENDPOINT: ${LVM_ENDPOINT} LLAVA_SERVER_PORT: ${LLAVA_SERVER_PORT} LVM_PORT: ${LVM_PORT} - MAX_IMAGES: ${MAX_IMAGES:-1} restart: unless-stopped multimodalqna: image: ${REGISTRY:-opea}/multimodalqna:${TAG:-latest} diff --git a/MultimodalQnA/docker_compose/intel/cpu/xeon/set_env.sh b/MultimodalQnA/docker_compose/intel/cpu/xeon/set_env.sh index 057f90990c..9556aa321d 100755 --- 
a/MultimodalQnA/docker_compose/intel/cpu/xeon/set_env.sh +++ b/MultimodalQnA/docker_compose/intel/cpu/xeon/set_env.sh @@ -8,10 +8,6 @@ popd > /dev/null export host_ip=$(hostname -I | awk '{print $1}') -export no_proxy=${your_no_proxy} -export http_proxy=${your_http_proxy} -export https_proxy=${your_http_proxy} - export MM_EMBEDDING_SERVICE_HOST_IP=${host_ip} export MM_RETRIEVER_SERVICE_HOST_IP=${host_ip} export LVM_SERVICE_HOST_IP=${host_ip} @@ -44,6 +40,9 @@ export BRIDGE_TOWER_EMBEDDING=true export REDIS_RETRIEVER_PORT=7000 export LVM_PORT=9399 +# for vllm server +export VLLM_PORT=8399 +# for llava naive server export LLAVA_SERVER_PORT=8399 export LVM_MODEL_ID="llava-hf/llava-1.5-7b-hf" export LVM_ENDPOINT="http://${host_ip}:${LLAVA_SERVER_PORT}" diff --git a/MultimodalQnA/docker_compose/intel/hpu/gaudi/README.md b/MultimodalQnA/docker_compose/intel/hpu/gaudi/README.md index 2379fc3d4d..0276236ede 100644 --- a/MultimodalQnA/docker_compose/intel/hpu/gaudi/README.md +++ b/MultimodalQnA/docker_compose/intel/hpu/gaudi/README.md @@ -210,7 +210,7 @@ curl http://${host_ip}:$MM_EMBEDDING_PORT_MICROSERVICE/v1/embeddings \ ```bash export your_embedding=$(python3 -c "import random; embedding = [random.uniform(-1, 1) for _ in range(512)]; print(embedding)") -curl http://${host_ip}:7000/v1/multimodal_retrieval \ +curl http://${host_ip}:7000/v1/retrieval \ -X POST \ -H "Content-Type: application/json" \ -d "{\"text\":\"test\",\"embedding\":${your_embedding}}" diff --git a/VideoQnA/Dockerfile b/VideoQnA/Dockerfile deleted file mode 100644 index 2aade6088f..0000000000 --- a/VideoQnA/Dockerfile +++ /dev/null @@ -1,9 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -ARG BASE_TAG=latest -FROM opea/comps-base:$BASE_TAG - -COPY ./videoqna.py $HOME/videoqna.py - -ENTRYPOINT ["python", "videoqna.py"] diff --git a/VideoQnA/README.md b/VideoQnA/README.md deleted file mode 100644 index e64a045df0..0000000000 --- a/VideoQnA/README.md +++ /dev/null @@ -1,100 +0,0 @@ -# VideoQnA Application - -VideoQnA is a framework that retrieves video based on provided user prompt. It uses only the video embeddings to perform vector similarity search in Intel's VDMS vector database and performs all operations on Intel Xeon CPU. The pipeline supports long form videos and time-based search. - -VideoQnA is implemented on top of [GenAIComps](https://github.com/opea-project/GenAIComps), with the architecture flow chart shows below: - -```mermaid ---- -config: - flowchart: - nodeSpacing: 400 - rankSpacing: 100 - curve: linear - themeVariables: - fontSize: 50px ---- -flowchart LR - %% Colors %% - classDef blue fill:#ADD8E6,stroke:#ADD8E6,stroke-width:2px,fill-opacity:0.5 - classDef orange fill:#FBAA60,stroke:#ADD8E6,stroke-width:2px,fill-opacity:0.5 - classDef orchid fill:#C26DBC,stroke:#ADD8E6,stroke-width:2px,fill-opacity:0.5 - classDef invisible fill:transparent,stroke:transparent; - style VideoQnA-MegaService stroke:#000000 - %% Subgraphs %% - subgraph VideoQnA-MegaService["VideoQnA-MegaService"] - direction LR - EM([Embedding MicroService]):::blue - RET([Retrieval MicroService]):::blue - RER([Rerank MicroService]):::blue - LVM([LVM MicroService]):::blue - end - subgraph User Interface - direction LR - a([User Input Query]):::orchid - UI([UI server
<br>]):::orchid - Ingest([Ingest<br>]):::orchid - end - - LOCAL_RER{{Reranking service<br>}} - CLIP_EM{{Embedding service<br>}} - VDB{{Vector DB<br><br>}} - V_RET{{Retriever service<br>}} - Ingest{{Ingest data<br>}} - DP([Data Preparation<br>]):::blue - LVM_gen{{LVM Service<br>}} - GW([VideoQnA GateWay<br>
]):::orange - - %% Data Preparation flow - %% Ingest data flow - direction LR - Ingest[Ingest data] --> UI - UI --> DP - DP <-.-> CLIP_EM - - %% Questions interaction - direction LR - a[User Input Query] --> UI - UI --> GW - GW <==> VideoQnA-MegaService - EM ==> RET - RET ==> RER - RER ==> LVM - - - %% Embedding service flow - direction LR - EM <-.-> CLIP_EM - RET <-.-> V_RET - RER <-.-> LOCAL_RER - LVM <-.-> LVM_gen - - direction TB - %% Vector DB interaction - V_RET <-.->VDB - DP <-.->VDB -``` - -- This project implements a Retrieval-Augmented Generation (RAG) workflow using LangChain, Intel VDMS VectorDB, and Text Generation Inference, optimized for Intel Xeon Scalable Processors. -- Video Processing: Videos are converted into feature vectors using mean aggregation and stored in the VDMS vector store. -- Query Handling: When a user submits a query, the system performs a similarity search in the vector store to retrieve the best-matching videos. -- Contextual Inference: The retrieved videos are then sent to the Large Vision Model (LVM) for inference, providing supplemental context for the query. - -## Deploy VideoQnA Service - -The VideoQnA service can be effortlessly deployed on Intel Xeon Scalable Processors. - -### Required Models - -By default, the embedding and LVM models are set to a default value as listed below: - -| Service | Model | -| --------- | ---------------------------- | -| Embedding | openai/clip-vit-base-patch32 | -| LVM | DAMO-NLP-SG/Video-LLaMA | - -### Deploy VideoQnA on Xeon - -For full instruction of deployment, please check [Guide](docker_compose/intel/cpu/xeon/README.md) - -Currently we support deploying VideoQnA services with docker compose, using the docker images `built from source`. Find the corresponding [compose.yaml](docker_compose/intel/cpu/xeon/compose.yaml). diff --git a/VideoQnA/assets/img/videoqna.gif b/VideoQnA/assets/img/videoqna.gif deleted file mode 100644 index 45bf7a462a..0000000000 Binary files a/VideoQnA/assets/img/videoqna.gif and /dev/null differ diff --git a/VideoQnA/docker_compose/intel/cpu/xeon/README.md b/VideoQnA/docker_compose/intel/cpu/xeon/README.md deleted file mode 100644 index 478f99fe38..0000000000 --- a/VideoQnA/docker_compose/intel/cpu/xeon/README.md +++ /dev/null @@ -1,346 +0,0 @@ -# Build Mega Service of VideoQnA on Xeon - -This document outlines the deployment process for a videoqna application utilizing the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservice pipeline on Intel Xeon server. The steps include Docker image creation, container deployment via Docker Compose, and service execution to integrate microservices such as `embedding`, `retriever`, `rerank`, and `lvm`. We will publish the Docker images to Docker Hub soon, it will simplify the deployment process for this service. - -VideoQnA is a pipeline that retrieves video based on provided user prompt. It uses only the video embeddings to perform vector similarity search in Intel's VDMS vector database and performs all operations on Intel Xeon CPU. The pipeline supports long form videos and time-based search. 
- -## πŸš€ Port used for the microservices - -``` -dataprep -======== -Port 6007 - Open to 0.0.0.0/0 - -vdms-vector-db -=============== -Port 8001 - Open to 0.0.0.0/0 - -embedding -========= -Port 6000 - Open to 0.0.0.0/0 - -retriever -========= -Port 7000 - Open to 0.0.0.0/0 - -reranking -========= -Port 8000 - Open to 0.0.0.0/0 - -lvm video-llama -=============== -Port 9009 - Open to 0.0.0.0/0 - -lvm -=== -Port 9000 - Open to 0.0.0.0/0 - -chaqna-xeon-backend-server -========================== -Port 8888 - Open to 0.0.0.0/0 - -chaqna-xeon-ui-server -===================== -Port 5173 - Open to 0.0.0.0/0 -``` - -## πŸš€ Build Docker Images - -First of all, you need to build Docker Images locally and install the python package of it. - -### 1. Build Embedding Image - -```bash -git clone https://github.com/opea-project/GenAIComps.git -cd GenAIComps -docker build -t opea/embedding-multimodal-clip:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/third_parties/clip/src/Dockerfile . -``` - -### 2. Build Retriever Image - -```bash -docker build -t opea/retriever:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/retrievers/src/Dockerfile . -``` - -### 3. Build Reranking Image - -```bash -docker build -t opea/reranking:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/rerankings/src/Dockerfile . -``` - -### 4. Build LVM Image (Xeon) - -```bash -docker build -t opea/lvm-video-llama:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/lvms/src/integrations/dependency/video-llama/Dockerfile . - -# LVM Service Image -docker build -t opea/lvm:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/lvms/src/Dockerfile . -``` - -### 5. Build Dataprep Image - -```bash -docker build -t opea/dataprep:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/dataprep/src/Dockerfile . -``` - -### 6. Build MegaService Docker Image - -To construct the Mega Service, we utilize the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservice pipeline within the `videoqna.py` Python script. - -Build MegaService Docker image via below command: - -```bash -git clone https://github.com/opea-project/GenAIExamples.git -cd GenAIExamples/VideoQnA/ -docker build -t opea/videoqna:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . -``` - -### 7. Build UI Docker Image - -Build frontend Docker image via below command: - -```bash -cd GenAIExamples/VideoQnA/ui/ -docker build -t opea/videoqna-ui:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f ./docker/Dockerfile . -``` - -Then run the command `docker images`, you will have the following 8 Docker Images: - -1. `opea/dataprep:latest` -2. `opea/embedding-multimodal-clip:latest` -3. `opea/retriever:latest` -4. `opea/reranking:latest` -5. `opea/video-llama-lvm-server:latest` -6. # `opea/lvm-video-llama:latest` -7. `opea/reranking-tei:latest` -8. `opea/lvm-video-llama:latest` -9. `opea/lvm:latest` -10. `opea/videoqna:latest` -11. `opea/videoqna-ui:latest` - -## πŸš€ Start Microservices - -### Setup Environment Variables - -Since the `compose.yaml` will consume some environment variables, you need to setup them in advance as below. 
- -**Export the value of the public IP address of your Xeon server to the `host_ip` environment variable** - -> Change the `External_Public_IP` below with the actual IPV4 value - -``` -export host_ip="External_Public_IP" -``` - -**Export the value of your Huggingface API token to the `your_hf_api_token` environment variable** - -> Change the `Your_Huggingface_API_Token` below with your actual Huggingface API Token value - -``` -export your_hf_api_token="Your_Huggingface_API_Token" -``` - -**Append the value of the public IP address to the no_proxy list** - -``` -export your_no_proxy="${your_no_proxy},${host_ip}" -``` - -Then you can run below commands or `source set_env.sh` to set all the variables - -```bash -export no_proxy=${your_no_proxy} -export http_proxy=${your_http_proxy} -export https_proxy=${your_http_proxy} -export MEGA_SERVICE_HOST_IP=${host_ip} -export EMBEDDING_SERVICE_HOST_IP=${host_ip} -export RETRIEVER_SERVICE_HOST_IP=${host_ip} -export RERANK_SERVICE_HOST_IP=${host_ip} -export LVM_SERVICE_HOST_IP=${host_ip} - -export LVM_ENDPOINT="http://${host_ip}:9009" -export BACKEND_SERVICE_ENDPOINT="http://${host_ip}:8888/v1/videoqna" -export BACKEND_HEALTH_CHECK_ENDPOINT="http://${host_ip}:8888/v1/health_check" -export DATAPREP_SERVICE_ENDPOINT="http://${host_ip}:6007/v1/dataprep/ingest" -export DATAPREP_GET_FILE_ENDPOINT="http://${host_ip}:6007/v1/dataprep/get" -export DATAPREP_GET_VIDEO_LIST_ENDPOINT="http://${host_ip}:6007/v1/dataprep/get_videos" - -export VDMS_HOST=${host_ip} -export VDMS_PORT=8001 -export INDEX_NAME="mega-videoqna" -export LLM_DOWNLOAD="True" -export USECLIP=1 - -export HUGGINGFACEHUB_API_TOKEN=${your_hf_api_token} -``` - -Note: Replace with `host_ip` with you external IP address, do not use localhost. - -### Start all the services with Docker Containers - -Before running the docker compose command, you need to be in the folder that has the docker compose yaml file. To avoid model re-download, we manage the volume separately using [external volume](https://docs.docker.com/reference/compose-file/volumes/#external). - -There are 2 parts of the pipeline: - -- The first is the data preparation, with which you could add your videos into the database. -- The second is the megaservice, serves as the main service, takes the user query, consumes the microservices to give the response. Including embedding, retrieving, reranking and LVM. - -In the deploy steps, you need to start the VDMS DB and dataprep firstly, then insert some sample data into it. After that you could get the megaservice up. - -```bash -cd GenAIExamples/VideoQnA/docker_compose/intel/cpu/xeon/ - -docker volume create video-llama-model -docker compose up vdms-vector-db dataprep -d -sleep 1m # wait for the services ready - -# Insert some sample data to the DB -curl -X POST http://${host_ip}:6007/v1/dataprep/ingest \ - -H "Content-Type: multipart/form-data" \ - -F "files=@./data/op_1_0320241830.mp4" - -# Bring all the others -docker compose up -d -# wait until all the services is up. The LVM server will download models, so it take ~1.5hr to get ready. -``` - -### Validate Microservices - -1. Dataprep Microservice - - Once the microservice is up, ingest the videos files into vector store using dataprep microservice. Both single and multiple file(s) uploads are supported. 
- - ```bash - # Single file upload - curl -X POST ${DATAPREP_SERVICE_ENDPOINT} \ - -H "Content-Type: multipart/form-data" \ - -F "files=@./file1.mp4" - # Multiple file upload - curl -X POST ${DATAPREP_SERVICE_ENDPOINT} \ - -H "Content-Type: multipart/form-data" \ - -F "files=@./file1.mp4" \ - -F "files=@./file2.mp4" \ - -F "files=@./file3.mp4" - ``` - - Use below method to check and download available videos the microservice. The download endpoint is also used for LVM and UI. - - ```bash - # List available videos - curl -X 'GET' ${DATAPREP_GET_VIDEO_LIST_ENDPOINT} -H 'accept: application/json' - # Download available video - curl -X 'GET' ${DATAPREP_GET_FILE_ENDPOINT}/video_name.mp4 -H 'accept: application/json' - ``` - -2. Embedding Microservice - - ```bash - curl http://${host_ip}:6000/v1/embeddings \ - -X POST \ - -d '{"text":"Sample text"}' \ - -H 'Content-Type: application/json' - ``` - -3. Retriever Microservice - - To consume the retriever microservice, you need to generate a mock embedding vector by Python script. The length of embedding vector - is determined by the embedding model. - Here we use the model `openai/clip-vit-base-patch32`, which vector size is 512. - - Check the vector dimension of your embedding model, set `your_embedding` dimension equals to it. - - ```bash - export your_embedding=$(python3 -c "import random; embedding = [random.uniform(-1, 1) for _ in range(512)]; print(embedding)") - curl http://${host_ip}:7000/v1/retrieval \ - -X POST \ - -d "{\"text\":\"test\",\"embedding\":${your_embedding}}" \ - -H 'Content-Type: application/json' - ``` - -4. Reranking Microservice - - ```bash - curl http://${host_ip}:8000/v1/reranking \ - -X 'POST' \ - -H 'accept: application/json' \ - -H 'Content-Type: application/json' \ - -d '{ - "retrieved_docs": [{"doc": [{"text": "this is the retrieved text"}]}], - "initial_query": "this is the query", - "top_n": 1, - "metadata": [ - {"other_key": "value", "video":"top_video_name", "timestamp":"20"} - ] - }' - ``` - -5. LVM backend Service - - In first startup, this service will take times to download the LLM file. After it's finished, the service will be ready. - - Use `docker logs lvm-video-llama` to check if the download is finished. - - ```bash - curl -X POST \ - "http://${host_ip}:9009/generate?video_url=silence_girl.mp4&start=0.0&duration=9&prompt=What%20is%20the%20person%20doing%3F&max_new_tokens=150" \ - -H "accept: */*" \ - -d '' - ``` - - > To avoid re-download for the model in case of restart, see [here](#clean-microservices) - -6. LVM Microservice - - This service depends on above LLM backend service startup. It will be ready after long time, to wait for them being ready in first startup. - - ```bash - curl http://${host_ip}:9000/v1/lvm\ - -X POST \ - -d '{"video_url":"https://github.com/DAMO-NLP-SG/Video-LLaMA/raw/main/examples/silence_girl.mp4","chunk_start": 0,"chunk_duration": 7,"prompt":"What is the person doing?","max_new_tokens": 50}' \ - -H 'Content-Type: application/json' - ``` - - > Note that the local video file will be deleted after completion to conserve disk space. - -7. MegaService - - ```bash - curl http://${host_ip}:8888/v1/videoqna -H "Content-Type: application/json" -d '{ - "messages": "What is the man doing?", - "stream": "True" - }' - ``` - - > Note that the megaservice support only stream output. - -## πŸš€ Launch the UI - -To access the frontend, open the following URL in your browser: http://{host_ip}:5173. By default, the UI runs on port 5173 internally. 
If you prefer to use a different host port to access the frontend, you can modify the port mapping in the `compose.yaml` file as shown below: - -```yaml - videoqna-xeon-ui-server: - image: opea/videoqna-ui:latest - ... - ports: - - "80:5173" # port map to host port 80 -``` - -Here is an example of running videoqna: - -![project-screenshot](../../../../assets/img/videoqna.gif) - -## Clean Microservices - -All the allocated resources could be easily removed by: - -```bash -docker compose -f compose.yaml down -``` - -If you plan to restart the service in the future, the above command is enough. The model file is saved in docker volume `video-llama-model` and will be reserved on your server. Next time when you restart the service, set `export LLM_DOWNLOAD="False"` before start to reuse the volume. - -To clean the volume: - -```bash -docker volume rm video-llama-model -``` diff --git a/VideoQnA/docker_compose/intel/cpu/xeon/compose.yaml b/VideoQnA/docker_compose/intel/cpu/xeon/compose.yaml deleted file mode 100644 index 780ff3c704..0000000000 --- a/VideoQnA/docker_compose/intel/cpu/xeon/compose.yaml +++ /dev/null @@ -1,155 +0,0 @@ - -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - - -services: - vdms-vector-db: - image: intellabs/vdms:v2.8.0 - container_name: vdms-vector-db - ports: - - "8001:55555" - dataprep: - image: ${REGISTRY:-opea}/dataprep:${TAG:-latest} - container_name: dataprep-vdms-server - depends_on: - - vdms-vector-db - ports: - - "6007:5000" - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - VDMS_HOST: ${VDMS_HOST} - VDMS_PORT: ${VDMS_PORT} - INDEX_NAME: ${INDEX_NAME} - MULTIMODAL_DATAPREP: true - entrypoint: sh -c 'sleep 15 && python ingest_videos.py' - volumes: - - /home/$USER/.cache/clip:/home/user/.cache/clip - - /home/$USER/.cache/huggingface/hub:/home/user/.cache/huggingface/hub - embedding: - image: ${REGISTRY:-opea}/embedding-multimodal-clip:${TAG:-latest} - container_name: embedding-multimodal-server - ports: - - "6000:6000" - ipc: host - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - volumes: - - /home/$USER/.cache/huggingface/hub:/home/user/.cache/huggingface/hub - restart: unless-stopped - retriever: - image: ${REGISTRY:-opea}/retriever:${TAG:-latest} - container_name: retriever-vdms-server - depends_on: - - vdms-vector-db - ports: - - "7000:7000" - ipc: host - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - VDMS_INDEX_NAME: ${INDEX_NAME} - VDMS_HOST: ${VDMS_HOST} - VDMS_PORT: ${VDMS_PORT} - VDMS_USE_CLIP: ${USECLIP} - LOGFLAG: ${LOGFLAG} - RETRIEVER_COMPONENT_NAME: "OPEA_RETRIEVER_VDMS" - entrypoint: sh -c 'sleep 30 && python retriever_vdms.py' - restart: unless-stopped - volumes: - - /home/$USER/.cache/huggingface/hub:/home/user/.cache/huggingface/hub - reranking: - image: ${REGISTRY:-opea}/reranking:${TAG:-latest} - container_name: reranking-tei-server - ports: - - "8000:8000" - ipc: host - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - CHUNK_DURATION: ${CHUNK_DURATION} - FILE_SERVER_ENDPOINT: ${DATAPREP_GET_FILE_ENDPOINT} - DATAPREP_GET_VIDEO_LIST_ENDPOINT: ${DATAPREP_GET_VIDEO_LIST_ENDPOINT} - restart: unless-stopped - lvm-video-llama: - image: ${REGISTRY:-opea}/lvm-video-llama:${TAG:-latest} - container_name: lvm-video-llama - ports: - - "9009:9009" - ipc: host - environment: - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - 
no_proxy: ${no_proxy} - llm_download: ${LLM_DOWNLOAD} - volumes: - - "/home/$USER/.cache:/home/user/.cache" - - video-llama-model:/home/user/model - restart: unless-stopped - lvm: - image: ${REGISTRY:-opea}/lvm:${TAG:-latest} - container_name: lvm - ports: - - "9000:9000" - ipc: host - environment: - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - no_proxy: ${no_proxy} - LVM_COMPONENT_NAME: "OPEA_VIDEO_LLAMA_LVM" - LVM_ENDPOINT: ${LVM_ENDPOINT} - restart: unless-stopped - depends_on: - - lvm-video-llama - videoqna-xeon-backend-server: - image: ${REGISTRY:-opea}/videoqna:${TAG:-latest} - container_name: videoqna-xeon-backend-server - depends_on: - - vdms-vector-db - - dataprep - - embedding - - retriever - - reranking - - lvm-video-llama - - lvm - ports: - - "8888:8888" - entrypoint: sh -c 'sleep 45 && python videoqna.py' - environment: - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - no_proxy: ${no_proxy} - MEGA_SERVICE_HOST_IP: ${MEGA_SERVICE_HOST_IP} - EMBEDDING_SERVICE_HOST_IP: ${EMBEDDING_SERVICE_HOST_IP} - RETRIEVER_SERVICE_HOST_IP: ${RETRIEVER_SERVICE_HOST_IP} - RERANK_SERVICE_HOST_IP: ${RERANK_SERVICE_HOST_IP} - LVM_SERVICE_HOST_IP: ${LVM_SERVICE_HOST_IP} - ipc: host - restart: always - videoqna-xeon-ui-server: - image: ${REGISTRY:-opea}/videoqna-ui:${TAG:-latest} - container_name: videoqna-xeon-ui-server - depends_on: - - videoqna-xeon-backend-server - ports: - - "5173:5173" - environment: - https_proxy: ${https_proxy} - http_proxy: ${http_proxy} - no_proxy: ${no_proxy} - BACKEND_SERVICE_ENDPOINT: ${BACKEND_SERVICE_ENDPOINT} - BACKEND_HEALTH_CHECK_ENDPOINT: ${BACKEND_HEALTH_CHECK_ENDPOINT} - ipc: host - restart: always -volumes: - video-llama-model: - external: true -networks: - default: - driver: bridge diff --git a/VideoQnA/docker_compose/intel/cpu/xeon/data/op_1_0320241830.mp4 b/VideoQnA/docker_compose/intel/cpu/xeon/data/op_1_0320241830.mp4 deleted file mode 100644 index 29c5dffcdb..0000000000 Binary files a/VideoQnA/docker_compose/intel/cpu/xeon/data/op_1_0320241830.mp4 and /dev/null differ diff --git a/VideoQnA/docker_compose/intel/cpu/xeon/set_env.sh b/VideoQnA/docker_compose/intel/cpu/xeon/set_env.sh deleted file mode 100644 index dcf574774b..0000000000 --- a/VideoQnA/docker_compose/intel/cpu/xeon/set_env.sh +++ /dev/null @@ -1,28 +0,0 @@ -#!/usr/bin/env bash - -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 -pushd "../../../../../" > /dev/null -source .set_env.sh -popd > /dev/null - -host_ip=$(hostname -I | awk '{print $1}') - -export MEGA_SERVICE_HOST_IP=${host_ip} -export EMBEDDING_SERVICE_HOST_IP=${host_ip} -export RETRIEVER_SERVICE_HOST_IP=${host_ip} -export RERANK_SERVICE_HOST_IP=${host_ip} -export LVM_SERVICE_HOST_IP=${host_ip} - -export LVM_ENDPOINT="http://${host_ip}:9009" -export BACKEND_SERVICE_ENDPOINT="http://${host_ip}:8888/v1/videoqna" -export BACKEND_HEALTH_CHECK_ENDPOINT="http://${host_ip}:8888/v1/health_check" -export DATAPREP_SERVICE_ENDPOINT="http://${host_ip}:6007/v1/dataprep/ingest" -export DATAPREP_GET_FILE_ENDPOINT="http://${host_ip}:6007/v1/dataprep/get" -export DATAPREP_GET_VIDEO_LIST_ENDPOINT="http://${host_ip}:6007/v1/dataprep/get_videos" - -export VDMS_HOST=${host_ip} -export VDMS_PORT=8001 -export INDEX_NAME="mega-videoqna" -export USECLIP=1 -export LLM_DOWNLOAD="True" # Set to "False" before redeploy LVM server to avoid model download diff --git a/VideoQnA/docker_image_build/build.yaml b/VideoQnA/docker_image_build/build.yaml deleted file mode 100644 index 9ed0bee955..0000000000 --- 
a/VideoQnA/docker_image_build/build.yaml +++ /dev/null @@ -1,55 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -services: - videoqna: - build: - args: - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - no_proxy: ${no_proxy} - context: ../ - dockerfile: ./Dockerfile - image: ${REGISTRY:-opea}/videoqna:${TAG:-latest} - videoqna-ui: - build: - context: ../ui - dockerfile: ./docker/Dockerfile - extends: videoqna - image: ${REGISTRY:-opea}/videoqna-ui:${TAG:-latest} - dataprep: - build: - context: GenAIComps - dockerfile: comps/dataprep/src/Dockerfile - extends: videoqna - image: ${REGISTRY:-opea}/dataprep:${TAG:-latest} - embedding-multimodal-clip: - build: - context: GenAIComps - dockerfile: comps/third_parties/clip/src/Dockerfile - extends: videoqna - image: ${REGISTRY:-opea}/embedding-multimodal-clip:${TAG:-latest} - retriever: - build: - context: GenAIComps - dockerfile: comps/retrievers/src/Dockerfile - extends: videoqna - image: ${REGISTRY:-opea}/retriever:${TAG:-latest} - reranking: - build: - context: GenAIComps - dockerfile: comps/rerankings/src/Dockerfile - extends: videoqna - image: ${REGISTRY:-opea}/reranking:${TAG:-latest} - lvm-video-llama: - build: - context: GenAIComps - dockerfile: comps/lvms/src/integrations/dependency/video-llama/Dockerfile - extends: videoqna - image: ${REGISTRY:-opea}/lvm-video-llama:${TAG:-latest} - lvm: - build: - context: GenAIComps - dockerfile: comps/lvms/src/Dockerfile - extends: videoqna - image: ${REGISTRY:-opea}/lvm:${TAG:-latest} diff --git a/VideoQnA/tests/test_compose_on_xeon.sh b/VideoQnA/tests/test_compose_on_xeon.sh deleted file mode 100755 index 614c2efc47..0000000000 --- a/VideoQnA/tests/test_compose_on_xeon.sh +++ /dev/null @@ -1,263 +0,0 @@ -#!/bin/bash -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -set -x -IMAGE_REPO=${IMAGE_REPO:-"opea"} -IMAGE_TAG=${IMAGE_TAG:-"latest"} -echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" -echo "TAG=IMAGE_TAG=${IMAGE_TAG}" -export REGISTRY=${IMAGE_REPO} -export TAG=${IMAGE_TAG} - -WORKPATH=$(dirname "$PWD") -LOG_PATH="$WORKPATH/tests" -ip_address=$(hostname -I | awk '{print $1}') - -function build_docker_images() { - opea_branch=${opea_branch:-"main"} - # If the opea_branch isn't main, replace the git clone branch in Dockerfile. - if [[ "${opea_branch}" != "main" ]]; then - cd $WORKPATH - OLD_STRING="RUN git clone --depth 1 https://github.com/opea-project/GenAIComps.git" - NEW_STRING="RUN git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git" - find . -type f -name "Dockerfile*" | while read -r file; do - echo "Processing file: $file" - sed -i "s|$OLD_STRING|$NEW_STRING|g" "$file" - done - fi - - cd $WORKPATH/docker_image_build - git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git - - echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
- docker compose -f build.yaml build --no-cache > ${LOG_PATH}/docker_image_build.log - - docker pull intellabs/vdms:v2.8.0 - docker images && sleep 1s -} - - -function start_services() { - cd $WORKPATH/docker_compose/intel/cpu/xeon/ - - source set_env.sh - docker volume create video-llama-model - docker compose up vdms-vector-db dataprep -d - sleep 30s - - # Insert some sample data to the DB - HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" -X POST http://${ip_address}:6007/v1/dataprep/ingest \ - -H "Content-Type: multipart/form-data" \ - -F "files=@./data/op_1_0320241830.mp4") - - if [ "$HTTP_STATUS" -eq 200 ]; then - echo "Inserted some data at the beginning." - else - echo "Inserted failed at the beginning. Received status was $HTTP_STATUS" - docker logs dataprep-vdms-server >> ${LOG_PATH}/dataprep.log - exit 1 - fi - # Bring all the others - docker compose up -d > ${LOG_PATH}/start_services_with_compose.log - sleep 1m - - # List of containers running uvicorn - list=("dataprep-vdms-server" "embedding-multimodal-server" "retriever-vdms-server" "reranking-tei-server" "lvm-video-llama" "lvm-video-llama" "videoqna-xeon-backend-server") - - # Define the maximum time limit in seconds - TIME_LIMIT=5400 - start_time=$(date +%s) - - check_condition() { - local item=$1 - - if docker logs $item 2>&1 | grep -q "Uvicorn running on"; then - return 0 - else - return 1 - fi - } - - # Main loop - while [[ ${#list[@]} -gt 0 ]]; do - # Get the current time - current_time=$(date +%s) - elapsed_time=$((current_time - start_time)) - - # Exit if time exceeds the limit - if (( elapsed_time >= TIME_LIMIT )); then - echo "Time limit exceeded." - break - fi - - # Iterate through the list - for i in "${!list[@]}"; do - item=${list[i]} - if check_condition "$item"; then - echo "Condition met for $item, removing from list." - unset list[i] - else - echo "Condition not met for $item, keeping in list." - fi - done - - # Clean up the list to remove empty elements - list=("${list[@]}") - - # Check if the list is empty - if [[ ${#list[@]} -eq 0 ]]; then - echo "List is empty. Exiting." - break - fi - sleep 5m - done - - if docker logs videoqna-xeon-ui-server 2>&1 | grep -q "Streamlit app"; then - return 0 - else - return 1 - fi - -} - -function validate_services() { - local URL="$1" - local EXPECTED_RESULT="$2" - local SERVICE_NAME="$3" - local DOCKER_NAME="$4" - local INPUT_DATA="$5" - - local HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") - if [ "$HTTP_STATUS" -eq 200 ]; then - echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." - - local CONTENT=$(curl -s -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL" | tee ${LOG_PATH}/${SERVICE_NAME}.log) - - if echo "$CONTENT" | grep -q "$EXPECTED_RESULT"; then - echo "[ $SERVICE_NAME ] Content is as expected." - else - echo "[ $SERVICE_NAME ] Content does not match the expected result: $CONTENT" - docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log - exit 1 - fi - else - echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS" - docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log - exit 1 - fi - sleep 1s -} - -function validate_microservices() { - # Check if the microservices are running correctly. 
- cd $WORKPATH/docker_compose/intel/cpu/xeon//data - - # dataprep microservice - HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" -X POST http://${ip_address}:6007/v1/dataprep/ingest \ - -H "Content-Type: multipart/form-data" \ - -F "files=@./op_1_0320241830.mp4") - - if [ "$HTTP_STATUS" -eq 200 ]; then - echo "Dataprep microservice is running correctly." - else - echo "Dataprep microservice is not running correctly. Received status was $HTTP_STATUS" - docker logs dataprep-vdms-server >> ${LOG_PATH}/dataprep.log - exit 1 - fi - - # Embedding Microservice - validate_services \ - "${ip_address}:6000/v1/embeddings" \ - "Sample text" \ - "embedding" \ - "embedding-multimodal-server" \ - '{"text":"Sample text"}' - - # Retriever Microservice - export your_embedding=$(python -c "import random; embedding = [random.uniform(-1, 1) for _ in range(512)]; print(embedding)") - validate_services \ - "${ip_address}:7000/v1/retrieval" \ - "retrieved_docs" \ - "retriever" \ - "retriever-vdms-server" \ - "{\"text\":\"test\",\"embedding\":${your_embedding}}" - - # Reranking Microservice - validate_services \ - "${ip_address}:8000/v1/reranking" \ - "video_url" \ - "reranking" \ - "reranking-tei-server" \ - '{ - "retrieved_docs": [{"doc": [{"text": "retrieved text"}]}], - "initial_query": "query", - "top_n": 1, - "metadata": [ - {"other_key": "value", "video":"top_video_name", "timestamp":"20"} - ] - }' - - # LVM Microservice - validate_services \ - "${ip_address}:9000/v1/lvm" \ - "silence" \ - "lvm" \ - "lvm-video-llama" \ - '{"video_url":"https://github.com/DAMO-NLP-SG/Video-LLaMA/raw/main/examples/silence_girl.mp4","chunk_start": 0,"chunk_duration": 7,"prompt":"What is the person doing?","max_new_tokens": 50}' - - sleep 1s -} - -function validate_megaservice() { - validate_services \ - "${ip_address}:8888/v1/videoqna" \ - "man" \ - "videoqna-xeon-backend-server" \ - "videoqna-xeon-backend-server" \ - '{"messages":"What is the man doing?","stream":"True"}' -} - -function validate_frontend() { - HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" -X GET http://${ip_address}:5173/_stcore/health) - - if [ "$HTTP_STATUS" -eq 200 ]; then - echo "Frontend is running correctly." - local CONTENT=$(curl -s -X GET http://${ip_address}:5173/_stcore/health) - if echo "$CONTENT" | grep -q "ok"; then - echo "Frontend Content is as expected." - else - echo "Frontend Content does not match the expected result: $CONTENT" - docker logs videoqna-xeon-ui-server >> ${LOG_PATH}/ui.log - exit 1 - fi - else - echo "Frontend is not running correctly. 
Received status was $HTTP_STATUS" - docker logs videoqna-xeon-ui-server >> ${LOG_PATH}/ui.log - exit 1 - fi -} - -function stop_docker() { - cd $WORKPATH/docker_compose/intel/cpu/xeon/ - docker compose stop && docker compose rm -f - docker volume rm video-llama-model -} - -function main() { - - stop_docker - - if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi - start_services - - validate_microservices - validate_megaservice - validate_frontend - - stop_docker - echo y | docker system prune - -} - -# main diff --git a/VideoQnA/ui/docker/Dockerfile b/VideoQnA/ui/docker/Dockerfile deleted file mode 100644 index 019999de8a..0000000000 --- a/VideoQnA/ui/docker/Dockerfile +++ /dev/null @@ -1,21 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -FROM python:3.9-slim - -WORKDIR /app - -RUN apt-get update && apt-get install -y curl && \ - rm -rf /var/lib/apt/lists/* - - -RUN pip install --no-cache-dir --upgrade pip setuptools && \ - pip install --no-cache-dir streamlit - -COPY ui.py /app/ui.py - -EXPOSE 5173 - -HEALTHCHECK CMD curl --fail http://localhost:5173/_stcore/health - -ENTRYPOINT ["streamlit", "run", "ui.py", "--server.port=5173", "--server.address=0.0.0.0"] diff --git a/VideoQnA/ui/ui.py b/VideoQnA/ui/ui.py deleted file mode 100644 index cfcbaf0897..0000000000 --- a/VideoQnA/ui/ui.py +++ /dev/null @@ -1,207 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -import json -import os -import time -from io import BytesIO - -import requests -import streamlit as st - -BACKEND_SERVICE_ENDPOINT = os.getenv("BACKEND_SERVICE_ENDPOINT", "http://localhost:8888/v1/videoqna") -BACKEND_HEALTH_CHECK_ENDPOINT = os.getenv("BACKEND_HEALTH_CHECK_ENDPOINT", "http://localhost:8888/v1/health_check") - - -def perform_health_check(): - url = BACKEND_HEALTH_CHECK_ENDPOINT - response = requests.get(url, headers={"accept": "application/json"}) - return response - - -def download_video(url): - """Download video from URL and return as bytes.""" - response = requests.get(url) - if response.status_code == 200: - return BytesIO(response.content) - else: - st.error(f"Failed to download video. 
Status code: {response.status_code}") - return None - - -def play_video(url, offset): - """Play video from URL with specified offset.""" - with st.spinner("Loading Video ..."): - video_bytes = download_video(url) - if video_bytes: - st.video(video_bytes, start_time=int(offset)) - - -def clear_chat_history(): - st.session_state.example_video = "Enter Text" - st.session_state.messages = [{"role": "assistant", "content": "How may I assist you today?"}] - - -def handle_selectbox_change(): - prompt = st.session_state.example_video - - if prompt is not None: - st.session_state["prompt"] = prompt - st.session_state.messages.append({"role": "user", "content": prompt}) - - -def handle_chat_input(): - print("st.session_state.custom_prompt update", st.session_state.custom_prompt) - prompt = st.session_state.custom_prompt - - st.session_state["prompt"] = prompt - st.session_state.messages.append({"role": "user", "content": prompt}) - - -def handle_message(col): - params = None - full_response = "" - - # Generate a new response if last message is not from assistant - if st.session_state.messages[-1]["role"] != "assistant": - # Handle user messages here - with st.chat_message("assistant"): - placeholder = st.empty() - start = time.time() - prompt = st.session_state["prompt"] - request_data = {"messages": prompt, "stream": "True"} - try: - response = requests.post(BACKEND_SERVICE_ENDPOINT, data=json.dumps(request_data), stream=True) - response.raise_for_status() - for chunk in response.iter_content(chunk_size=8192): - if chunk: - if params is None: - try: - chunk_str = chunk.decode("utf-8").replace("'", '"') - params = json.loads(chunk_str) - - video_url = params["video_url"] - chunk_start = params["chunk_start"] - print("VIDEO NAME USED IN PLAYBACK: ", video_url) - - video_name = video_url.split("/")[-1] - full_response += f"Most relevant retrieved video is **{video_name}** \n\n" - placeholder.markdown(full_response) - - with col: - play_video(video_url, chunk_start) - - except json.JSONDecodeError: - print("In the param decode error branch") - print(chunk.decode("utf-8")) - else: - new_text = chunk.decode("utf-8") - # print(new_text, end=" ", flush=True) - full_response += new_text - placeholder.markdown(full_response) - # Fake response - # video_url = "https://github.com/DAMO-NLP-SG/Video-LLaMA/raw/main/examples/silence_girl.mp4" - # chunk_start=0 - # video_name = video_url.split('/')[-1] - # full_response += f"Most relevant retrieved video is **{video_name}** \n\n" - # placeholder.markdown(full_response) - # with col: - # play_video(video_url, chunk_start) - # for i in range(10): - # full_response += f"new_text {i} " - # time.sleep(1) - # placeholder.markdown(full_response) - - except requests.HTTPError as http_err: - st.error(f"HTTP error occurred: {http_err}") - except requests.RequestException as req_err: - st.error(f"Error occurred: {req_err}") - except Exception as err: - st.error(f"An unexpected error occurred: {err}") - - end = time.time() - full_response += f"\n\nπŸš€ Generated in {(end - start):.4f} seconds." 
- placeholder.markdown(full_response) - - message = {"role": "assistant", "content": full_response} - - st.session_state.messages.append(message) - - -def display_messages(): - # Display chat messages - for message in st.session_state.messages: - with st.chat_message(message["role"]): - st.write(message["content"]) - - -def main(): - st.set_page_config(initial_sidebar_state="collapsed", layout="wide") - st.title("VideoQnA") - title_alignment = """ - - """ - st.markdown(title_alignment, unsafe_allow_html=True) - st.sidebar.button("Clear Chat History", on_click=clear_chat_history) - - placeholder = st.empty() - - # check server health - if "health_check" not in st.session_state.keys(): - with st.spinner("Checking health of the server..."): - time.sleep(1) - response = perform_health_check() - if response.status_code == 200: - placeholder.success("Server is healthy!", icon="βœ…") - time.sleep(1) - placeholder.empty() # Remove the message - st.session_state["health_check"] = True - else: - st.error(f"Server health check failed with status code {response.status_code}") - st.stop() - - # Initialize conversation state - if "messages" not in st.session_state.keys(): - st.session_state.messages = [{"role": "assistant", "content": "How may I assist you today?"}] - if "prompt" not in st.session_state.keys(): - st.session_state["prompt"] = "" - - col1, col2 = st.columns([2, 1]) - - with col1: - st.selectbox( - "Example Prompts", - ( - "Man wearing glasses", - "People reading item description", - "Man holding red shopping basket", - "Was there any person wearing a blue shirt seen today?", - "Was there any person wearing a blue shirt seen in the last 6 hours?", - "Was there any person wearing a blue shirt seen last Sunday?", - "Was a person wearing glasses seen in the last 30 minutes?", - "Was a person wearing glasses seen in the last 72 hours?", - ), - key="example_video", - index=None, - placeholder="--- Options ---", - on_change=handle_selectbox_change, - ) - - st.chat_input(disabled=False, key="custom_prompt", on_submit=handle_chat_input) - - with col1: - display_messages() - handle_message(col2) - - -if __name__ == "__main__": - main() diff --git a/VideoQnA/videoqna.py b/VideoQnA/videoqna.py deleted file mode 100644 index c447dd2abf..0000000000 --- a/VideoQnA/videoqna.py +++ /dev/null @@ -1,131 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -import os - -from comps import MegaServiceEndpoint, MicroService, ServiceOrchestrator, ServiceRoleType, ServiceType -from comps.cores.mega.utils import handle_message -from comps.cores.proto.api_protocol import ( - ChatCompletionRequest, - ChatCompletionResponse, - ChatCompletionResponseChoice, - ChatMessage, - UsageInfo, -) -from comps.cores.proto.docarray import LLMParams -from fastapi import Request -from fastapi.responses import StreamingResponse - -MEGA_SERVICE_PORT = int(os.getenv("MEGA_SERVICE_PORT", 8888)) -EMBEDDING_SERVICE_HOST_IP = os.getenv("EMBEDDING_SERVICE_HOST_IP", "0.0.0.0") -EMBEDDING_SERVICE_PORT = int(os.getenv("EMBEDDING_SERVICE_PORT", 6000)) -RETRIEVER_SERVICE_HOST_IP = os.getenv("RETRIEVER_SERVICE_HOST_IP", "0.0.0.0") -RETRIEVER_SERVICE_PORT = int(os.getenv("RETRIEVER_SERVICE_PORT", 7000)) -RERANK_SERVICE_HOST_IP = os.getenv("RERANK_SERVICE_HOST_IP", "0.0.0.0") -RERANK_SERVICE_PORT = int(os.getenv("RERANK_SERVICE_PORT", 8000)) -LVM_SERVICE_HOST_IP = os.getenv("LVM_SERVICE_HOST_IP", "0.0.0.0") -LVM_SERVICE_PORT = int(os.getenv("LVM_SERVICE_PORT", 9000)) - - -class VideoQnAService: - def 
__init__(self, host="0.0.0.0", port=8888): - self.host = host - self.port = port - self.megaservice = ServiceOrchestrator() - self.endpoint = str(MegaServiceEndpoint.VIDEO_RAG_QNA) - - def add_remote_service(self): - embedding = MicroService( - name="embedding", - host=EMBEDDING_SERVICE_HOST_IP, - port=EMBEDDING_SERVICE_PORT, - endpoint="/v1/embeddings", - use_remote_service=True, - service_type=ServiceType.EMBEDDING, - ) - retriever = MicroService( - name="retriever", - host=RETRIEVER_SERVICE_HOST_IP, - port=RETRIEVER_SERVICE_PORT, - endpoint="/v1/retrieval", - use_remote_service=True, - service_type=ServiceType.RETRIEVER, - ) - rerank = MicroService( - name="rerank", - host=RERANK_SERVICE_HOST_IP, - port=RERANK_SERVICE_PORT, - endpoint="/v1/reranking", - use_remote_service=True, - service_type=ServiceType.RERANK, - ) - lvm = MicroService( - name="lvm", - host=LVM_SERVICE_HOST_IP, - port=LVM_SERVICE_PORT, - endpoint="/v1/lvm", - use_remote_service=True, - service_type=ServiceType.LVM, - ) - self.megaservice.add(embedding).add(retriever).add(rerank).add(lvm) - self.megaservice.flow_to(embedding, retriever) - self.megaservice.flow_to(retriever, rerank) - self.megaservice.flow_to(rerank, lvm) - - async def handle_request(self, request: Request): - data = await request.json() - stream_opt = data.get("stream", False) - chat_request = ChatCompletionRequest.parse_obj(data) - prompt = handle_message(chat_request.messages) - parameters = LLMParams( - max_new_tokens=chat_request.max_tokens if chat_request.max_tokens else 1024, - top_k=chat_request.top_k if chat_request.top_k else 10, - top_p=chat_request.top_p if chat_request.top_p else 0.95, - temperature=chat_request.temperature if chat_request.temperature else 0.01, - frequency_penalty=chat_request.frequency_penalty if chat_request.frequency_penalty else 0.0, - presence_penalty=chat_request.presence_penalty if chat_request.presence_penalty else 0.0, - repetition_penalty=chat_request.repetition_penalty if chat_request.repetition_penalty else 1.03, - stream=stream_opt, - ) - result_dict, runtime_graph = await self.megaservice.schedule( - initial_inputs={"text": prompt}, llm_parameters=parameters - ) - for node, response in result_dict.items(): - # Here it suppose the last microservice in the megaservice is LVM. 
- if ( - isinstance(response, StreamingResponse) - and node == list(self.megaservice.services.keys())[-1] - and self.megaservice.services[node].service_type == ServiceType.LVM - ): - return response - last_node = runtime_graph.all_leaves()[-1] - response = result_dict[last_node]["text"] - choices = [] - usage = UsageInfo() - choices.append( - ChatCompletionResponseChoice( - index=0, - message=ChatMessage(role="assistant", content=response), - finish_reason="stop", - ) - ) - return ChatCompletionResponse(model="videoqna", choices=choices, usage=usage) - - def start(self): - self.service = MicroService( - self.__class__.__name__, - service_role=ServiceRoleType.MEGASERVICE, - host=self.host, - port=self.port, - endpoint=self.endpoint, - input_datatype=ChatCompletionRequest, - output_datatype=ChatCompletionResponse, - ) - self.service.add_route(self.endpoint, self.handle_request, methods=["POST"]) - self.service.start() - - -if __name__ == "__main__": - videoqna = VideoQnAService(port=MEGA_SERVICE_PORT) - videoqna.add_remote_service() - videoqna.start() diff --git a/VisualQnA/Dockerfile b/VisualQnA/Dockerfile deleted file mode 100644 index 95936d9c03..0000000000 --- a/VisualQnA/Dockerfile +++ /dev/null @@ -1,9 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -ARG BASE_TAG=latest -FROM opea/comps-base:$BASE_TAG - -COPY ./visualqna.py $HOME/visualqna.py - -ENTRYPOINT ["python", "visualqna.py"] diff --git a/VisualQnA/README.md b/VisualQnA/README.md deleted file mode 100644 index 74ab54fdff..0000000000 --- a/VisualQnA/README.md +++ /dev/null @@ -1,146 +0,0 @@ -# Visual Question and Answering - -Visual Question Answering (VQA) is the task of answering open-ended questions based on an image. The input to models supporting this task is typically a combination of an image and a question, and the output is an answer expressed in natural language. - -Some noteworthy use case examples for VQA include: - -- Accessibility applications for visually impaired individuals. -- Education: posing questions about visual materials presented in lectures or textbooks. VQA can also be utilized in interactive museum exhibits or historical sites. -- Customer service and e-commerce: VQA can enhance user experience by letting users ask questions about products. -- Image retrieval: VQA models can be used to retrieve images with specific characteristics. For example, the user can ask β€œIs there a dog?” to find all images with dogs from a set of images. - -General architecture of VQA shows below: - -![VQA](./assets/img/vqa.png) - -The VisualQnA example is implemented using the component-level microservices defined in [GenAIComps](https://github.com/opea-project/GenAIComps). The flow chart below shows the information flow between different microservices for this example. 
- -```mermaid ---- -config: - flowchart: - nodeSpacing: 400 - rankSpacing: 100 - curve: linear - themeVariables: - fontSize: 50px ---- -flowchart LR - %% Colors %% - classDef blue fill:#ADD8E6,stroke:#ADD8E6,stroke-width:2px,fill-opacity:0.5 - classDef orange fill:#FBAA60,stroke:#ADD8E6,stroke-width:2px,fill-opacity:0.5 - classDef orchid fill:#C26DBC,stroke:#ADD8E6,stroke-width:2px,fill-opacity:0.5 - classDef invisible fill:transparent,stroke:transparent; - style VisualQnA-MegaService stroke:#000000 - - %% Subgraphs %% - subgraph VisualQnA-MegaService["VisualQnA MegaService "] - direction LR - LVM([LVM MicroService]):::blue - end - subgraph UserInterface[" User Interface "] - direction LR - a([User Input Query]):::orchid - Ingest([Ingest data]):::orchid - UI([UI server
]):::orchid - end - - - LVM_gen{{LVM Service
}} - GW([VisualQnA GateWay
]):::orange - NG([Nginx MicroService]):::blue - - - %% Questions interaction - direction LR - Ingest[Ingest data] --> UI - a[User Input Query] --> |Need Proxy Server|NG - a[User Input Query] --> UI - NG --> UI - UI --> GW - GW <==> VisualQnA-MegaService - - - %% Embedding service flow - direction LR - LVM <-.-> LVM_gen - -``` - -This example guides you through how to deploy a [LLaVA-NeXT](https://github.com/LLaVA-VL/LLaVA-NeXT) (Open Large Multimodal Models) model on [Intel Gaudi2](https://www.intel.com/content/www/us/en/products/details/processors/ai-accelerators/gaudi-overview.html) and [Intel Xeon Scalable Processors](https://www.intel.com/content/www/us/en/products/details/processors/xeon.html). We invite contributions from other hardware vendors to expand the OPEA ecosystem. - -![llava screenshot](./assets/img/llava_screenshot1.png) -![llava-screenshot](./assets/img/llava_screenshot2.png) - -## Required Models - -By default, the model is set to `llava-hf/llava-v1.6-mistral-7b-hf`. To use a different model, update the `LVM_MODEL_ID` variable in the [`set_env.sh`](./docker_compose/intel/hpu/gaudi/set_env.sh) file. - -``` -export LVM_MODEL_ID="llava-hf/llava-v1.6-mistral-7b-hf" -``` - -You can choose other llava-next models, such as `llava-hf/llava-v1.6-vicuna-13b-hf`, as needed. - -## Deploy VisualQnA Service - -The VisualQnA service can be effortlessly deployed on either Intel Gaudi2 or Intel Xeon Scalable Processors. - -Currently we support deploying VisualQnA services with docker compose. - -### Setup Environment Variable - -To set up environment variables for deploying VisualQnA services, follow these steps: - -1. Set the required environment variables: - - ```bash - # Example: host_ip="192.168.1.1" - export host_ip="External_Public_IP" - # Example: no_proxy="localhost, 127.0.0.1, 192.168.1.1" - export no_proxy="Your_No_Proxy" - ``` - -2. If you are in a proxy environment, also set the proxy-related environment variables: - - ```bash - export http_proxy="Your_HTTP_Proxy" - export https_proxy="Your_HTTPs_Proxy" - ``` - -3. Set up other environment variables: - - > Notice that you can only choose **one** command below to set up envs according to your hardware. Other that the port numbers may be set incorrectly. - - ```bash - # on Gaudi - source ./docker_compose/intel/hpu/gaudi/set_env.sh - # on Xeon - source ./docker_compose/intel/cpu/xeon/set_env.sh - ``` - -### Deploy VisualQnA on Gaudi - -Refer to the [Gaudi Guide](./docker_compose/intel/hpu/gaudi/README.md) to build docker images from source. - -Find the corresponding [compose.yaml](./docker_compose/intel/hpu/gaudi/compose.yaml). - -```bash -cd GenAIExamples/VisualQnA/docker_compose/intel/hpu/gaudi/ -docker compose up -d -``` - -### Deploy VisualQnA on Xeon - -Refer to the [Xeon Guide](./docker_compose/intel/cpu/xeon/README.md) for more instructions on building docker images from source. - -Find the corresponding [compose.yaml](./docker_compose/intel/cpu/xeon/compose.yaml). - -```bash -cd GenAIExamples/VisualQnA/docker_compose/intel/cpu/xeon/ -docker compose up -d -``` - -### Deploy VisualQnA on Kubernetes using Helm Chart - -Refer to the [VisualQnA helm chart](./kubernetes/helm/README.md) for instructions on deploying VisualQnA on Kubernetes. 
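Whichever deployment path you choose, a quick way to confirm the stack is serving requests is to query the MegaService endpoint directly. The sketch below mirrors the validation request shown in the hardware-specific guides; it assumes the default backend port `8888` and the `host_ip` variable exported earlier:

```bash
curl http://${host_ip}:8888/v1/visualqna \
  -H "Content-Type: application/json" \
  -d '{
    "messages": [
      {
        "role": "user",
        "content": [
          {"type": "text", "text": "What'\''s in this image?"},
          {"type": "image_url", "image_url": {"url": "https://www.ilankelman.org/stopsigns/australia.jpg"}}
        ]
      }
    ],
    "max_tokens": 300
  }'
```

A chat-completion style JSON response describing the image indicates that the gateway and the LVM service are wired together correctly.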
diff --git a/VisualQnA/assets/img/llava_screenshot1.png b/VisualQnA/assets/img/llava_screenshot1.png deleted file mode 100644 index b08c8b2459..0000000000 Binary files a/VisualQnA/assets/img/llava_screenshot1.png and /dev/null differ diff --git a/VisualQnA/assets/img/llava_screenshot2.png b/VisualQnA/assets/img/llava_screenshot2.png deleted file mode 100644 index ed6255e565..0000000000 Binary files a/VisualQnA/assets/img/llava_screenshot2.png and /dev/null differ diff --git a/VisualQnA/assets/img/vqa.png b/VisualQnA/assets/img/vqa.png deleted file mode 100644 index 7022a92568..0000000000 Binary files a/VisualQnA/assets/img/vqa.png and /dev/null differ diff --git a/VisualQnA/benchmark/performance/README.md b/VisualQnA/benchmark/performance/README.md deleted file mode 100644 index 45e76558ca..0000000000 --- a/VisualQnA/benchmark/performance/README.md +++ /dev/null @@ -1,77 +0,0 @@ -# VisualQnA Benchmarking - -This folder contains a collection of scripts to enable inference benchmarking by leveraging a comprehensive benchmarking tool, [GenAIEval](https://github.com/opea-project/GenAIEval/blob/main/evals/benchmark/README.md), that enables throughput analysis to assess inference performance. - -By following this guide, you can run benchmarks on your deployment and share the results with the OPEA community. - -## Purpose - -We aim to run these benchmarks and share them with the OPEA community for three primary reasons: - -- To offer insights on inference throughput in real-world scenarios, helping you choose the best service or deployment for your needs. -- To establish a baseline for validating optimization solutions across different implementations, providing clear guidance on which methods are most effective for your use case. -- To inspire the community to build upon our benchmarks, allowing us to better quantify new solutions in conjunction with current leading llms, serving frameworks etc. - -## Metrics - -The benchmark will report the below metrics, including: - -- Number of Concurrent Requests -- End-to-End Latency: P50, P90, P99 (in milliseconds) -- End-to-End First Token Latency: P50, P90, P99 (in milliseconds) -- Average Next Token Latency (in milliseconds) -- Average Token Latency (in milliseconds) -- Requests Per Second (RPS) -- Output Tokens Per Second -- Input Tokens Per Second - -Results will be displayed in the terminal and saved as CSV file named `1_testspec.yaml`. - -## Getting Started - -We recommend using Kubernetes to deploy the VisualQnA service, as it offers benefits such as load balancing and improved scalability. However, you can also deploy the service using Docker if that better suits your needs. - -### Prerequisites - -- Install Kubernetes by following [this guide](https://github.com/opea-project/docs/blob/main/guide/installation/k8s_install/k8s_install_kubespray.md). - -- Every node has direct internet access -- Set up kubectl on the master node with access to the Kubernetes cluster. -- Install Python 3.8+ on the master node for running GenAIEval. -- Ensure all nodes have a local /mnt/models folder, which will be mounted by the pods. -- Ensure that the container's ulimit can meet the the number of requests. - -```bash -# The way to modify the containered ulimit: -sudo systemctl edit containerd -# Add two lines: -[Service] -LimitNOFILE=65536:1048576 - -sudo systemctl daemon-reload; sudo systemctl restart containerd -``` - -### Test Steps - -Please deploy VisualQnA service before benchmarking. 
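For example, with the recommended Kubernetes deployment you can confirm the application is ready before starting a run. This is a minimal pre-flight check, assuming the backend service name used in `benchmark.yaml` and whatever namespace you deployed VisualQnA into:

```bash
# Replace "visualqna" with the namespace used for your deployment
kubectl get pods -n visualqna
# The backend service targeted by the e2e test should be present
kubectl get svc -n visualqna | grep visualqna-backend-server-svc
```

All pods should report `Running` before the benchmark is started.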
- -#### Run Benchmark Test - -Before the benchmark, we can configure the number of test queries and test output directory by: - -```bash -export USER_QUERIES="[1, 1, 1, 1]" -export TEST_OUTPUT_DIR="/tmp/benchmark_output" -``` - -And then run the benchmark by: - -```bash -bash benchmark.sh -n -``` - -The argument `-n` refers to the number of test nodes. - -#### Data collection - -All the test results will come to this folder `/tmp/benchmark_output` configured by the environment variable `TEST_OUTPUT_DIR` in previous steps. diff --git a/VisualQnA/benchmark/performance/benchmark.sh b/VisualQnA/benchmark/performance/benchmark.sh deleted file mode 100644 index 44abdecbb1..0000000000 --- a/VisualQnA/benchmark/performance/benchmark.sh +++ /dev/null @@ -1,99 +0,0 @@ -#!/bin/bash - -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -deployment_type="k8s" -node_number=1 -service_port=8888 -query_per_node=128 - -benchmark_tool_path="$(pwd)/GenAIEval" - -usage() { - echo "Usage: $0 [-d deployment_type] [-n node_number] [-i service_ip] [-p service_port]" - echo " -d deployment_type deployment type, select between k8s and docker (default: ${deployment_type})" - echo " -n node_number Test node number, required only for k8s deployment_type, (default: ${node_number})" - echo " -i service_ip service ip, required only for docker deployment_type" - echo " -p service_port service port, required only for docker deployment_type, (default: ${service_port})" - exit 1 -} - -while getopts ":d:n:i:p:" opt; do - case ${opt} in - d ) - deployment_type=$OPTARG - ;; - n ) - node_number=$OPTARG - ;; - i ) - service_ip=$OPTARG - ;; - p ) - service_port=$OPTARG - ;; - \? ) - echo "Invalid option: -$OPTARG" 1>&2 - usage - ;; - : ) - echo "Invalid option: -$OPTARG requires an argument" 1>&2 - usage - ;; - esac -done - -if [[ "$deployment_type" == "docker" && -z "$service_ip" ]]; then - echo "Error: service_ip is required for docker deployment_type" 1>&2 - usage -fi - -if [[ "$deployment_type" == "k8s" && ( -n "$service_ip" || -n "$service_port" ) ]]; then - echo "Warning: service_ip and service_port are ignored for k8s deployment_type" 1>&2 -fi - -function main() { - if [[ ! -d ${benchmark_tool_path} ]]; then - echo "Benchmark tool not found, setting up..." - setup_env - fi - run_benchmark -} - -function setup_env() { - git clone https://github.com/opea-project/GenAIEval.git - pushd ${benchmark_tool_path} - python3 -m venv stress_venv - source stress_venv/bin/activate - pip install -r requirements.txt - popd -} - -function run_benchmark() { - source ${benchmark_tool_path}/stress_venv/bin/activate - export DEPLOYMENT_TYPE=${deployment_type} - export SERVICE_IP=${service_ip:-"None"} - export SERVICE_PORT=${service_port:-"None"} - if [[ -z $USER_QUERIES ]]; then - user_query=$((query_per_node*node_number)) - export USER_QUERIES="[${user_query}, ${user_query}, ${user_query}, ${user_query}]" - echo "USER_QUERIES not configured, setting to: ${USER_QUERIES}." - fi - export WARMUP=$(echo $USER_QUERIES | sed -e 's/[][]//g' -e 's/,.*//') - if [[ -z $WARMUP ]]; then export WARMUP=0; fi - if [[ -z $TEST_OUTPUT_DIR ]]; then - if [[ $DEPLOYMENT_TYPE == "k8s" ]]; then - export TEST_OUTPUT_DIR="${benchmark_tool_path}/evals/benchmark/benchmark_output/node_${node_number}" - else - export TEST_OUTPUT_DIR="${benchmark_tool_path}/evals/benchmark/benchmark_output/docker" - fi - echo "TEST_OUTPUT_DIR not configured, setting to: ${TEST_OUTPUT_DIR}." 
- fi - - envsubst < ./benchmark.yaml > ${benchmark_tool_path}/evals/benchmark/benchmark.yaml - cd ${benchmark_tool_path}/evals/benchmark - python benchmark.py -} - -main diff --git a/VisualQnA/benchmark/performance/benchmark.yaml b/VisualQnA/benchmark/performance/benchmark.yaml deleted file mode 100644 index 179317bdba..0000000000 --- a/VisualQnA/benchmark/performance/benchmark.yaml +++ /dev/null @@ -1,47 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -test_suite_config: # Overall configuration settings for the test suite - examples: ["visualqna"] # The specific test cases being tested, e.g., chatqna, codegen, codetrans, faqgen, audioqna, visualqna - deployment_type: "k8s" # Default is "k8s", can also be "docker" - service_ip: None # Leave as None for k8s, specify for Docker - service_port: None # Leave as None for k8s, specify for Docker - warm_ups: 0 # Number of test requests for warm-up - run_time: 60m # The max total run time for the test suite - seed: # The seed for all RNGs - user_queries: [1, 2, 4, 8, 16, 32, 64, 128, 256, 512, 1024, 2048] # Number of test requests at each concurrency level - query_timeout: 120 # Number of seconds to wait for a simulated user to complete any executing task before exiting. 120 sec by defeult. - random_prompt: false # Use random prompts if true, fixed prompts if false - collect_service_metric: false # Collect service metrics if true, do not collect service metrics if false - data_visualization: false # Generate data visualization if true, do not generate data visualization if false - llm_model: "llava-hf/llava-v1.6-mistral-7b-hf" # The LLM model used for the test - test_output_dir: "/tmp/benchmark_output" # The directory to store the test output - load_shape: # Tenant concurrency pattern - name: constant # poisson or constant(locust default load shape) - params: # Loadshape-specific parameters - constant: # Constant load shape specific parameters, activate only if load_shape.name is constant - concurrent_level: 4 # If user_queries is specified, concurrent_level is target number of requests per user. If not, it is the number of simulated users - # arrival_rate: 1.0 # Request arrival rate. If set, concurrent_level will be overridden, constant load will be generated based on arrival-rate - poisson: # Poisson load shape specific parameters, activate only if load_shape.name is poisson - arrival_rate: 1.0 # Request arrival rate - namespace: "" # Fill the user-defined namespace. Otherwise, it will be default. - -test_cases: - visualqna: - lvm: - run_test: true - service_name: "llm-svc" # Replace with your service name - parameters: - model_name: "llava-hf/llava-v1.6-mistral-7b-hf" - max_new_tokens: 128 - temperature: 0.01 - top_k: 10 - top_p: 0.95 - repetition_penalty: 1.03 - stream: true - lvmserve: - run_test: true - service_name: "lvm-serving-svc" # Replace with your service name - e2e: - run_test: true - service_name: "visualqna-backend-server-svc" # Replace with your service name diff --git a/VisualQnA/docker_compose/amd/gpu/rocm/README.md b/VisualQnA/docker_compose/amd/gpu/rocm/README.md deleted file mode 100644 index 483e9b0da6..0000000000 --- a/VisualQnA/docker_compose/amd/gpu/rocm/README.md +++ /dev/null @@ -1,156 +0,0 @@ -# Build Mega Service of VisualQnA on AMD ROCm - -This document outlines the deployment process for a VisualQnA application utilizing the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservice pipeline on Intel Xeon server. 
The steps include Docker image creation, container deployment via Docker Compose, and service execution to integrate microservices such as `llm`. We will publish the Docker images to Docker Hub soon; this will simplify the deployment process for this service.
-
-## πŸš€ Build Docker Images
-
-First of all, you need to build the Docker images locally.
-
-### 1. Build LVM and NGINX Docker Images
-
-```bash
-git clone https://github.com/opea-project/GenAIComps.git
-cd GenAIComps
-docker build --no-cache -t opea/lvm:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/lvms/src/Dockerfile .
-docker build --no-cache -t opea/nginx:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/third_parties/nginx/src/Dockerfile .
-```
-
-### 2. Build MegaService Docker Image
-
-To construct the Mega Service, we utilize the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservice pipeline within the `visualqna.py` Python script. Build the MegaService Docker image with the command below:
-
-```bash
-git clone https://github.com/opea-project/GenAIExamples.git
-cd GenAIExamples/VisualQnA
-docker build --no-cache -t opea/visualqna:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile .
-```
-
-### 3. Build UI Docker Image
-
-Build the frontend Docker image with the command below:
-
-```bash
-cd GenAIExamples/VisualQnA/ui
-docker build --no-cache -t opea/visualqna-ui:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f docker/Dockerfile .
-```
-
-### 4. Pull TGI AMD ROCm Image
-
-```bash
-docker pull ghcr.io/huggingface/text-generation-inference:2.4.1-rocm
-```
-
-Then run the command `docker images`, and you will have the following 5 Docker images:
-
-1. `ghcr.io/huggingface/text-generation-inference:2.4.1-rocm`
-2. `opea/lvm:latest`
-3. `opea/visualqna:latest`
-4. `opea/visualqna-ui:latest`
-5. `opea/nginx`
-
-## πŸš€ Start Microservices
-
-### Setup Environment Variables
-
-Since the `compose.yaml` will consume some environment variables, you need to set them up in advance as shown below.
-
-**Export the value of the public IP address of your ROCm server to the `host_ip` environment variable**
-
-> Replace External_Public_IP below with the actual IPv4 value
-
-```
-export host_ip="External_Public_IP"
-```
-
-**Append the value of the public IP address to the no_proxy list**
-
-```
-export your_no_proxy="${your_no_proxy},${host_ip}"
-```
-
-```bash
-export HOST_IP=${your_host_ip}
-export VISUALQNA_TGI_SERVICE_PORT="8399"
-export VISUALQNA_HUGGINGFACEHUB_API_TOKEN={your_huggingface_api_token}
-export VISUALQNA_CARD_ID="card1"
-export VISUALQNA_RENDER_ID="renderD136"
-export LVM_MODEL_ID="Xkev/Llama-3.2V-11B-cot"
-export MODEL="llava-hf/llava-v1.6-mistral-7b-hf"
-export LVM_ENDPOINT="http://${HOST_IP}:8399"
-export LVM_SERVICE_PORT=9399
-export MEGA_SERVICE_HOST_IP=${HOST_IP}
-export LVM_SERVICE_HOST_IP=${HOST_IP}
-export BACKEND_SERVICE_ENDPOINT="http://${HOST_IP}:18003/v1/visualqna"
-export FRONTEND_SERVICE_IP=${HOST_IP}
-export FRONTEND_SERVICE_PORT=18001
-export BACKEND_SERVICE_NAME=visualqna
-export BACKEND_SERVICE_IP=${HOST_IP}
-export BACKEND_SERVICE_PORT=18002
-export NGINX_PORT=18003
-
-```
-
-Note: Please replace `host_ip` with your external IP address; do not use localhost.
-
-Note: You can also source the `set_env.sh` file (`. set_env.sh`) to set the needed variables.
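Before bringing up the containers, it can help to confirm that the key variables resolved to non-empty values; an empty `HOST_IP` usually means a placeholder above was not replaced. This is an optional check, not part of the original setup:

```bash
# Each line should print a real IP address or URL, not an empty value
echo "HOST_IP=${HOST_IP}"
echo "LVM_ENDPOINT=${LVM_ENDPOINT}"
echo "BACKEND_SERVICE_ENDPOINT=${BACKEND_SERVICE_ENDPOINT}"
```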
-
-### Start all the services Docker Containers
-
-> Before running the docker compose command, you need to be in the folder that contains the docker compose yaml file.
-
-```bash
-cd GenAIExamples/VisualQnA/docker_compose/amd/gpu/rocm
-```
-
-```bash
-docker compose -f compose.yaml up -d
-```
-
-### Validate Microservices
-
-Follow the instructions below to validate the microservices.
-
-> Note: If you see an "Internal Server Error" from the `curl` command, wait a few minutes for the microservice to be ready and then try again.
-
-1. LVM Microservice
-
-   ```bash
-   http_proxy="" curl http://${host_ip}:9399/v1/lvm -XPOST -d '{"image": "iVBORw0KGgoAAAANSUhEUgAAAAoAAAAKCAYAAACNMs+9AAAAFUlEQVR42mP8/5+hnoEIwDiqkL4KAcT9GO0U4BxoAAAAAElFTkSuQmCC", "prompt":"What is this?"}' -H 'Content-Type: application/json'
-   ```
-
-2. MegaService
-
-```bash
-curl http://${host_ip}:8888/v1/visualqna -H "Content-Type: application/json" -d '{
-     "messages": [
-      {
-        "role": "user",
-        "content": [
-          {
-            "type": "text",
-            "text": "What'\''s in this image?"
-          },
-          {
-            "type": "image_url",
-            "image_url": {
-              "url": "https://www.ilankelman.org/stopsigns/australia.jpg"
-            }
-          }
-        ]
-      }
-    ],
-    "max_tokens": 300
-  }'
-```
-
-## πŸš€ Launch the UI
-
-To access the frontend, open the following URL in your browser: http://{host_ip}:5173. By default, the UI runs on port 5173 internally. If you prefer to use a different host port to access the frontend, you can modify the port mapping in the `compose.yaml` file as shown below:
-
-```yaml
-  visualqna-rocm-ui-server:
-    image: opea/visualqna-ui:latest
-    ...
-    ports:
-      - "80:5173"
-```
diff --git a/VisualQnA/docker_compose/amd/gpu/rocm/compose.yaml b/VisualQnA/docker_compose/amd/gpu/rocm/compose.yaml
deleted file mode 100644
index 72f667ab2f..0000000000
--- a/VisualQnA/docker_compose/amd/gpu/rocm/compose.yaml
+++ /dev/null
@@ -1,100 +0,0 @@
-# Copyright (C) 2024 Advanced Micro Devices, Inc.
-# SPDX-License-Identifier: Apache-2.0 - -services: - visualqna-llava-tgi-service: - image: ghcr.io/huggingface/text-generation-inference:2.4.1-rocm - container_name: visualqna-tgi-service - ports: - - "${VISUALQNA_TGI_SERVICE_PORT:-8399}:80" - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - TGI_LLM_ENDPOINT: "http://${HOST_IP}:${VISUALQNA_TGI_SERVICE_PORT}" - HUGGINGFACEHUB_API_TOKEN: ${VISUALQNA_HUGGINGFACEHUB_API_TOKEN} - HUGGING_FACE_HUB_TOKEN: ${VISUALQNA_HUGGINGFACEHUB_API_TOKEN} - volumes: - - "/var/opea/visualqna-service/data:/data" - shm_size: 64g - devices: - - /dev/kfd:/dev/kfd - - /dev/dri/:/dev/dri/ - cap_add: - - SYS_PTRACE - group_add: - - video - security_opt: - - seccomp:unconfined - ipc: host - command: --model-id ${LVM_MODEL_ID} --max-input-length 4096 --max-total-tokens 8192 - lvm: - image: ${REGISTRY:-opea}/lvm:${TAG:-latest} - container_name: lvm-server - depends_on: - - visualqna-llava-tgi-service - ports: - - "9399:9399" - ipc: host - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - LVM_ENDPOINT: ${LVM_ENDPOINT} - LVM_COMPONENT_NAME: "OPEA_TGI_LLAVA_LVM" - HF_HUB_DISABLE_PROGRESS_BARS: 1 - HF_HUB_ENABLE_HF_TRANSFER: 0 - restart: unless-stopped - visualqna-rocm-backend-server: - image: ${REGISTRY:-opea}/visualqna:${TAG:-latest} - container_name: visualqna-rocm-backend-server - depends_on: - - visualqna-llava-tgi-service - - lvm - ports: - - "${BACKEND_SERVICE_PORT:-8888}:8888" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} - - LVM_SERVICE_HOST_IP=${LVM_SERVICE_HOST_IP} - ipc: host - restart: always - visualqna-rocm-ui-server: - image: ${REGISTRY:-opea}/visualqna-ui:${TAG:-latest} - container_name: visualqna-rocm-ui-server - depends_on: - - visualqna-rocm-backend-server - ports: - - "${FRONTEND_SERVICE_PORT:-5173}:5173" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - BACKEND_BASE_URL=${BACKEND_SERVICE_ENDPOINT} - ipc: host - restart: always - visualqna-nginx-server: - image: ${REGISTRY:-opea}/nginx:${TAG:-latest} - container_name: visualqna-rocm-nginx-server - depends_on: - - visualqna-rocm-backend-server - - visualqna-rocm-ui-server - ports: - - "${NGINX_PORT:-80}:80" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - FRONTEND_SERVICE_IP=${HOST_IP} - - FRONTEND_SERVICE_PORT=${FRONTEND_SERVICE_PORT} - - BACKEND_SERVICE_NAME=${BACKEND_SERVICE_NAME} - - BACKEND_SERVICE_IP=${HOST_IP} - - BACKEND_SERVICE_PORT=${BACKEND_SERVICE_PORT} - ipc: host - restart: always - -networks: - default: - driver: bridge diff --git a/VisualQnA/docker_compose/amd/gpu/rocm/set_env.sh b/VisualQnA/docker_compose/amd/gpu/rocm/set_env.sh deleted file mode 100644 index bf73465cef..0000000000 --- a/VisualQnA/docker_compose/amd/gpu/rocm/set_env.sh +++ /dev/null @@ -1,22 +0,0 @@ -#!/usr/bin/env bash - -# Copyright (C) 2024 Advanced Micro Devices, Inc -# SPDX-License-Identifier: Apache-2.0 - -export HOST_IP=${Your_host_ip_address} -export VISUALQNA_TGI_SERVICE_PORT="8399" -export VISUALQNA_HUGGINGFACEHUB_API_TOKEN=${Your_HUGGINGFACEHUB_API_TOKEN} -export VISUALQNA_CARD_ID="card1" -export VISUALQNA_RENDER_ID="renderD136" -export LVM_MODEL_ID="Xkev/Llama-3.2V-11B-cot" -export LVM_ENDPOINT="http://${HOST_IP}:8399" -export LVM_SERVICE_PORT=9399 -export MEGA_SERVICE_HOST_IP=${HOST_IP} -export 
LVM_SERVICE_HOST_IP=${HOST_IP} -export BACKEND_SERVICE_ENDPOINT="http://${host_ip}:${BACKEND_SERVICE_PORT}/v1/visualqna" -export FRONTEND_SERVICE_IP=${HOST_IP} -export FRONTEND_SERVICE_PORT=18001 -export BACKEND_SERVICE_NAME=visualqna -export BACKEND_SERVICE_IP=${HOST_IP} -export BACKEND_SERVICE_PORT=18002 -export NGINX_PORT=18003 diff --git a/VisualQnA/docker_compose/intel/cpu/xeon/README.md b/VisualQnA/docker_compose/intel/cpu/xeon/README.md deleted file mode 100644 index cfbc3ab1c1..0000000000 --- a/VisualQnA/docker_compose/intel/cpu/xeon/README.md +++ /dev/null @@ -1,136 +0,0 @@ -# Build Mega Service of VisualQnA on Xeon - -This document outlines the deployment process for a VisualQnA application utilizing the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservice pipeline on Intel Xeon server. The steps include Docker image creation, container deployment via Docker Compose, and service execution to integrate microservices such as `llm`. We will publish the Docker images to Docker Hub soon, it will simplify the deployment process for this service. - -## πŸš€ Apply Xeon Server on AWS - -To apply a Xeon server on AWS, start by creating an AWS account if you don't have one already. Then, head to the [EC2 Console](https://console.aws.amazon.com/ec2/v2/home) to begin the process. Within the EC2 service, select the Amazon EC2 M7i or M7i-flex instance type to leverage 4th Generation Intel Xeon Scalable processors. These instances are optimized for high-performance computing and demanding workloads. - -For detailed information about these instance types, you can refer to this [link](https://aws.amazon.com/ec2/instance-types/m7i/). Once you've chosen the appropriate instance type, proceed with configuring your instance settings, including network configurations, security groups, and storage options. - -After launching your instance, you can connect to it using SSH (for Linux instances) or Remote Desktop Protocol (RDP) (for Windows instances). From there, you'll have full access to your Xeon server, allowing you to install, configure, and manage your applications as needed. - -## πŸš€ Build Docker Images - -First of all, you need to build Docker Images locally and install the python package of it. - -### 1. Build LVM and NGINX Docker Images - -```bash -git clone https://github.com/opea-project/GenAIComps.git -cd GenAIComps -docker build --no-cache -t opea/lvm:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/lvms/src/Dockerfile . -docker build --no-cache -t opea/nginx:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/third_parties/nginx/src/Dockerfile . -``` - -### 2. Build MegaService Docker Image - -To construct the Mega Service, we utilize the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservice pipeline within the `visualqna.py` Python script. Build MegaService Docker image via below command: - -```bash -git clone https://github.com/opea-project/GenAIExamples.git -cd GenAIExamples/VisualQnA -docker build --no-cache -t opea/visualqna:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile . -``` - -### 3. Build UI Docker Image - -Build frontend Docker image via below command: - -```bash -cd GenAIExamples/VisualQnA/ui -docker build --no-cache -t opea/visualqna-ui:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f docker/Dockerfile . -``` - -### 4. 
Pull vLLM/TGI Xeon Image - -```bash -# vLLM -docker pull opea/vllm:latest -# TGI (Optional) -docker pull ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu -``` - -Then run the command `docker images`, you will have the following Docker Images: - -1. `opea/vllm:latest` -2. `ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu` (Optional) -3. `opea/lvm:latest` -4. `opea/visualqna:latest` -5. `opea/visualqna-ui:latest` -6. `opea/nginx` - -## πŸš€ Start Microservices - -### Setup Environment Variables - -Since the `compose.yaml` will consume some environment variables, you need to setup them in advance as below. - -```bash -source set_env.sh -``` - -Note: Please replace with `host_ip` with you external IP address, do not use localhost. - -### Start all the services Docker Containers - -> Before running the docker compose command, you need to be in the folder that has the docker compose yaml file - -```bash -cd GenAIExamples/VisualQnA/docker_compose/intel/cpu/xeon -``` - -```bash -docker compose -f compose.yaml up -d -# if use TGI as the LLM serving backend -docker compose -f compose_tgi.yaml up -d -``` - -### Validate Microservices - -Follow the instructions to validate MicroServices. - -> Note: If you see an "Internal Server Error" from the `curl` command, wait a few minutes for the microserver to be ready and then try again. - -1. LLM Microservice - - ```bash - http_proxy="" curl http://${host_ip}:9399/v1/lvm -XPOST -d '{"image": "iVBORw0KGgoAAAANSUhEUgAAAAoAAAAKCAYAAACNMs+9AAAAFUlEQVR42mP8/5+hnoEIwDiqkL4KAcT9GO0U4BxoAAAAAElFTkSuQmCC", "prompt":"What is this?"}' -H 'Content-Type: application/json' - ``` - -2. MegaService - -```bash -curl http://${host_ip}:8888/v1/visualqna -H "Content-Type: application/json" -d '{ - "messages": [ - { - "role": "user", - "content": [ - { - "type": "text", - "text": "What'\''s in this image?" - }, - { - "type": "image_url", - "image_url": { - "url": "https://www.ilankelman.org/stopsigns/australia.jpg" - } - } - ] - } - ], - "max_tokens": 300 - }' -``` - -## πŸš€ Launch the UI - -To access the frontend, open the following URL in your browser: http://{host_ip}:5173. By default, the UI runs on port 5173 internally. If you prefer to use a different host port to access the frontend, you can modify the port mapping in the `compose.yaml` file as shown below: - -```yaml - visualqna-gaudi-ui-server: - image: opea/visualqna-ui:latest - ... 
- ports: - - "80:5173" -``` diff --git a/VisualQnA/docker_compose/intel/cpu/xeon/compose.yaml b/VisualQnA/docker_compose/intel/cpu/xeon/compose.yaml deleted file mode 100644 index 9c19695493..0000000000 --- a/VisualQnA/docker_compose/intel/cpu/xeon/compose.yaml +++ /dev/null @@ -1,96 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -services: - vllm-service: - image: ${REGISTRY:-opea}/vllm:${TAG:-latest} - container_name: vllm-service - ports: - - ${VLLM_PORT:-8399}:80 - volumes: - - "${MODEL_CACHE:-./data}:/root/.cache/huggingface/hub" - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - HF_TOKEN: ${HUGGINGFACEHUB_API_TOKEN} - VLLM_TORCH_PROFILER_DIR: "/mnt" - healthcheck: - test: ["CMD-SHELL", "curl -f http://localhost:80/health || exit 1"] - interval: 10s - timeout: 10s - retries: 100 - command: --model $LVM_MODEL_ID --host 0.0.0.0 --port 80 --chat-template examples/template_llava.jinja # https://docs.vllm.ai/en/v0.5.0/models/vlm.html - - lvm: - image: ${REGISTRY:-opea}/lvm:${TAG:-latest} - container_name: lvm-xeon-server - depends_on: - vllm-service: - condition: service_healthy - ports: - - "9399:9399" - ipc: host - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - LVM_ENDPOINT: ${LVM_ENDPOINT} - LVM_COMPONENT_NAME: "OPEA_VLLM_LVM" - LLM_MODEL_ID: ${LVM_MODEL_ID} - HF_HUB_DISABLE_PROGRESS_BARS: 1 - HF_HUB_ENABLE_HF_TRANSFER: 0 - restart: unless-stopped - visualqna-xeon-backend-server: - image: ${REGISTRY:-opea}/visualqna:${TAG:-latest} - container_name: visualqna-xeon-backend-server - depends_on: - - vllm-service - - lvm - ports: - - "8888:8888" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} - - LVM_SERVICE_HOST_IP=${LVM_SERVICE_HOST_IP} - ipc: host - restart: always - visualqna-xeon-ui-server: - image: ${REGISTRY:-opea}/visualqna-ui:${TAG:-latest} - container_name: visualqna-xeon-ui-server - depends_on: - - visualqna-xeon-backend-server - ports: - - "5173:5173" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - BACKEND_BASE_URL=${BACKEND_SERVICE_ENDPOINT} - ipc: host - restart: always - visualqna-xeon-nginx-server: - image: ${REGISTRY:-opea}/nginx:${TAG:-latest} - container_name: visualqna-xeon-nginx-server - depends_on: - - visualqna-xeon-backend-server - - visualqna-xeon-ui-server - ports: - - "${NGINX_PORT:-80}:80" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - FRONTEND_SERVICE_IP=${FRONTEND_SERVICE_IP} - - FRONTEND_SERVICE_PORT=${FRONTEND_SERVICE_PORT} - - BACKEND_SERVICE_NAME=${BACKEND_SERVICE_NAME} - - BACKEND_SERVICE_IP=${BACKEND_SERVICE_IP} - - BACKEND_SERVICE_PORT=${BACKEND_SERVICE_PORT} - ipc: host - restart: always - -networks: - default: - driver: bridge diff --git a/VisualQnA/docker_compose/intel/cpu/xeon/compose_tgi.yaml b/VisualQnA/docker_compose/intel/cpu/xeon/compose_tgi.yaml deleted file mode 100644 index b595bdcba7..0000000000 --- a/VisualQnA/docker_compose/intel/cpu/xeon/compose_tgi.yaml +++ /dev/null @@ -1,96 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -services: - llava-tgi-service: - image: ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu - container_name: tgi-llava-xeon-server - ports: - - "8399:80" - volumes: - - "${MODEL_CACHE:-./data}:/data" - shm_size: 1g - 
environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - HF_HUB_DISABLE_PROGRESS_BARS: 1 - HF_HUB_ENABLE_HF_TRANSFER: 0 - host_ip: ${host_ip} - healthcheck: - test: ["CMD-SHELL", "curl -f http://$host_ip:8399/health || exit 1"] - interval: 10s - timeout: 10s - retries: 60 - command: --model-id ${LVM_MODEL_ID} --max-input-length 4096 --max-total-tokens 8192 --cuda-graphs 0 - lvm: - image: ${REGISTRY:-opea}/lvm:${TAG:-latest} - container_name: lvm-xeon-server - depends_on: - llava-tgi-service: - condition: service_healthy - ports: - - "9399:9399" - ipc: host - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - LVM_ENDPOINT: ${LVM_ENDPOINT} - LVM_COMPONENT_NAME: "OPEA_TGI_LLAVA_LVM" - HF_HUB_DISABLE_PROGRESS_BARS: 1 - HF_HUB_ENABLE_HF_TRANSFER: 0 - restart: unless-stopped - visualqna-xeon-backend-server: - image: ${REGISTRY:-opea}/visualqna:${TAG:-latest} - container_name: visualqna-xeon-backend-server - depends_on: - - llava-tgi-service - - lvm - ports: - - "8888:8888" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} - - LVM_SERVICE_HOST_IP=${LVM_SERVICE_HOST_IP} - ipc: host - restart: always - visualqna-xeon-ui-server: - image: ${REGISTRY:-opea}/visualqna-ui:${TAG:-latest} - container_name: visualqna-xeon-ui-server - depends_on: - - visualqna-xeon-backend-server - ports: - - "5173:5173" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - BACKEND_BASE_URL=${BACKEND_SERVICE_ENDPOINT} - ipc: host - restart: always - visualqna-xeon-nginx-server: - image: ${REGISTRY:-opea}/nginx:${TAG:-latest} - container_name: visualqna-xeon-nginx-server - depends_on: - - visualqna-xeon-backend-server - - visualqna-xeon-ui-server - ports: - - "${NGINX_PORT:-80}:80" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - FRONTEND_SERVICE_IP=${FRONTEND_SERVICE_IP} - - FRONTEND_SERVICE_PORT=${FRONTEND_SERVICE_PORT} - - BACKEND_SERVICE_NAME=${BACKEND_SERVICE_NAME} - - BACKEND_SERVICE_IP=${BACKEND_SERVICE_IP} - - BACKEND_SERVICE_PORT=${BACKEND_SERVICE_PORT} - ipc: host - restart: always - -networks: - default: - driver: bridge diff --git a/VisualQnA/docker_compose/intel/cpu/xeon/set_env.sh b/VisualQnA/docker_compose/intel/cpu/xeon/set_env.sh deleted file mode 100644 index b47f12fe31..0000000000 --- a/VisualQnA/docker_compose/intel/cpu/xeon/set_env.sh +++ /dev/null @@ -1,21 +0,0 @@ -#!/usr/bin/env bash - -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 -pushd "../../../../../" > /dev/null -source .set_env.sh -popd > /dev/null - -export host_ip=$(hostname -I | awk '{print $1}') -export no_proxy=$host_ip,$no_proxy -export LVM_MODEL_ID="llava-hf/llava-v1.6-mistral-7b-hf" -export LVM_ENDPOINT="http://${host_ip}:8399" -export LVM_SERVICE_PORT=9399 -export MEGA_SERVICE_HOST_IP=${host_ip} -export LVM_SERVICE_HOST_IP=${host_ip} -export BACKEND_SERVICE_ENDPOINT="http://${host_ip}:8888/v1/visualqna" -export FRONTEND_SERVICE_IP=${host_ip} -export FRONTEND_SERVICE_PORT=5173 -export BACKEND_SERVICE_NAME=visualqna -export BACKEND_SERVICE_IP=${host_ip} -export BACKEND_SERVICE_PORT=8888 diff --git a/VisualQnA/docker_compose/intel/hpu/gaudi/README.md b/VisualQnA/docker_compose/intel/hpu/gaudi/README.md deleted file mode 100644 index 9c3b0cd4e0..0000000000 --- a/VisualQnA/docker_compose/intel/hpu/gaudi/README.md +++ 
/dev/null @@ -1,140 +0,0 @@
-# Build MegaService of VisualQnA on Gaudi
-
-This document outlines the deployment process for a VisualQnA application utilizing the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservice pipeline on an Intel Gaudi server. The steps include Docker image creation, container deployment via Docker Compose, and service execution to integrate microservices such as `llm`. We will publish the Docker images to Docker Hub; this will simplify the deployment process for this service.
-
-## πŸš€ Build Docker Images
-
-First of all, you need to build the Docker images locally. This step can be skipped once the Docker images are published to Docker Hub.
-
-### 1. Build LVM and NGINX Docker Images
-
-```bash
-git clone https://github.com/opea-project/GenAIComps.git
-cd GenAIComps
-docker build --no-cache -t opea/lvm:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/lvms/src/Dockerfile .
-docker build --no-cache -t opea/nginx:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f comps/third_parties/nginx/src/Dockerfile .
-```
-
-### 2. Build vLLM/Pull TGI Gaudi Image
-
-```bash
-# vLLM
-
-# Currently you have to build opea/vllm-gaudi locally from the habana_main branch and the specific commit;
-# we will update this to a stable release tag in the future.
-git clone https://github.com/HabanaAI/vllm-fork.git
-cd ./vllm-fork/
-docker build -f Dockerfile.hpu -t opea/vllm-gaudi:latest --shm-size=128g . --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy
-cd ..
-rm -rf vllm-fork
-```
-
-```bash
-# TGI (Optional)
-
-docker pull ghcr.io/huggingface/tgi-gaudi:2.0.6
-```
-
-### 3. Build MegaService Docker Image
-
-To construct the Mega Service, we utilize the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservice pipeline within the `visualqna.py` Python script. Build the MegaService Docker image using the command below:
-
-```bash
-git clone https://github.com/opea-project/GenAIExamples.git
-cd GenAIExamples/VisualQnA
-docker build --no-cache -t opea/visualqna:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile .
-cd ../..
-```
-
-### 4. Build UI Docker Image
-
-Build the frontend Docker image with the command below:
-
-```bash
-cd GenAIExamples/VisualQnA/ui
-docker build --no-cache -t opea/visualqna-ui:latest --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f ./docker/Dockerfile .
-```
-
-Then run the command `docker images`, and you will have the following 6 Docker images:
-
-1. `opea/vllm-gaudi:latest`
-2. `ghcr.io/huggingface/tgi-gaudi:2.0.6` (Optional)
-3. `opea/lvm:latest`
-4. `opea/visualqna:latest`
-5. `opea/visualqna-ui:latest`
-6. `opea/nginx`
-
-## πŸš€ Start MicroServices and MegaService
-
-### Setup Environment Variables
-
-Since the `compose.yaml` will consume some environment variables, you need to set them up in advance as shown below.
-
-```bash
-source set_env.sh
-```
-
-Note: Please replace `host_ip` with your external IP address; do not use localhost.
-
-### Start all the services Docker Containers
-
-```bash
-cd GenAIExamples/VisualQnA/docker_compose/intel/hpu/gaudi/
-```
-
-```bash
-docker compose -f compose.yaml up -d
-# if using TGI as the LLM serving backend
-docker compose -f compose_tgi.yaml up -d
-```
-
-> **_NOTE:_** Users need at least one Gaudi card to run VisualQnA successfully.
-
-### Validate MicroServices and MegaService
-
-Follow the instructions below to validate the microservices.
- -> Note: If you see an "Internal Server Error" from the `curl` command, wait a few minutes for the microserver to be ready and then try again. - -1. LLM Microservice - - ```bash - http_proxy="" curl http://${host_ip}:9399/v1/lvm -XPOST -d '{"image": "iVBORw0KGgoAAAANSUhEUgAAAAoAAAAKCAYAAACNMs+9AAAAFUlEQVR42mP8/5+hnoEIwDiqkL4KAcT9GO0U4BxoAAAAAElFTkSuQmCC", "prompt":"What is this?"}' -H 'Content-Type: application/json' - ``` - -2. MegaService - -```bash -curl http://${host_ip}:8888/v1/visualqna -H "Content-Type: application/json" -d '{ - "messages": [ - { - "role": "user", - "content": [ - { - "type": "text", - "text": "What'\''s in this image?" - }, - { - "type": "image_url", - "image_url": { - "url": "https://www.ilankelman.org/stopsigns/australia.jpg" - } - } - ] - } - ], - "max_tokens": 300 - }' -``` - -## πŸš€ Launch the UI - -To access the frontend, open the following URL in your browser: http://{host_ip}:5173. By default, the UI runs on port 5173 internally. If you prefer to use a different host port to access the frontend, you can modify the port mapping in the `compose.yaml` file as shown below: - -```yaml - visualqna-gaudi-ui-server: - image: opea/visualqna-ui:latest - ... - ports: - - "80:5173" -``` diff --git a/VisualQnA/docker_compose/intel/hpu/gaudi/compose.yaml b/VisualQnA/docker_compose/intel/hpu/gaudi/compose.yaml deleted file mode 100644 index c1950a14d4..0000000000 --- a/VisualQnA/docker_compose/intel/hpu/gaudi/compose.yaml +++ /dev/null @@ -1,106 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -services: - vllm-gaudi-service: - image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest} - container_name: vllm-gaudi-service - ports: - - ${VLLM_PORT:-8399}:80 - volumes: - - "./data:/root/.cache/huggingface/hub" - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - HF_TOKEN: ${HUGGINGFACEHUB_API_TOKEN} - HABANA_VISIBLE_DEVICES: all - OMPI_MCA_btl_vader_single_copy_mechanism: none - LLM_MODEL_ID: ${LVM_MODEL_ID} - VLLM_TORCH_PROFILER_DIR: "/mnt" - VLLM_SKIP_WARMUP: ${VLLM_SKIP_WARMUP:-false} - MAX_MODEL_LEN: ${MAX_TOTAL_TOKENS:-4096} - MAX_SEQ_LEN_TO_CAPTURE: ${MAX_TOTAL_TOKENS:-4096} - PT_HPUGRAPH_DISABLE_TENSOR_CACHE: false # https://github.com/HabanaAI/vllm-fork/issues/841#issuecomment-2700421704 - runtime: habana - cap_add: - - SYS_NICE - ipc: host - healthcheck: - test: ["CMD-SHELL", "curl -f http://localhost:80/health || exit 1"] - interval: 10s - timeout: 10s - retries: 150 - command: --model $LVM_MODEL_ID --tensor-parallel-size 1 --host 0.0.0.0 --port 80 --chat-template examples/template_llava.jinja # https://docs.vllm.ai/en/v0.5.0/models/vlm.html - lvm: - image: ${REGISTRY:-opea}/lvm:${TAG:-latest} - container_name: lvm-vllm-gaudi-service - depends_on: - vllm-gaudi-service: - condition: service_healthy - ports: - - "9399:9399" - ipc: host - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - LVM_ENDPOINT: ${LVM_ENDPOINT} - LVM_COMPONENT_NAME: "OPEA_VLLM_LVM" - LLM_MODEL_ID: ${LVM_MODEL_ID} - HF_HUB_DISABLE_PROGRESS_BARS: 1 - HF_HUB_ENABLE_HF_TRANSFER: 0 - restart: unless-stopped - visualqna-gaudi-backend-server: - image: ${REGISTRY:-opea}/visualqna:${TAG:-latest} - container_name: visualqna-gaudi-backend-server - depends_on: - - vllm-gaudi-service - - lvm - ports: - - "8888:8888" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} - - 
LVM_SERVICE_HOST_IP=${LVM_SERVICE_HOST_IP} - ipc: host - restart: always - visualqna-gaudi-ui-server: - image: ${REGISTRY:-opea}/visualqna-ui:${TAG:-latest} - container_name: visualqna-gaudi-ui-server - depends_on: - - visualqna-gaudi-backend-server - ports: - - "5173:5173" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - BACKEND_BASE_URL=${BACKEND_SERVICE_ENDPOINT} - ipc: host - restart: always - visualqna-gaudi-nginx-server: - image: ${REGISTRY:-opea}/nginx:${TAG:-latest} - container_name: visualqna-gaudi-nginx-server - depends_on: - - visualqna-gaudi-backend-server - - visualqna-gaudi-ui-server - ports: - - "${NGINX_PORT:-80}:80" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - FRONTEND_SERVICE_IP=${FRONTEND_SERVICE_IP} - - FRONTEND_SERVICE_PORT=${FRONTEND_SERVICE_PORT} - - BACKEND_SERVICE_NAME=${BACKEND_SERVICE_NAME} - - BACKEND_SERVICE_IP=${BACKEND_SERVICE_IP} - - BACKEND_SERVICE_PORT=${BACKEND_SERVICE_PORT} - ipc: host - restart: always - -networks: - default: - driver: bridge diff --git a/VisualQnA/docker_compose/intel/hpu/gaudi/compose_tgi.yaml b/VisualQnA/docker_compose/intel/hpu/gaudi/compose_tgi.yaml deleted file mode 100644 index 251b4fce70..0000000000 --- a/VisualQnA/docker_compose/intel/hpu/gaudi/compose_tgi.yaml +++ /dev/null @@ -1,105 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -services: - llava-tgi-service: - image: ghcr.io/huggingface/tgi-gaudi:2.3.1 - container_name: tgi-llava-gaudi-server - ports: - - "8399:80" - volumes: - - "${MODEL_CACHE:-./data}:/data" - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - HF_HUB_DISABLE_PROGRESS_BARS: 1 - HF_HUB_ENABLE_HF_TRANSFER: 0 - HABANA_VISIBLE_DEVICES: all - OMPI_MCA_btl_vader_single_copy_mechanism: none - HUGGING_FACE_HUB_TOKEN: ${HUGGINGFACEHUB_API_TOKEN} - ENABLE_HPU_GRAPH: true - LIMIT_HPU_GRAPH: true - USE_FLASH_ATTENTION: true - FLASH_ATTENTION_RECOMPUTE: true - healthcheck: - test: ["CMD-SHELL", "curl -f http://$host_ip:8399/health || exit 1"] - interval: 10s - timeout: 10s - retries: 60 - runtime: habana - cap_add: - - SYS_NICE - ipc: host - command: --model-id ${LVM_MODEL_ID} --max-input-length 4096 --max-total-tokens 8192 - lvm: - image: ${REGISTRY:-opea}/lvm:${TAG:-latest} - container_name: lvm-gaudi-server - depends_on: - llava-tgi-service: - condition: service_healthy - ports: - - "9399:9399" - ipc: host - environment: - no_proxy: ${no_proxy} - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - LVM_ENDPOINT: ${LVM_ENDPOINT} - LVM_COMPONENT_NAME: "OPEA_TGI_LLAVA_LVM" - HF_HUB_DISABLE_PROGRESS_BARS: 1 - HF_HUB_ENABLE_HF_TRANSFER: 0 - restart: unless-stopped - visualqna-gaudi-backend-server: - image: ${REGISTRY:-opea}/visualqna:${TAG:-latest} - container_name: visualqna-gaudi-backend-server - depends_on: - - llava-tgi-service - - lvm - ports: - - "8888:8888" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - MEGA_SERVICE_HOST_IP=${MEGA_SERVICE_HOST_IP} - - LVM_SERVICE_HOST_IP=${LVM_SERVICE_HOST_IP} - ipc: host - restart: always - visualqna-gaudi-ui-server: - image: ${REGISTRY:-opea}/visualqna-ui:${TAG:-latest} - container_name: visualqna-gaudi-ui-server - depends_on: - - visualqna-gaudi-backend-server - ports: - - "5173:5173" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - 
BACKEND_BASE_URL=${BACKEND_SERVICE_ENDPOINT} - ipc: host - restart: always - visualqna-gaudi-nginx-server: - image: ${REGISTRY:-opea}/nginx:${TAG:-latest} - container_name: visualqna-gaudi-nginx-server - depends_on: - - visualqna-gaudi-backend-server - - visualqna-gaudi-ui-server - ports: - - "${NGINX_PORT:-80}:80" - environment: - - no_proxy=${no_proxy} - - https_proxy=${https_proxy} - - http_proxy=${http_proxy} - - FRONTEND_SERVICE_IP=${FRONTEND_SERVICE_IP} - - FRONTEND_SERVICE_PORT=${FRONTEND_SERVICE_PORT} - - BACKEND_SERVICE_NAME=${BACKEND_SERVICE_NAME} - - BACKEND_SERVICE_IP=${BACKEND_SERVICE_IP} - - BACKEND_SERVICE_PORT=${BACKEND_SERVICE_PORT} - ipc: host - restart: always - -networks: - default: - driver: bridge diff --git a/VisualQnA/docker_compose/intel/hpu/gaudi/set_env.sh b/VisualQnA/docker_compose/intel/hpu/gaudi/set_env.sh deleted file mode 100644 index 57032fdce5..0000000000 --- a/VisualQnA/docker_compose/intel/hpu/gaudi/set_env.sh +++ /dev/null @@ -1,22 +0,0 @@ -#!/usr/bin/env bash - -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 -pushd "../../../../../" > /dev/null -source .set_env.sh -popd > /dev/null - -export host_ip=$(hostname -I | awk '{print $1}') -export no_proxy=$host_ip,$no_proxy -# export LVM_MODEL_ID="llava-hf/llava-v1.6-mistral-7b-hf" -export LVM_MODEL_ID="llava-hf/llava-1.5-7b-hf" -export LVM_ENDPOINT="http://${host_ip}:8399" -export LVM_SERVICE_PORT=9399 -export MEGA_SERVICE_HOST_IP=${host_ip} -export LVM_SERVICE_HOST_IP=${host_ip} -export BACKEND_SERVICE_ENDPOINT="http://${host_ip}:8888/v1/visualqna" -export FRONTEND_SERVICE_IP=${host_ip} -export FRONTEND_SERVICE_PORT=5173 -export BACKEND_SERVICE_NAME=visualqna -export BACKEND_SERVICE_IP=${host_ip} -export BACKEND_SERVICE_PORT=8888 diff --git a/VisualQnA/docker_image_build/build.yaml b/VisualQnA/docker_image_build/build.yaml deleted file mode 100644 index 7dcb7be0a1..0000000000 --- a/VisualQnA/docker_image_build/build.yaml +++ /dev/null @@ -1,31 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -services: - visualqna: - build: - args: - http_proxy: ${http_proxy} - https_proxy: ${https_proxy} - no_proxy: ${no_proxy} - context: ../ - dockerfile: ./Dockerfile - image: ${REGISTRY:-opea}/visualqna:${TAG:-latest} - visualqna-ui: - build: - context: ../ui - dockerfile: ./docker/Dockerfile - extends: visualqna - image: ${REGISTRY:-opea}/visualqna-ui:${TAG:-latest} - lvm: - build: - context: GenAIComps - dockerfile: comps/lvms/src/Dockerfile - extends: visualqna - image: ${REGISTRY:-opea}/lvm:${TAG:-latest} - nginx: - build: - context: GenAIComps - dockerfile: comps/third_parties/nginx/src/Dockerfile - extends: visualqna - image: ${REGISTRY:-opea}/nginx:${TAG:-latest} diff --git a/VisualQnA/kubernetes/gmc/README.md b/VisualQnA/kubernetes/gmc/README.md deleted file mode 100644 index 75669d4e39..0000000000 --- a/VisualQnA/kubernetes/gmc/README.md +++ /dev/null @@ -1,56 +0,0 @@ -# Deploy VisualQnA in a Kubernetes Cluster - -This document outlines the deployment process for a Visual Question Answering (VisualQnA) application that utilizes the [GenAIComps](https://github.com/opea-project/GenAIComps.git) microservice components on Intel Xeon servers and Gaudi machines. - -Please install GMC in your Kubernetes cluster, if you have not already done so, by following the steps in Section "Getting Started" at [GMC Install](https://github.com/opea-project/GenAIInfra/tree/main/microservices-connector/README.md). 
We will soon publish images to Docker Hub, at which point no builds will be required, further simplifying install. - -If you have only Intel Xeon machines you could use the visualqna_xeon.yaml file or if you have a Gaudi cluster you could use visualqna_gaudi.yaml -In the below example we illustrate on Xeon. - -## Deploy the VisualQnA application - -1. Create the desired namespace if it does not already exist and deploy the application - ```bash - export APP_NAMESPACE=visualqna - kubectl create ns $APP_NAMESPACE - kubectl apply -f ./visualqna_xeon.yaml - ``` - -2. Check if the application is up and ready - ```bash - kubectl get pods -n $APP_NAMESPACE - ``` - -3. Deploy a client pod for testing - ```bash - kubectl create deployment client-test -n $APP_NAMESPACE --image=python:3.8.13 -- sleep infinity - ``` - -4. Check that client pod is ready - ```bash - kubectl get pods -n $APP_NAMESPACE - ``` - -5. Send request to application - ```bash - export CLIENT_POD=$(kubectl get pod -n $APP_NAMESPACE -l app=client-test -o jsonpath={.items..metadata.name}) - export accessUrl=$(kubectl get gmc -n $APP_NAMESPACE -o jsonpath="{.items[?(@.metadata.name=='visualqna')].status.accessUrl}") - kubectl exec "$CLIENT_POD" -n $APP_NAMESPACE -- curl $accessUrl -X POST -d '{"messages": [ - { - "role": "user", - "content": [ - { - "type": "text", - "text": "What'\''s in this image?" - }, - { - "type": "image_url", - "image_url": { - "url": "https://www.ilankelman.org/stopsigns/australia.jpg" - } - } - ] - } - ], - "max_tokens": 128}' -H 'Content-Type: application/json' > $LOG_PATH/gmc_visualqna.log - ``` diff --git a/VisualQnA/kubernetes/gmc/visualqna_gaudi.yaml b/VisualQnA/kubernetes/gmc/visualqna_gaudi.yaml deleted file mode 100644 index 4bd8248026..0000000000 --- a/VisualQnA/kubernetes/gmc/visualqna_gaudi.yaml +++ /dev/null @@ -1,34 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -apiVersion: gmc.opea.io/v1alpha3 -kind: GMConnector -metadata: - labels: - app.kubernetes.io/name: gmconnector - app.kubernetes.io/managed-by: kustomize - gmc/platform: gaudi - name: visualqna - namespace: visualqna -spec: - routerConfig: - name: router - serviceName: router-service - nodes: - root: - routerType: Sequence - steps: - - name: Lvm - data: $response - internalService: - serviceName: visualqna-service - config: - endpoint: /v1/lvm - LVM_ENDPOINT: visualqna-tgi-svc - - name: TgiGaudi - internalService: - serviceName: visualqna-tgi-svc - config: - MODEL_ID: llava-hf/llava-v1.6-mistral-7b-hf - endpoint: /generate - isDownstreamService: true diff --git a/VisualQnA/kubernetes/gmc/visualqna_xeon.yaml b/VisualQnA/kubernetes/gmc/visualqna_xeon.yaml deleted file mode 100644 index c789c09dab..0000000000 --- a/VisualQnA/kubernetes/gmc/visualqna_xeon.yaml +++ /dev/null @@ -1,34 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -apiVersion: gmc.opea.io/v1alpha3 -kind: GMConnector -metadata: - labels: - app.kubernetes.io/name: gmconnector - app.kubernetes.io/managed-by: kustomize - gmc/platform: xeon - name: visualqna - namespace: visualqna -spec: - routerConfig: - name: router - serviceName: router-service - nodes: - root: - routerType: Sequence - steps: - - name: Lvm - data: $response - internalService: - serviceName: visualqna-service - config: - endpoint: /v1/lvm - LVM_ENDPOINT: visualqna-tgi-svc - - name: Tgi - internalService: - serviceName: visualqna-tgi-svc - config: - MODEL_ID: llava-hf/llava-v1.6-mistral-7b-hf - endpoint: /generate - 
isDownstreamService: true diff --git a/VisualQnA/kubernetes/helm/README.md b/VisualQnA/kubernetes/helm/README.md deleted file mode 100644 index d6dd382b90..0000000000 --- a/VisualQnA/kubernetes/helm/README.md +++ /dev/null @@ -1,18 +0,0 @@ -# Deploy VisualQnA on Kubernetes cluster - -- You should have Helm (version >= 3.15) installed. Refer to the [Helm Installation Guide](https://helm.sh/docs/intro/install/) for more information. -- For more deploy options, refer to [helm charts README](https://github.com/opea-project/GenAIInfra/tree/main/helm-charts#readme). - -## Deploy on Xeon - -``` -export HFTOKEN="insert-your-huggingface-token-here" -helm install visualqna oci://ghcr.io/opea-project/charts/visualqna --set global.HUGGINGFACEHUB_API_TOKEN=${HFTOKEN} -f cpu-values.yaml -``` - -## Deploy on Gaudi - -``` -export HFTOKEN="insert-your-huggingface-token-here" -helm install visualqna oci://ghcr.io/opea-project/charts/visualqna --set global.HUGGINGFACEHUB_API_TOKEN=${HFTOKEN} -f gaudi-values.yaml -``` diff --git a/VisualQnA/kubernetes/helm/cpu-values.yaml b/VisualQnA/kubernetes/helm/cpu-values.yaml deleted file mode 100644 index acc9d4e28d..0000000000 --- a/VisualQnA/kubernetes/helm/cpu-values.yaml +++ /dev/null @@ -1,7 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -tgi: - MAX_INPUT_LENGTH: "4096" - MAX_TOTAL_TOKENS: "8192" - LLM_MODEL_ID: llava-hf/llava-v1.6-mistral-7b-hf diff --git a/VisualQnA/kubernetes/helm/gaudi-values.yaml b/VisualQnA/kubernetes/helm/gaudi-values.yaml deleted file mode 100644 index eb6494a142..0000000000 --- a/VisualQnA/kubernetes/helm/gaudi-values.yaml +++ /dev/null @@ -1,36 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -# Accelerate inferencing in heaviest components to improve performance -# by overriding their subchart values - -# TGI: largest bottleneck for VisualQnA -tgi: - accelDevice: "gaudi" - image: - repository: ghcr.io/huggingface/tgi-gaudi - tag: "2.3.1" - resources: - limits: - habana.ai/gaudi: 1 - MAX_INPUT_LENGTH: "4096" - MAX_TOTAL_TOKENS: "8192" - CUDA_GRAPHS: "" - OMPI_MCA_btl_vader_single_copy_mechanism: "none" - ENABLE_HPU_GRAPH: "true" - LIMIT_HPU_GRAPH: "true" - USE_FLASH_ATTENTION: "true" - FLASH_ATTENTION_RECOMPUTE: "true" - livenessProbe: - initialDelaySeconds: 5 - periodSeconds: 5 - timeoutSeconds: 1 - readinessProbe: - initialDelaySeconds: 5 - periodSeconds: 5 - timeoutSeconds: 1 - startupProbe: - initialDelaySeconds: 5 - periodSeconds: 5 - timeoutSeconds: 1 - failureThreshold: 120 diff --git a/VisualQnA/tests/test_compose_on_gaudi.sh b/VisualQnA/tests/test_compose_on_gaudi.sh deleted file mode 100644 index 3fbc8e0adc..0000000000 --- a/VisualQnA/tests/test_compose_on_gaudi.sh +++ /dev/null @@ -1,203 +0,0 @@ -#!/bin/bash -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -set -x -IMAGE_REPO=${IMAGE_REPO:-"opea"} -IMAGE_TAG=${IMAGE_TAG:-"latest"} -echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" -echo "TAG=IMAGE_TAG=${IMAGE_TAG}" -export REGISTRY=${IMAGE_REPO} -export TAG=${IMAGE_TAG} -export MODEL_CACHE=${model_cache:-"./data"} -export NGINX_PORT=81 -export VLLM_SKIP_WARMUP=true - -WORKPATH=$(dirname "$PWD") -LOG_PATH="$WORKPATH/tests" -ip_address=$(hostname -I | awk '{print $1}') - -function build_docker_images() { - cd $WORKPATH/docker_image_build - git clone --depth 1 --branch main https://github.com/opea-project/GenAIComps.git - docker compose -f build.yaml build --no-cache > ${LOG_PATH}/docker_image_build.log - - git clone 
https://github.com/HabanaAI/vllm-fork.git - cd ./vllm-fork/ - docker build -f Dockerfile.hpu -t opea/vllm-gaudi:${TAG} --shm-size=128g . --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy - cd .. - rm -rf vllm-fork - - docker images && sleep 1s -} - -function start_services() { - cd $WORKPATH/docker_compose/intel/hpu/gaudi - - source ./set_env.sh - - - sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env - - # Start Docker Containers - docker compose up -d > ${LOG_PATH}/start_services_with_compose.log - - n=0 - until [[ "$n" -ge 100 ]]; do - docker logs vllm-gaudi-service > ${LOG_PATH}/lvm_vllm_service_start.log - if grep -q Starting ${LOG_PATH}/lvm_vllm_service_start.log; then - break - fi - sleep 5s - n=$((n+1)) - done -} - -function validate_services() { - local URL="$1" - local EXPECTED_RESULT="$2" - local SERVICE_NAME="$3" - local DOCKER_NAME="$4" - local INPUT_DATA="$5" - - local HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") - if [ "$HTTP_STATUS" -eq 200 ]; then - echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." - - local CONTENT=$(curl -s -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL" | tee ${LOG_PATH}/${SERVICE_NAME}.log) - - if echo "$CONTENT" | grep -q "$EXPECTED_RESULT"; then - echo "[ $SERVICE_NAME ] Content is as expected." - else - echo "[ $SERVICE_NAME ] Content does not match the expected result: $CONTENT" - docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log - exit 1 - fi - else - echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS" - docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log - exit 1 - fi - sleep 1s -} - -function validate_microservices() { - sleep 15s - # Check if the microservices are running correctly. - - # lvm microservice - validate_services \ - "${ip_address}:9399/v1/lvm" \ - "yellow" \ - "lvm" \ - "lvm-vllm-gaudi-service" \ - '{"image": "iVBORw0KGgoAAAANSUhEUgAAAAoAAAAKCAYAAACNMs+9AAAAFUlEQVR42mP8/5+hnoEIwDiqkL4KAcT9GO0U4BxoAAAAAElFTkSuQmCC", "prompt":"What is this?"}' -} - -function validate_megaservice() { - sleep 15s - # Curl the Mega Service - validate_services \ - "${ip_address}:8888/v1/visualqna" \ - "sign" \ - "visualqna-gaudi-backend-server" \ - "visualqna-gaudi-backend-server" \ - '{ - "messages": [ - { - "role": "user", - "content": [ - { - "type": "text", - "text": "What'\''s in this image?" - }, - { - "type": "image_url", - "image_url": { - "url": "https://www.ilankelman.org/stopsigns/australia.jpg" - } - } - ] - } - ], - "max_tokens": 300 - }' - - # test the megeservice via nginx - validate_services \ - "${ip_address}:${NGINX_PORT}/v1/visualqna" \ - "sign" \ - "visualqna-gaudi-nginx-server" \ - "visualqna-gaudi-nginx-server" \ - '{ - "messages": [ - { - "role": "user", - "content": [ - { - "type": "text", - "text": "What'\''s in this image?" - }, - { - "type": "image_url", - "image_url": { - "url": "https://www.ilankelman.org/stopsigns/australia.jpg" - } - } - ] - } - ], - "max_tokens": 300 - }' -} - -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" 
- else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - -function stop_docker() { - cd $WORKPATH/docker_compose/intel/hpu/gaudi - docker compose stop && docker compose rm -f -} - -function main() { - - stop_docker - - if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi - start_services - - validate_microservices - validate_megaservice - #validate_frontend - - stop_docker - echo y | docker system prune - -} - -main diff --git a/VisualQnA/tests/test_compose_on_rocm.sh b/VisualQnA/tests/test_compose_on_rocm.sh deleted file mode 100644 index 5092dd39cd..0000000000 --- a/VisualQnA/tests/test_compose_on_rocm.sh +++ /dev/null @@ -1,224 +0,0 @@ -#!/bin/bash -# Copyright (C) 2024 Advanced Micro Devices, Inc. -# SPDX-License-Identifier: Apache-2.0 - -set -x -IMAGE_REPO=${IMAGE_REPO:-"opea"} -IMAGE_TAG=${IMAGE_TAG:-"latest"} -echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" -echo "TAG=IMAGE_TAG=${IMAGE_TAG}" - -WORKPATH=$(dirname "$PWD") -LOG_PATH="$WORKPATH/tests" -ip_address=$(hostname -I | awk '{print $1}') - -export REGISTRY=${IMAGE_REPO} -export TAG=${IMAGE_TAG} -export HOST_IP=${ip_address} -export VISUALQNA_TGI_SERVICE_PORT="8399" -export VISUALQNA_HUGGINGFACEHUB_API_TOKEN=${HUGGINGFACEHUB_API_TOKEN} -export VISUALQNA_CARD_ID="card1" -export VISUALQNA_RENDER_ID="renderD136" -export LVM_MODEL_ID="Xkev/Llama-3.2V-11B-cot" -export MODEL="llava-hf/llava-v1.6-mistral-7b-hf" -export LVM_ENDPOINT="http://${HOST_IP}:8399" -export LVM_SERVICE_PORT=9399 -export MEGA_SERVICE_HOST_IP=${HOST_IP} -export LVM_SERVICE_HOST_IP=${HOST_IP} -export BACKEND_SERVICE_ENDPOINT="http://${HOST_IP}:${BACKEND_SERVICE_PORT}/v1/visualqna" -export FRONTEND_SERVICE_IP=${HOST_IP} -export FRONTEND_SERVICE_PORT=5173 -export BACKEND_SERVICE_NAME=visualqna -export BACKEND_SERVICE_IP=${HOST_IP} -export BACKEND_SERVICE_PORT=8888 -export NGINX_PORT=18003 -export PATH="~/miniconda3/bin:$PATH" - -function build_docker_images() { - opea_branch=${opea_branch:-"main"} - # If the opea_branch isn't main, replace the git clone branch in Dockerfile. - if [[ "${opea_branch}" != "main" ]]; then - cd $WORKPATH - OLD_STRING="RUN git clone --depth 1 https://github.com/opea-project/GenAIComps.git" - NEW_STRING="RUN git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git" - find . -type f -name "Dockerfile*" | while read -r file; do - echo "Processing file: $file" - sed -i "s|$OLD_STRING|$NEW_STRING|g" "$file" - done - fi - - cd $WORKPATH/docker_image_build - git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git - - echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
- docker compose -f build.yaml build --no-cache > ${LOG_PATH}/docker_image_build.log - - docker pull ghcr.io/huggingface/text-generation-inference:2.4.1-rocm - docker images && sleep 1s -} - -function start_services() { - cd $WORKPATH/docker_compose/amd/gpu/rocm - - sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env - - # Start Docker Containers - docker compose up -d > ${LOG_PATH}/start_services_with_compose.log - - n=0 - until [[ "$n" -ge 100 ]]; do - docker logs visualqna-tgi-service > ${LOG_PATH}/lvm_tgi_service_start.log - if grep -q Connected ${LOG_PATH}/lvm_tgi_service_start.log; then - break - fi - sleep 5s - n=$((n+1)) - done -} - -function validate_services() { - local URL="$1" - local EXPECTED_RESULT="$2" - local SERVICE_NAME="$3" - local DOCKER_NAME="$4" - local INPUT_DATA="$5" - - local HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") - if [ "$HTTP_STATUS" -eq 200 ]; then - echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." - - local CONTENT=$(curl -s -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL" | tee ${LOG_PATH}/${SERVICE_NAME}.log) - - if echo "$CONTENT" | grep -q "$EXPECTED_RESULT"; then - echo "[ $SERVICE_NAME ] Content is as expected." - else - echo "[ $SERVICE_NAME ] Content does not match the expected result: $CONTENT" - docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log - exit 1 - fi - else - echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS" - docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log - exit 1 - fi - sleep 1s -} - -function validate_microservices() { - # Check if the microservices are running correctly. - - # lvm microservice - validate_services \ - "${ip_address}:9399/v1/lvm" \ - "The image" \ - "lvm" \ - "visualqna-tgi-service" \ - '{"image": "iVBORw0KGgoAAAANSUhEUgAAAAoAAAAKCAYAAACNMs+9AAAAFUlEQVR42mP8/5+hnoEIwDiqkL4KAcT9GO0U4BxoAAAAAElFTkSuQmCC", "prompt":"What is this?"}' -} - -function validate_megaservice() { - # Curl the Mega Service - validate_services \ - "${ip_address}:8888/v1/visualqna" \ - "The image" \ - "visualqna-rocm-backend-server" \ - "visualqna-rocm-backend-server" \ - '{ - "messages": [ - { - "role": "user", - "content": [ - { - "type": "text", - "text": "What'\''s in this image?" - }, - { - "type": "image_url", - "image_url": { - "url": "https://www.ilankelman.org/stopsigns/australia.jpg" - } - } - ] - } - ], - "max_tokens": 300 - }' - - # test the megeservice via nginx - validate_services \ - "${ip_address}:${NGINX_PORT}/v1/visualqna" \ - "The image" \ - "visualqna-rocm-nginx-server" \ - "visualqna-rocm-nginx-server" \ - '{ - "messages": [ - { - "role": "user", - "content": [ - { - "type": "text", - "text": "What'\''s in this image?" - }, - { - "type": "image_url", - "image_url": { - "url": "https://www.ilankelman.org/stopsigns/australia.jpg" - } - } - ] - } - ], - "max_tokens": 300 - }' -} - -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? 
- - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - -function stop_docker() { - cd $WORKPATH/docker_compose/amd/gpu/rocm/ - docker compose stop && docker compose rm -f -} - -function main() { - - stop_docker - - if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi - start_services - - validate_microservices - validate_megaservice - #validate_frontend - - stop_docker - echo y | docker system prune - -} - -main diff --git a/VisualQnA/tests/test_compose_on_xeon.sh b/VisualQnA/tests/test_compose_on_xeon.sh deleted file mode 100644 index 0e645c324b..0000000000 --- a/VisualQnA/tests/test_compose_on_xeon.sh +++ /dev/null @@ -1,196 +0,0 @@ -#!/bin/bash -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -set -x -IMAGE_REPO=${IMAGE_REPO:-"opea"} -IMAGE_TAG=${IMAGE_TAG:-"latest"} -echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" -echo "TAG=IMAGE_TAG=${IMAGE_TAG}" -export REGISTRY=${IMAGE_REPO} -export TAG=${IMAGE_TAG} -export MODEL_CACHE=${model_cache:-"./data"} -export NGINX_PORT=81 - -WORKPATH=$(dirname "$PWD") -LOG_PATH="$WORKPATH/tests" -ip_address=$(hostname -I | awk '{print $1}') - -function build_docker_images() { - cd $WORKPATH/docker_image_build - git clone --depth 1 --branch main https://github.com/opea-project/GenAIComps.git - docker compose -f build.yaml build --no-cache > ${LOG_PATH}/docker_image_build.log - - docker pull opea/vllm:latest - docker tag opea/vllm:latest opea/vllm:${TAG} - docker images && sleep 1s -} - -function start_services() { - cd $WORKPATH/docker_compose/intel/cpu/xeon/ - - source ./set_env.sh - - sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env - - # Start Docker Containers - docker compose up -d > ${LOG_PATH}/start_services_with_compose.log - - n=0 - until [[ "$n" -ge 200 ]]; do - docker logs vllm-service > ${LOG_PATH}/lvm_vllm_service_start.log - if grep -q Starting ${LOG_PATH}/lvm_vllm_service_start.log; then - break - fi - sleep 5s - n=$((n+1)) - done -} - -function validate_services() { - local URL="$1" - local EXPECTED_RESULT="$2" - local SERVICE_NAME="$3" - local DOCKER_NAME="$4" - local INPUT_DATA="$5" - - local HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") - if [ "$HTTP_STATUS" -eq 200 ]; then - echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." - - local CONTENT=$(curl -s -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL" | tee ${LOG_PATH}/${SERVICE_NAME}.log) - - if echo "$CONTENT" | grep -q "$EXPECTED_RESULT"; then - echo "[ $SERVICE_NAME ] Content is as expected." - else - echo "[ $SERVICE_NAME ] Content does not match the expected result: $CONTENT" - docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log - exit 1 - fi - else - echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS" - docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log - exit 1 - fi - sleep 1s -} - -function validate_microservices() { - sleep 15s - # Check if the microservices are running correctly. 
- - # lvm microservice - validate_services \ - "${ip_address}:9399/v1/lvm" \ - "yellow" \ - "lvm" \ - "lvm-xeon-server" \ - '{"image": "iVBORw0KGgoAAAANSUhEUgAAAAoAAAAKCAYAAACNMs+9AAAAFUlEQVR42mP8/5+hnoEIwDiqkL4KAcT9GO0U4BxoAAAAAElFTkSuQmCC", "prompt":"What is this?"}' -} - -function validate_megaservice() { - # Curl the Mega Service - validate_services \ - "${ip_address}:8888/v1/visualqna" \ - "sign" \ - "visualqna-xeon-backend-server" \ - "visualqna-xeon-backend-server" \ - '{ - "messages": [ - { - "role": "user", - "content": [ - { - "type": "text", - "text": "What'\''s in this image?" - }, - { - "type": "image_url", - "image_url": { - "url": "https://www.ilankelman.org/stopsigns/australia.jpg" - } - } - ] - } - ], - "max_tokens": 300 - }' - - # test the megeservice via nginx - validate_services \ - "${ip_address}:${NGINX_PORT}/v1/visualqna" \ - "sign" \ - "visualqna-xeon-nginx-server" \ - "visualqna-xeon-nginx-server" \ - '{ - "messages": [ - { - "role": "user", - "content": [ - { - "type": "text", - "text": "What'\''s in this image?" - }, - { - "type": "image_url", - "image_url": { - "url": "https://www.ilankelman.org/stopsigns/australia.jpg" - } - } - ] - } - ], - "max_tokens": 300 - }' -} - -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - -function stop_docker() { - cd $WORKPATH/docker_compose/intel/cpu/xeon/ - docker compose stop && docker compose rm -f -} - -function main() { - - stop_docker - - if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi - start_services - - validate_microservices - validate_megaservice - #validate_frontend - - stop_docker - echo y | docker system prune - -} - -main diff --git a/VisualQnA/tests/test_compose_tgi_on_gaudi.sh b/VisualQnA/tests/test_compose_tgi_on_gaudi.sh deleted file mode 100644 index 913d6ed527..0000000000 --- a/VisualQnA/tests/test_compose_tgi_on_gaudi.sh +++ /dev/null @@ -1,222 +0,0 @@ -#!/bin/bash -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -set -x -IMAGE_REPO=${IMAGE_REPO:-"opea"} -IMAGE_TAG=${IMAGE_TAG:-"latest"} -echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" -echo "TAG=IMAGE_TAG=${IMAGE_TAG}" -export REGISTRY=${IMAGE_REPO} -export TAG=${IMAGE_TAG} -export MODEL_CACHE=${model_cache:-"./data"} - -WORKPATH=$(dirname "$PWD") -LOG_PATH="$WORKPATH/tests" -ip_address=$(hostname -I | awk '{print $1}') - -function build_docker_images() { - opea_branch=${opea_branch:-"main"} - # If the opea_branch isn't main, replace the git clone branch in Dockerfile. - if [[ "${opea_branch}" != "main" ]]; then - cd $WORKPATH - OLD_STRING="RUN git clone --depth 1 https://github.com/opea-project/GenAIComps.git" - NEW_STRING="RUN git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git" - find . 
-type f -name "Dockerfile*" | while read -r file; do - echo "Processing file: $file" - sed -i "s|$OLD_STRING|$NEW_STRING|g" "$file" - done - fi - - cd $WORKPATH/docker_image_build - git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git - - echo "Build all the images with --no-cache, check docker_image_build.log for details..." - docker compose -f build.yaml build --no-cache > ${LOG_PATH}/docker_image_build.log - - docker pull ghcr.io/huggingface/tgi-gaudi:2.0.6 - docker images && sleep 1s -} - -function start_services() { - cd $WORKPATH/docker_compose/intel/hpu/gaudi - - export LVM_MODEL_ID="llava-hf/llava-v1.6-mistral-7b-hf" - export LVM_ENDPOINT="http://${ip_address}:8399" - export HUGGINGFACEHUB_API_TOKEN=${HUGGINGFACEHUB_API_TOKEN} - export LVM_SERVICE_PORT=9399 - export MEGA_SERVICE_HOST_IP=${ip_address} - export LVM_SERVICE_HOST_IP=${ip_address} - export BACKEND_SERVICE_ENDPOINT="http://${ip_address}:8888/v1/visualqna" - export FRONTEND_SERVICE_IP=${ip_address} - export FRONTEND_SERVICE_PORT=5173 - export BACKEND_SERVICE_NAME=visualqna - export BACKEND_SERVICE_IP=${ip_address} - export BACKEND_SERVICE_PORT=8888 - export NGINX_PORT=80 - export host_ip=${ip_address} - - sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env - - # Start Docker Containers - docker compose -f compose_tgi.yaml up -d > ${LOG_PATH}/start_services_with_compose.log - - n=0 - until [[ "$n" -ge 100 ]]; do - docker logs tgi-llava-gaudi-server > ${LOG_PATH}/lvm_tgi_service_start.log - if grep -q Connected ${LOG_PATH}/lvm_tgi_service_start.log; then - break - fi - sleep 5s - n=$((n+1)) - done -} - -function validate_services() { - local URL="$1" - local EXPECTED_RESULT="$2" - local SERVICE_NAME="$3" - local DOCKER_NAME="$4" - local INPUT_DATA="$5" - - local HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") - if [ "$HTTP_STATUS" -eq 200 ]; then - echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." - - local CONTENT=$(curl -s -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL" | tee ${LOG_PATH}/${SERVICE_NAME}.log) - - if echo "$CONTENT" | grep -q "$EXPECTED_RESULT"; then - echo "[ $SERVICE_NAME ] Content is as expected." - else - echo "[ $SERVICE_NAME ] Content does not match the expected result: $CONTENT" - docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log - exit 1 - fi - else - echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS" - docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log - exit 1 - fi - sleep 1s -} - -function validate_microservices() { - sleep 15s - # Check if the microservices are running correctly. - - # lvm microservice - validate_services \ - "${ip_address}:9399/v1/lvm" \ - "The image" \ - "lvm" \ - "lvm-gaudi-server" \ - '{"image": "iVBORw0KGgoAAAANSUhEUgAAAAoAAAAKCAYAAACNMs+9AAAAFUlEQVR42mP8/5+hnoEIwDiqkL4KAcT9GO0U4BxoAAAAAElFTkSuQmCC", "prompt":"What is this?"}' -} - -function validate_megaservice() { - sleep 15s - # Curl the Mega Service - validate_services \ - "${ip_address}:8888/v1/visualqna" \ - "The image" \ - "visualqna-gaudi-backend-server" \ - "visualqna-gaudi-backend-server" \ - '{ - "messages": [ - { - "role": "user", - "content": [ - { - "type": "text", - "text": "What'\''s in this image?" 
- }, - { - "type": "image_url", - "image_url": { - "url": "https://www.ilankelman.org/stopsigns/australia.jpg" - } - } - ] - } - ], - "max_tokens": 300 - }' - - # test the megeservice via nginx - validate_services \ - "${ip_address}:80/v1/visualqna" \ - "The image" \ - "visualqna-gaudi-nginx-server" \ - "visualqna-gaudi-nginx-server" \ - '{ - "messages": [ - { - "role": "user", - "content": [ - { - "type": "text", - "text": "What'\''s in this image?" - }, - { - "type": "image_url", - "image_url": { - "url": "https://www.ilankelman.org/stopsigns/australia.jpg" - } - } - ] - } - ], - "max_tokens": 300 - }' -} - -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - -function stop_docker() { - cd $WORKPATH/docker_compose/intel/hpu/gaudi - docker compose stop && docker compose rm -f -} - -function main() { - - stop_docker - - if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi - start_services - - validate_microservices - validate_megaservice - # validate_frontend - - stop_docker - echo y | docker system prune - -} - -main diff --git a/VisualQnA/tests/test_compose_tgi_on_xeon.sh b/VisualQnA/tests/test_compose_tgi_on_xeon.sh deleted file mode 100644 index d6311719d0..0000000000 --- a/VisualQnA/tests/test_compose_tgi_on_xeon.sh +++ /dev/null @@ -1,222 +0,0 @@ -#!/bin/bash -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -set -x -IMAGE_REPO=${IMAGE_REPO:-"opea"} -IMAGE_TAG=${IMAGE_TAG:-"latest"} -echo "REGISTRY=IMAGE_REPO=${IMAGE_REPO}" -echo "TAG=IMAGE_TAG=${IMAGE_TAG}" -export REGISTRY=${IMAGE_REPO} -export TAG=${IMAGE_TAG} -export MODEL_CACHE=${model_cache:-"./data"} - -WORKPATH=$(dirname "$PWD") -LOG_PATH="$WORKPATH/tests" -ip_address=$(hostname -I | awk '{print $1}') - -function build_docker_images() { - opea_branch=${opea_branch:-"main"} - # If the opea_branch isn't main, replace the git clone branch in Dockerfile. - if [[ "${opea_branch}" != "main" ]]; then - cd $WORKPATH - OLD_STRING="RUN git clone --depth 1 https://github.com/opea-project/GenAIComps.git" - NEW_STRING="RUN git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git" - find . -type f -name "Dockerfile*" | while read -r file; do - echo "Processing file: $file" - sed -i "s|$OLD_STRING|$NEW_STRING|g" "$file" - done - fi - - cd $WORKPATH/docker_image_build - git clone --depth 1 --branch ${opea_branch} https://github.com/opea-project/GenAIComps.git - - echo "Build all the images with --no-cache, check docker_image_build.log for details..." 
- docker compose -f build.yaml build --no-cache > ${LOG_PATH}/docker_image_build.log - - docker pull ghcr.io/huggingface/text-generation-inference:2.4.0-intel-cpu - docker images && sleep 1s -} - -function start_services() { - cd $WORKPATH/docker_compose/intel/cpu/xeon/ - - export LVM_MODEL_ID="llava-hf/llava-v1.6-mistral-7b-hf" - export LVM_ENDPOINT="http://${ip_address}:8399" - export HUGGINGFACEHUB_API_TOKEN=${HUGGINGFACEHUB_API_TOKEN} - export LVM_SERVICE_PORT=9399 - export MEGA_SERVICE_HOST_IP=${ip_address} - export LVM_SERVICE_HOST_IP=${ip_address} - export BACKEND_SERVICE_ENDPOINT="http://${ip_address}:8888/v1/visualqna" - export FRONTEND_SERVICE_IP=${ip_address} - export FRONTEND_SERVICE_PORT=5173 - export BACKEND_SERVICE_NAME=visualqna - export BACKEND_SERVICE_IP=${ip_address} - export BACKEND_SERVICE_PORT=8888 - export NGINX_PORT=80 - export host_ip=${ip_address} - - sed -i "s/backend_address/$ip_address/g" $WORKPATH/ui/svelte/.env - - # Start Docker Containers - docker compose -f compose_tgi.yaml up -d > ${LOG_PATH}/start_services_with_compose.log - - n=0 - until [[ "$n" -ge 200 ]]; do - docker logs tgi-llava-xeon-server > ${LOG_PATH}/lvm_tgi_service_start.log - if grep -q Connected ${LOG_PATH}/lvm_tgi_service_start.log; then - break - fi - sleep 5s - n=$((n+1)) - done -} - -function validate_services() { - local URL="$1" - local EXPECTED_RESULT="$2" - local SERVICE_NAME="$3" - local DOCKER_NAME="$4" - local INPUT_DATA="$5" - - local HTTP_STATUS=$(curl -s -o /dev/null -w "%{http_code}" -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL") - if [ "$HTTP_STATUS" -eq 200 ]; then - echo "[ $SERVICE_NAME ] HTTP status is 200. Checking content..." - - local CONTENT=$(curl -s -X POST -d "$INPUT_DATA" -H 'Content-Type: application/json' "$URL" | tee ${LOG_PATH}/${SERVICE_NAME}.log) - - if echo "$CONTENT" | grep -q "$EXPECTED_RESULT"; then - echo "[ $SERVICE_NAME ] Content is as expected." - else - echo "[ $SERVICE_NAME ] Content does not match the expected result: $CONTENT" - docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log - exit 1 - fi - else - echo "[ $SERVICE_NAME ] HTTP status is not 200. Received status was $HTTP_STATUS" - docker logs ${DOCKER_NAME} >> ${LOG_PATH}/${SERVICE_NAME}.log - exit 1 - fi - sleep 1s -} - -function validate_microservices() { - sleep 15s - # Check if the microservices are running correctly. - - # lvm microservice - validate_services \ - "${ip_address}:9399/v1/lvm" \ - "The image" \ - "lvm" \ - "lvm-xeon-server" \ - '{"image": "iVBORw0KGgoAAAANSUhEUgAAAAoAAAAKCAYAAACNMs+9AAAAFUlEQVR42mP8/5+hnoEIwDiqkL4KAcT9GO0U4BxoAAAAAElFTkSuQmCC", "prompt":"What is this?"}' -} - -function validate_megaservice() { - sleep 15s - # Curl the Mega Service - validate_services \ - "${ip_address}:8888/v1/visualqna" \ - "The image" \ - "visualqna-xeon-backend-server" \ - "visualqna-xeon-backend-server" \ - '{ - "messages": [ - { - "role": "user", - "content": [ - { - "type": "text", - "text": "What'\''s in this image?" - }, - { - "type": "image_url", - "image_url": { - "url": "https://www.ilankelman.org/stopsigns/australia.jpg" - } - } - ] - } - ], - "max_tokens": 300 - }' - - # test the megeservice via nginx - validate_services \ - "${ip_address}:80/v1/visualqna" \ - "The image" \ - "visualqna-xeon-nginx-server" \ - "visualqna-xeon-nginx-server" \ - '{ - "messages": [ - { - "role": "user", - "content": [ - { - "type": "text", - "text": "What'\''s in this image?" 
- }, - { - "type": "image_url", - "image_url": { - "url": "https://www.ilankelman.org/stopsigns/australia.jpg" - } - } - ] - } - ], - "max_tokens": 300 - }' -} - -function validate_frontend() { - cd $WORKPATH/ui/svelte - local conda_env_name="OPEA_e2e" - export PATH=${HOME}/miniforge3/bin/:$PATH - if conda info --envs | grep -q "$conda_env_name"; then - echo "$conda_env_name exist!" - else - conda create -n ${conda_env_name} python=3.12 -y - fi - source activate ${conda_env_name} - - sed -i "s/localhost/$ip_address/g" playwright.config.ts - - conda install -c conda-forge nodejs=22.6.0 -y - npm install && npm ci && npx playwright install --with-deps - node -v && npm -v && pip list - - exit_status=0 - npx playwright test || exit_status=$? - - if [ $exit_status -ne 0 ]; then - echo "[TEST INFO]: ---------frontend test failed---------" - exit $exit_status - else - echo "[TEST INFO]: ---------frontend test passed---------" - fi -} - -function stop_docker() { - cd $WORKPATH/docker_compose/intel/cpu/xeon/ - docker compose stop && docker compose rm -f -} - -function main() { - - stop_docker - - if [[ "$IMAGE_REPO" == "opea" ]]; then build_docker_images; fi - start_services - - validate_microservices - validate_megaservice - # validate_frontend - - stop_docker - echo y | docker system prune - -} - -main diff --git a/VisualQnA/ui/docker/Dockerfile b/VisualQnA/ui/docker/Dockerfile deleted file mode 100644 index 1d5115f4b5..0000000000 --- a/VisualQnA/ui/docker/Dockerfile +++ /dev/null @@ -1,26 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -# Use node 20.11.1 as the base image -FROM node:20.11.1 - -# Update package manager and install Git -RUN apt-get update -y && apt-get install -y git - -# Copy the front-end code repository -COPY svelte /home/user/svelte - -# Set the working directory -WORKDIR /home/user/svelte - -# Install front-end dependencies -RUN npm install - -# Build the front-end application -RUN npm run build - -# Expose the port of the front-end application -EXPOSE 5173 - -# Run the front-end application in preview mode -CMD ["npm", "run", "preview", "--", "--port", "5173", "--host", "0.0.0.0"] diff --git a/VisualQnA/ui/svelte/.editorconfig b/VisualQnA/ui/svelte/.editorconfig deleted file mode 100644 index 2b7a6637f7..0000000000 --- a/VisualQnA/ui/svelte/.editorconfig +++ /dev/null @@ -1,10 +0,0 @@ -[*] -indent_style = tab - -[package.json] -indent_style = space -indent_size = 2 - -[*.md] -indent_style = space -indent_size = 2 diff --git a/VisualQnA/ui/svelte/.env b/VisualQnA/ui/svelte/.env deleted file mode 100644 index ce3ce40333..0000000000 --- a/VisualQnA/ui/svelte/.env +++ /dev/null @@ -1 +0,0 @@ -BACKEND_BASE_URL = '/v1/visualqna' diff --git a/VisualQnA/ui/svelte/.eslintignore b/VisualQnA/ui/svelte/.eslintignore deleted file mode 100644 index 38972655fa..0000000000 --- a/VisualQnA/ui/svelte/.eslintignore +++ /dev/null @@ -1,13 +0,0 @@ -.DS_Store -node_modules -/build -/.svelte-kit -/package -.env -.env.* -!.env.example - -# Ignore files for PNPM, NPM and YARN -pnpm-lock.yaml -package-lock.json -yarn.lock diff --git a/VisualQnA/ui/svelte/.eslintrc.cjs b/VisualQnA/ui/svelte/.eslintrc.cjs deleted file mode 100644 index a6592d11f7..0000000000 --- a/VisualQnA/ui/svelte/.eslintrc.cjs +++ /dev/null @@ -1,34 +0,0 @@ -// Copyright (c) 2024 Intel Corporation -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. 
-// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -module.exports = { - root: true, - parser: "@typescript-eslint/parser", - extends: ["eslint:recommended", "plugin:@typescript-eslint/recommended", "prettier"], - plugins: ["svelte3", "@typescript-eslint", "neverthrow"], - ignorePatterns: ["*.cjs"], - overrides: [{ files: ["*.svelte"], processor: "svelte3/svelte3" }], - settings: { - "svelte3/typescript": () => require("typescript"), - }, - parserOptions: { - sourceType: "module", - ecmaVersion: 2020, - }, - env: { - browser: true, - es2017: true, - node: true, - }, -}; diff --git a/VisualQnA/ui/svelte/.prettierignore b/VisualQnA/ui/svelte/.prettierignore deleted file mode 100644 index 38972655fa..0000000000 --- a/VisualQnA/ui/svelte/.prettierignore +++ /dev/null @@ -1,13 +0,0 @@ -.DS_Store -node_modules -/build -/.svelte-kit -/package -.env -.env.* -!.env.example - -# Ignore files for PNPM, NPM and YARN -pnpm-lock.yaml -package-lock.json -yarn.lock diff --git a/VisualQnA/ui/svelte/.prettierrc b/VisualQnA/ui/svelte/.prettierrc deleted file mode 100644 index c932dd178f..0000000000 --- a/VisualQnA/ui/svelte/.prettierrc +++ /dev/null @@ -1 +0,0 @@ -{"pluginSearchDirs": ["."], "overrides": [{"files": "*.svelte", "options": {"parser": "svelte"}}]} diff --git a/VisualQnA/ui/svelte/package.json b/VisualQnA/ui/svelte/package.json deleted file mode 100644 index 7f5f496ba5..0000000000 --- a/VisualQnA/ui/svelte/package.json +++ /dev/null @@ -1,62 +0,0 @@ -{ - "name": "visual-qna", - "version": "0.0.1", - "private": true, - "scripts": { - "dev": "vite dev", - "build": "vite build", - "preview": "vite preview", - "check": "svelte-kit sync && svelte-check --tsconfig ./tsconfig.json", - "check:watch": "svelte-kit sync && svelte-check --tsconfig ./tsconfig.json --watch", - "lint": "prettier --check . && eslint .", - "format": "prettier --write ." 
- }, - "peerDependencies": { - "svelte": "^4.0.0" - }, - "devDependencies": { - "@fortawesome/free-solid-svg-icons": "6.2.0", - "@playwright/test": "^1.45.2", - "@sveltejs/adapter-auto": "^3.0.0", - "@sveltejs/kit": "^2.0.0", - "@sveltejs/vite-plugin-svelte": "^3.0.0", - "@tailwindcss/typography": "0.5.7", - "@types/debug": "4.1.7", - "@types/node": "^20.12.13", - "@types/pica": "^9.0.5", - "@typescript-eslint/eslint-plugin": "^5.27.0", - "@typescript-eslint/parser": "^5.27.0", - "autoprefixer": "^10.4.16", - "date-picker-svelte": "^2.6.0", - "debug": "4.3.4", - "postcss": "^8.4.31", - "postcss-load-config": "^4.0.1", - "postcss-preset-env": "^8.3.2", - "prettier": "^2.8.8", - "prettier-plugin-svelte": "^2.7.0", - "prettier-plugin-tailwindcss": "^0.3.0", - "svelte": "^4.2.7", - "svelte-check": "^3.6.0", - "svelte-fa": "3.0.3", - "tailwindcss": "^3.3.6", - "tslib": "^2.4.1", - "typescript": "^5.0.0", - "vite": "^5.0.11" - }, - "type": "module", - "dependencies": { - "date-fns": "^2.30.0", - "driver.js": "^1.3.0", - "flowbite": "^2.5.2", - "flowbite-svelte": "^0.38.5", - "flowbite-svelte-icons": "^1.4.0", - "fuse.js": "^6.6.2", - "lodash": "^4.17.21", - "pica": "^9.0.1", - "playwright": "^1.44.0", - "ramda": "^0.29.0", - "sse.js": "^0.6.1", - "svelte-notifications": "^0.9.98", - "svrollbar": "^0.12.0" - } -} diff --git a/VisualQnA/ui/svelte/playwright.config.ts b/VisualQnA/ui/svelte/playwright.config.ts deleted file mode 100644 index 578a1c2872..0000000000 --- a/VisualQnA/ui/svelte/playwright.config.ts +++ /dev/null @@ -1,54 +0,0 @@ -// Copyright (C) 2024 Intel Corporation -// SPDX-License-Identifier: Apache-2.0 - -import { defineConfig, devices } from "@playwright/test"; - -/** - * Read environment variables from file. - * https://github.com/motdotla/dotenv - */ -// require('dotenv').config(); - -/** - * See https://playwright.dev/docs/test-configuration. - */ -export default defineConfig({ - testDir: "./tests", - /* Maximum time one test can run for. */ - timeout: 30 * 1000, - expect: { - /** - * Maximum time expect() should wait for the condition to be met. - * For example in `await expect(locator).toHaveText();` - */ - timeout: 5000, - }, - /* Run tests in files in parallel */ - fullyParallel: true, - /* Fail the build on CI if you accidentally left test.only in the source code. */ - forbidOnly: !!process.env.CI, - /* Retry on CI only */ - retries: process.env.CI ? 2 : 0, - /* Opt out of parallel tests on CI. */ - workers: process.env.CI ? 1 : undefined, - /* Reporter to use. See https://playwright.dev/docs/test-reporters */ - reporter: [["html", { open: "never" }]], - /* Shared settings for all the projects below. See https://playwright.dev/docs/api/class-testoptions. */ - use: { - /* Maximum time each action such as `click()` can take. Defaults to 0 (no limit). */ - actionTimeout: 0, - /* Base URL to use in actions like `await page.goto('/')`. */ - baseURL: "http://localhost:5173", - - /* Collect trace when retrying the failed test. 
See https://playwright.dev/docs/trace-viewer */ - trace: "on-first-retry", - }, - - /* Configure projects for major browsers */ - projects: [ - { - name: "webkit", - use: { ...devices["Desktop Safari"] }, - }, - ], -}); diff --git a/VisualQnA/ui/svelte/postcss.config.cjs b/VisualQnA/ui/svelte/postcss.config.cjs deleted file mode 100644 index b384b43ebe..0000000000 --- a/VisualQnA/ui/svelte/postcss.config.cjs +++ /dev/null @@ -1,27 +0,0 @@ -// Copyright (c) 2024 Intel Corporation -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -const tailwindcss = require("tailwindcss"); -const autoprefixer = require("autoprefixer"); - -const config = { - plugins: [ - //Some plugins, like tailwindcss/nesting, need to run before Tailwind, - tailwindcss(), - //But others, like autoprefixer, need to run after, - autoprefixer, - ], -}; - -module.exports = config; diff --git a/VisualQnA/ui/svelte/src/app.d.ts b/VisualQnA/ui/svelte/src/app.d.ts deleted file mode 100644 index fa6a0abf77..0000000000 --- a/VisualQnA/ui/svelte/src/app.d.ts +++ /dev/null @@ -1,19 +0,0 @@ -// Copyright (c) 2024 Intel Corporation -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -// See: https://kit.svelte.dev/docs/types#app -// import { Result} from "neverthrow"; -interface Window { - deviceType: string; -} diff --git a/VisualQnA/ui/svelte/src/app.html b/VisualQnA/ui/svelte/src/app.html deleted file mode 100644 index db69926ea8..0000000000 --- a/VisualQnA/ui/svelte/src/app.html +++ /dev/null @@ -1,28 +0,0 @@ - - - - - - - - - %sveltekit.head% - - -
%sveltekit.body%
- - diff --git a/VisualQnA/ui/svelte/src/app.postcss b/VisualQnA/ui/svelte/src/app.postcss deleted file mode 100644 index 963bbca4ef..0000000000 --- a/VisualQnA/ui/svelte/src/app.postcss +++ /dev/null @@ -1,86 +0,0 @@ -/* Write your global styles here, in PostCSS syntax */ -@tailwind base; -@tailwind components; -@tailwind utilities; - -html, body { - height: 100%; -} - -.btn { - @apply flex-nowrap; -} -a.btn { - @apply no-underline; -} -.input { - @apply text-base; -} - -.bg-dark-blue { - background-color: #004a86; -} - -.bg-light-blue { - background-color: #0068b5; -} - -.bg-turquoise { - background-color: #00a3f6; -} - -.bg-header { - background-color: #ffffff; -} - -.bg-button { - background-color: #0068b5; -} - -.bg-title { - background-color: #f7f7f7; -} - -.text-header { - color: #0068b5; -} - -.text-button { - color: #252e47; -} - -.text-title-color { - color: rgb(38,38,38); -} - -.font-intel { - font-family: "intel-clear","tahoma",Helvetica,"helvetica",Arial,sans-serif; -} - -.font-title-intel { - font-family: "intel-one","intel-clear",Helvetica,Arial,sans-serif; -} - -.bg-footer { - background-color: #e7e7e7; -} - -.bg-light-green { - background-color: #d7f3a1; -} - -.bg-purple { - background-color: #653171; -} - -.bg-dark-blue { - background-color: #224678; -} - -.border-input-color { - border-color: #605e5c; -} - -.w-12\/12 { - width: 100% -} diff --git a/VisualQnA/ui/svelte/src/lib/assets/avatar/svelte/Delete.svelte b/VisualQnA/ui/svelte/src/lib/assets/avatar/svelte/Delete.svelte deleted file mode 100644 index 8847a22275..0000000000 --- a/VisualQnA/ui/svelte/src/lib/assets/avatar/svelte/Delete.svelte +++ /dev/null @@ -1,30 +0,0 @@ - - - - - - { - dispatch('DeleteAvatar') }} -viewBox="0 0 1024 1024" version="1.1" xmlns="http://www.w3.org/2000/svg" width="20" height="20"> - - diff --git a/VisualQnA/ui/svelte/src/lib/assets/chat/svelte/Assistant.svelte b/VisualQnA/ui/svelte/src/lib/assets/chat/svelte/Assistant.svelte deleted file mode 100644 index b68d2a08cd..0000000000 --- a/VisualQnA/ui/svelte/src/lib/assets/chat/svelte/Assistant.svelte +++ /dev/null @@ -1,44 +0,0 @@ - - - diff --git a/VisualQnA/ui/svelte/src/lib/assets/chat/svelte/PaperAirplane.svelte b/VisualQnA/ui/svelte/src/lib/assets/chat/svelte/PaperAirplane.svelte deleted file mode 100644 index d1d14077f2..0000000000 --- a/VisualQnA/ui/svelte/src/lib/assets/chat/svelte/PaperAirplane.svelte +++ /dev/null @@ -1,68 +0,0 @@ - - - - - - - - diff --git a/VisualQnA/ui/svelte/src/lib/assets/chat/svelte/PersonOutlined.svelte b/VisualQnA/ui/svelte/src/lib/assets/chat/svelte/PersonOutlined.svelte deleted file mode 100644 index dd2f9fdb78..0000000000 --- a/VisualQnA/ui/svelte/src/lib/assets/chat/svelte/PersonOutlined.svelte +++ /dev/null @@ -1,26 +0,0 @@ - - - - - diff --git a/VisualQnA/ui/svelte/src/lib/assets/header/intelLogo.svelte b/VisualQnA/ui/svelte/src/lib/assets/header/intelLogo.svelte deleted file mode 100644 index 50039d5b37..0000000000 --- a/VisualQnA/ui/svelte/src/lib/assets/header/intelLogo.svelte +++ /dev/null @@ -1,49 +0,0 @@ - - - - - - - - - diff --git a/VisualQnA/ui/svelte/src/lib/assets/imageData/extreme_ironing.png b/VisualQnA/ui/svelte/src/lib/assets/imageData/extreme_ironing.png deleted file mode 100644 index 93ef4b7961..0000000000 Binary files a/VisualQnA/ui/svelte/src/lib/assets/imageData/extreme_ironing.png and /dev/null differ diff --git a/VisualQnA/ui/svelte/src/lib/assets/imageData/waterview.png b/VisualQnA/ui/svelte/src/lib/assets/imageData/waterview.png deleted file mode 100644 index 
d5562df1d0..0000000000 Binary files a/VisualQnA/ui/svelte/src/lib/assets/imageData/waterview.png and /dev/null differ diff --git a/VisualQnA/ui/svelte/src/lib/assets/layout/css/driver.css b/VisualQnA/ui/svelte/src/lib/assets/layout/css/driver.css deleted file mode 100644 index 453db6082a..0000000000 --- a/VisualQnA/ui/svelte/src/lib/assets/layout/css/driver.css +++ /dev/null @@ -1,94 +0,0 @@ -.driverjs-theme { - background: transparent; - color: #fff; - box-shadow: none; - padding: 0; -} - -.driver-popover-arrow { - border: 10px solid transparent; - animation: blink 1s 3 steps(1); -} - -@keyframes blink { - 0% { - opacity: 1; - } - 50% { - opacity: 0.2; - } - 100% { - opacity: 1; - } -} - -.driver-popover.driverjs-theme .driver-popover-arrow-side-left.driver-popover-arrow { - border-left-color: #174ed1; -} - -.driver-popover.driverjs-theme .driver-popover-arrow-side-right.driver-popover-arrow { - border-right-color: #174ed1; -} - -.driver-popover.driverjs-theme .driver-popover-arrow-side-top.driver-popover-arrow { - border-top-color: #174ed1; -} - -.driver-popover.driverjs-theme .driver-popover-arrow-side-bottom.driver-popover-arrow { - border-bottom-color: #174ed1; -} - -.driver-popover-footer { - background: transparent; - color: #fff; -} -.driver-popover-title { - border-top-left-radius: 5px; - border-top-right-radius: 5px; -} - -.driver-popover-title, -.driver-popover-description { - display: block; - padding: 15px 15px 7px 15px; - background: #174ed1; - border: none; -} - -.driver-popover-close-btn { - color: #fff; -} - -.driver-popover-footer button:hover, -.driver-popover-footer button:focus { - background: #174ed1; - color: #fff; -} - -.driver-popover-description { - padding: 5px 15px; - border-bottom-left-radius: 5px; - border-bottom-right-radius: 5px; -} - -.driver-popover-title[style*="block"] + .driver-popover-description { - margin: 0; -} -.driver-popover-progress-text { - color: #fff; -} - -.driver-popover-footer button { - background: #174ed1; - border: 2px #174ed1 dashed; - color: #fff; - border-radius: 50%; - text-shadow: none; -} -.driver-popover-close-btn:hover, -.driver-popover-close-btn:focus { - color: #fff; -} -.driver-popover-navigation-btns button + button { - margin-left: 10px; -} diff --git a/VisualQnA/ui/svelte/src/lib/assets/upload/help.svelte b/VisualQnA/ui/svelte/src/lib/assets/upload/help.svelte deleted file mode 100644 index adccf7bb56..0000000000 --- a/VisualQnA/ui/svelte/src/lib/assets/upload/help.svelte +++ /dev/null @@ -1,24 +0,0 @@ - - - diff --git a/VisualQnA/ui/svelte/src/lib/assets/upload/next.svelte b/VisualQnA/ui/svelte/src/lib/assets/upload/next.svelte deleted file mode 100644 index 70f4fe25e8..0000000000 --- a/VisualQnA/ui/svelte/src/lib/assets/upload/next.svelte +++ /dev/null @@ -1,31 +0,0 @@ - - - diff --git a/VisualQnA/ui/svelte/src/lib/assets/upload/previous.svelte b/VisualQnA/ui/svelte/src/lib/assets/upload/previous.svelte deleted file mode 100644 index c47d9c49da..0000000000 --- a/VisualQnA/ui/svelte/src/lib/assets/upload/previous.svelte +++ /dev/null @@ -1,31 +0,0 @@ - - - diff --git a/VisualQnA/ui/svelte/src/lib/assets/voice/svg/paste.svg b/VisualQnA/ui/svelte/src/lib/assets/voice/svg/paste.svg deleted file mode 100644 index 8910f0ea64..0000000000 --- a/VisualQnA/ui/svelte/src/lib/assets/voice/svg/paste.svg +++ /dev/null @@ -1 +0,0 @@ - diff --git a/VisualQnA/ui/svelte/src/lib/assets/voice/svg/uploadFile.svg b/VisualQnA/ui/svelte/src/lib/assets/voice/svg/uploadFile.svg deleted file mode 100644 index 9a77286a8f..0000000000 --- 
a/VisualQnA/ui/svelte/src/lib/assets/voice/svg/uploadFile.svg +++ /dev/null @@ -1 +0,0 @@ - diff --git a/VisualQnA/ui/svelte/src/lib/modules/chat/ChatMessage.svelte b/VisualQnA/ui/svelte/src/lib/modules/chat/ChatMessage.svelte deleted file mode 100644 index 720908163b..0000000000 --- a/VisualQnA/ui/svelte/src/lib/modules/chat/ChatMessage.svelte +++ /dev/null @@ -1,76 +0,0 @@ - - - - -
-
- -
-
-
- {#if msg.imgSrc} - Uploaded Image - {/if} -

- {@html msg.content} -

-
-
-
-{#if time} -
- { - dispatch("scrollTop"); - }} - /> -
-{/if} - - diff --git a/VisualQnA/ui/svelte/src/lib/modules/chat/MessageAvatar.svelte b/VisualQnA/ui/svelte/src/lib/modules/chat/MessageAvatar.svelte deleted file mode 100644 index 0f6a24b96d..0000000000 --- a/VisualQnA/ui/svelte/src/lib/modules/chat/MessageAvatar.svelte +++ /dev/null @@ -1,30 +0,0 @@ - - - - -{#if role === MessageRole.User} - -{:else} - -{/if} diff --git a/VisualQnA/ui/svelte/src/lib/modules/chat/MessageTimer.svelte b/VisualQnA/ui/svelte/src/lib/modules/chat/MessageTimer.svelte deleted file mode 100644 index 9416cc8795..0000000000 --- a/VisualQnA/ui/svelte/src/lib/modules/chat/MessageTimer.svelte +++ /dev/null @@ -1,68 +0,0 @@ - - - - -
-
-
- - { - dispatch("handleTop"); - }} - > -
-
-
- -
-
- End to End Time: -

{time}s

-
-
-
-
diff --git a/VisualQnA/ui/svelte/src/lib/modules/frame/Layout.svelte b/VisualQnA/ui/svelte/src/lib/modules/frame/Layout.svelte deleted file mode 100644 index 0c5b997d28..0000000000 --- a/VisualQnA/ui/svelte/src/lib/modules/frame/Layout.svelte +++ /dev/null @@ -1,48 +0,0 @@ - - - - -
-
-
- - - -
-
-
diff --git a/VisualQnA/ui/svelte/src/lib/modules/upload/imagePrompt.svelte b/VisualQnA/ui/svelte/src/lib/modules/upload/imagePrompt.svelte deleted file mode 100644 index 90e55bff96..0000000000 --- a/VisualQnA/ui/svelte/src/lib/modules/upload/imagePrompt.svelte +++ /dev/null @@ -1,102 +0,0 @@ - - - - -
-

Example

-
- - -
- {images[currentIndex].alt} -
-

{images[currentIndex].prompt}

-
-
- - -
-
- - diff --git a/VisualQnA/ui/svelte/src/lib/modules/upload/upload.svelte b/VisualQnA/ui/svelte/src/lib/modules/upload/upload.svelte deleted file mode 100644 index 5347d6bd77..0000000000 --- a/VisualQnA/ui/svelte/src/lib/modules/upload/upload.svelte +++ /dev/null @@ -1,32 +0,0 @@ - - - - -
-

Upload Images

- -
or -
- - - - -
-

Parameters

- -

Max output tokens: {stepValue}

-
diff --git a/VisualQnA/ui/svelte/src/lib/modules/upload/uploadImg.svelte b/VisualQnA/ui/svelte/src/lib/modules/upload/uploadImg.svelte deleted file mode 100644 index 9fcf6eefcc..0000000000 --- a/VisualQnA/ui/svelte/src/lib/modules/upload/uploadImg.svelte +++ /dev/null @@ -1,168 +0,0 @@ - - - - - { - event.preventDefault(); - }} - on:change={handleChange} -> - {#if value.length === 0 && !imageUrl} - -

- Click to upload or drag and drop -

-

- SVG, PNG, JPG -

- {:else if imageUrl} - Uploaded Image - {/if} -
diff --git a/VisualQnA/ui/svelte/src/lib/network/chat/Network.ts b/VisualQnA/ui/svelte/src/lib/network/chat/Network.ts deleted file mode 100644 index 8a78c0cda8..0000000000 --- a/VisualQnA/ui/svelte/src/lib/network/chat/Network.ts +++ /dev/null @@ -1,52 +0,0 @@ -// Copyright (c) 2024 Intel Corporation -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -import { env } from "$env/dynamic/public"; -import { SSE } from "sse.js"; - -const BACKEND_BASE_URL = env.BACKEND_BASE_URL; - -export async function fetchTextStream(query: string, stepValueStore: number, base64ImageStore: string) { - let payload = {}; - let url = ""; - base64ImageStore = base64ImageStore.replace(/^data:[a-zA-Z]+\/[a-zA-Z]+;base64,/, ""); - - payload = { - messages: [ - { - role: "user", - content: [ - { - type: "text", - text: query, - }, - { - type: "image_url", - image_url: { url: base64ImageStore }, - }, - ], - }, - ], - max_tokens: stepValueStore, - stream: true, - }; - console.log("payload", payload); - - url = `${BACKEND_BASE_URL}`; - - return new SSE(url, { - headers: { "Content-Type": "application/json" }, - payload: JSON.stringify(payload), - }); -} diff --git a/VisualQnA/ui/svelte/src/lib/network/upload/Network.ts b/VisualQnA/ui/svelte/src/lib/network/upload/Network.ts deleted file mode 100644 index 284494f851..0000000000 --- a/VisualQnA/ui/svelte/src/lib/network/upload/Network.ts +++ /dev/null @@ -1,57 +0,0 @@ -// Copyright (c) 2024 Intel Corporation -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. 
- -import { env } from "$env/dynamic/public"; - -const BACKEND_BASE_URL = env.BACKEND_BASE_URL; - -export async function fetchKnowledgeBaseId(file: Blob, fileName: string) { - const url = `${BACKEND_BASE_URL}/create`; - const formData = new FormData(); - formData.append("file", file, fileName); - const init: RequestInit = { - method: "POST", - body: formData, - }; - - try { - const response = await fetch(url, init); - if (!response.ok) throw response.status; - return await response.json(); - } catch (error) { - console.error("network error: ", error); - return undefined; - } -} - -export async function fetchKnowledgeBaseIdByPaste(pasteUrlList: any, urlType: string | undefined) { - const url = `${BACKEND_BASE_URL}/upload_link`; - const data = { - link_list: pasteUrlList, - }; - const init: RequestInit = { - method: "POST", - headers: { "Content-Type": "application/json" }, - body: JSON.stringify(data), - }; - - try { - const response = await fetch(url, init); - if (!response.ok) throw response.status; - return await response.json(); - } catch (error) { - console.error("network error: ", error); - return undefined; - } -} diff --git a/VisualQnA/ui/svelte/src/lib/shared/Utils.ts b/VisualQnA/ui/svelte/src/lib/shared/Utils.ts deleted file mode 100644 index fb182cef67..0000000000 --- a/VisualQnA/ui/svelte/src/lib/shared/Utils.ts +++ /dev/null @@ -1,54 +0,0 @@ -// Copyright (c) 2024 Intel Corporation -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -export function scrollToBottom(scrollToDiv: HTMLElement) { - if (scrollToDiv) { - setTimeout( - () => - scrollToDiv.scroll({ - behavior: "auto", - top: scrollToDiv.scrollHeight, - }), - 100, - ); - } -} - -export function scrollToTop(scrollToDiv: HTMLElement) { - if (scrollToDiv) { - setTimeout( - () => - scrollToDiv.scroll({ - behavior: "auto", - top: 0, - }), - 100, - ); - } -} - -export function getCurrentTimeStamp() { - return Math.floor(new Date().getTime()); -} - -export function fromTimeStampToTime(timeStamp: number) { - return new Date(timeStamp * 1000).toTimeString().slice(0, 8); -} - -export function formatTime(seconds) { - const hours = String(Math.floor(seconds / 3600)).padStart(2, "0"); - const minutes = String(Math.floor((seconds % 3600) / 60)).padStart(2, "0"); - const remainingSeconds = String(seconds % 60).padStart(2, "0"); - return `${hours}:${minutes}:${remainingSeconds}`; -} diff --git a/VisualQnA/ui/svelte/src/lib/shared/components/header/header.svelte b/VisualQnA/ui/svelte/src/lib/shared/components/header/header.svelte deleted file mode 100644 index c851dec988..0000000000 --- a/VisualQnA/ui/svelte/src/lib/shared/components/header/header.svelte +++ /dev/null @@ -1,33 +0,0 @@ - - - -
- -
diff --git a/VisualQnA/ui/svelte/src/lib/shared/components/loading/Loading.svelte b/VisualQnA/ui/svelte/src/lib/shared/components/loading/Loading.svelte deleted file mode 100644 index 51e89cfe7e..0000000000 --- a/VisualQnA/ui/svelte/src/lib/shared/components/loading/Loading.svelte +++ /dev/null @@ -1,48 +0,0 @@ - - -
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
diff --git a/VisualQnA/ui/svelte/src/lib/shared/components/scrollbar/Scrollbar.svelte b/VisualQnA/ui/svelte/src/lib/shared/components/scrollbar/Scrollbar.svelte deleted file mode 100644 index f18e23e690..0000000000 --- a/VisualQnA/ui/svelte/src/lib/shared/components/scrollbar/Scrollbar.svelte +++ /dev/null @@ -1,48 +0,0 @@ - - - - -
- -
- -
-
-
diff --git a/VisualQnA/ui/svelte/src/lib/shared/constant/Interface.ts b/VisualQnA/ui/svelte/src/lib/shared/constant/Interface.ts deleted file mode 100644 index c461e2b791..0000000000 --- a/VisualQnA/ui/svelte/src/lib/shared/constant/Interface.ts +++ /dev/null @@ -1,48 +0,0 @@
-// Copyright (c) 2024 Intel Corporation
-//
-// Licensed under the Apache License, Version 2.0 (the "License");
-// you may not use this file except in compliance with the License.
-// You may obtain a copy of the License at
-//
-// http://www.apache.org/licenses/LICENSE-2.0
-//
-// Unless required by applicable law or agreed to in writing, software
-// distributed under the License is distributed on an "AS IS" BASIS,
-// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-// See the License for the specific language governing permissions and
-// limitations under the License.
-
-export enum MessageRole {
-  Assistant,
-  User,
-}
-
-export enum MessageType {
-  Text,
-  SingleAudio,
-  AudioList,
-  SingleImage,
-  ImageList,
-  singleVideo,
-}
-
-type Map<T> = T extends MessageType.Text | MessageType.SingleAudio
-  ? string
-  : T extends MessageType.AudioList
-    ? string[]
-    : T extends MessageType.SingleImage
-      ? { imgSrc: string; imgId: string }
-      : { imgSrc: string; imgId: string }[];
-
-export interface Message {
-  imgSrc: string | null | undefined;
-  role: MessageRole;
-  type: MessageType;
-  content: Map<MessageType>;
-  time: number;
-}
-
-export enum LOCAL_STORAGE_KEY {
-  STORAGE_CHAT_KEY = "chatMessages",
-  STORAGE_TIME_KEY = "initTime",
-}
diff --git a/VisualQnA/ui/svelte/src/lib/shared/stores/common/Store.ts b/VisualQnA/ui/svelte/src/lib/shared/stores/common/Store.ts deleted file mode 100644 index 88a581ab68..0000000000 --- a/VisualQnA/ui/svelte/src/lib/shared/stores/common/Store.ts +++ /dev/null @@ -1,45 +0,0 @@
-// Copyright (c) 2024 Intel Corporation
-//
-// Licensed under the Apache License, Version 2.0 (the "License");
-// you may not use this file except in compliance with the License.
-// You may obtain a copy of the License at
-//
-// http://www.apache.org/licenses/LICENSE-2.0
-//
-// Unless required by applicable law or agreed to in writing, software
-// distributed under the License is distributed on an "AS IS" BASIS,
-// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-// See the License for the specific language governing permissions and
-// limitations under the License.
-
-import { writable } from "svelte/store";
-
-export let open = writable(true);
-
-export let knowledgeAccess = writable(true);
-
-export let showTemplate = writable(false);
-
-export let showSidePage = writable(false);
-
-export let droppedObj = writable({});
-
-export let isLoading = writable(false);
-
-export let newUploadNum = writable(0);
-
-export let ifStoreMsg = writable(true);
-
-export let isCheckedStore = writable(false);
-
-export const resetControl = writable(false);
-
-export const knowledge1 = writable<{
-  id: string;
-}>();
-
-export const knowledgeName = writable("");
-
-export const base64ImageStore = writable("");
-
-export const stepValueStore = writable(512);
diff --git a/VisualQnA/ui/svelte/src/routes/+layout.svelte b/VisualQnA/ui/svelte/src/routes/+layout.svelte deleted file mode 100644 index 8141177d4a..0000000000 --- a/VisualQnA/ui/svelte/src/routes/+layout.svelte +++ /dev/null @@ -1,48 +0,0 @@
(The 48-line Svelte layout component is deleted in full; its markup is not reproduced here.)
diff --git a/VisualQnA/ui/svelte/src/routes/+page.svelte b/VisualQnA/ui/svelte/src/routes/+page.svelte deleted file mode 100644 index 4dd3e6efda..0000000000 --- a/VisualQnA/ui/svelte/src/routes/+page.svelte +++ /dev/null @@ -1,279 +0,0 @@
(The 279-line chat page component is deleted in full. Only fragments of its markup survive in this excerpt: an Enter-to-submit keydown handler that calls handleTextSubmit(), a block rendered when chatMessages is non-empty and not loading, a loading indicator, and an {#each chatMessages} loop that renders each message with its timing. The complete markup is not reproduced here.)
- - diff --git a/VisualQnA/ui/svelte/src/routes/+page.ts b/VisualQnA/ui/svelte/src/routes/+page.ts deleted file mode 100644 index f4de8d6760..0000000000 --- a/VisualQnA/ui/svelte/src/routes/+page.ts +++ /dev/null @@ -1,26 +0,0 @@ -// Copyright (c) 2024 Intel Corporation -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -import { browser } from "$app/environment"; -import { LOCAL_STORAGE_KEY } from "$lib/shared/constant/Interface"; - -export const load = async () => { - if (browser) { - const chat = localStorage.getItem(LOCAL_STORAGE_KEY.STORAGE_CHAT_KEY); - - return { - chatMsg: JSON.parse(chat || "[]"), - }; - } -}; diff --git a/VisualQnA/ui/svelte/static/favicon.png b/VisualQnA/ui/svelte/static/favicon.png deleted file mode 100644 index 75b997f815..0000000000 Binary files a/VisualQnA/ui/svelte/static/favicon.png and /dev/null differ diff --git a/VisualQnA/ui/svelte/svelte.config.js b/VisualQnA/ui/svelte/svelte.config.js deleted file mode 100644 index 0f2977ecce..0000000000 --- a/VisualQnA/ui/svelte/svelte.config.js +++ /dev/null @@ -1,38 +0,0 @@ -// Copyright (c) 2024 Intel Corporation -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -import adapter from "@sveltejs/adapter-auto"; -import preprocess from "svelte-preprocess"; -import postcssPresetEnv from "postcss-preset-env"; - -/** @type {import('@sveltejs/kit').Config} */ -const config = { - // Consult https://github.com/sveltejs/svelte-preprocess - // for more information about preprocessors - preprocess: preprocess({ - sourceMap: true, - postcss: { - plugins: [postcssPresetEnv({ features: { "nesting-rules": true } })], - }, - }), - - kit: { - adapter: adapter(), - env: { - publicPrefix: "", - }, - }, -}; - -export default config; diff --git a/VisualQnA/ui/svelte/tailwind.config.cjs b/VisualQnA/ui/svelte/tailwind.config.cjs deleted file mode 100644 index 6cc3a8b951..0000000000 --- a/VisualQnA/ui/svelte/tailwind.config.cjs +++ /dev/null @@ -1,43 +0,0 @@ -// Copyright (c) 2024 Intel Corporation -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
-// See the License for the specific language governing permissions and -// limitations under the License. - -const config = { - content: ["./src/**/*.{html,js,svelte,ts}", "./node_modules/flowbite-svelte/**/*.{html,js,svelte,ts}"], - - plugins: [require("flowbite/plugin")], - - darkMode: "class", - - theme: { - extend: { - colors: { - // flowbite-svelte - primary: { - 50: "#FFF5F2", - 100: "#FFF1EE", - 200: "#FFE4DE", - 300: "#FFD5CC", - 400: "#FFBCAD", - 500: "#FE795D", - 600: "#EF562F", - 700: "#EB4F27", - 800: "#CC4522", - 900: "#A5371B", - }, - }, - }, - }, -}; - -module.exports = config; diff --git a/VisualQnA/ui/svelte/tsconfig.json b/VisualQnA/ui/svelte/tsconfig.json deleted file mode 100644 index 0f47472f79..0000000000 --- a/VisualQnA/ui/svelte/tsconfig.json +++ /dev/null @@ -1,13 +0,0 @@ -{ - "extends": "./.svelte-kit/tsconfig.json", - "compilerOptions": { - "allowJs": true, - "checkJs": true, - "esModuleInterop": true, - "forceConsistentCasingInFileNames": true, - "resolveJsonModule": true, - "skipLibCheck": true, - "sourceMap": true, - "strict": true - } -} diff --git a/VisualQnA/ui/svelte/vite.config.ts b/VisualQnA/ui/svelte/vite.config.ts deleted file mode 100644 index d095cbdcb6..0000000000 --- a/VisualQnA/ui/svelte/vite.config.ts +++ /dev/null @@ -1,24 +0,0 @@ -// Copyright (c) 2024 Intel Corporation -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. 
- -import { sveltekit } from "@sveltejs/kit/vite"; -import type { UserConfig } from "vite"; - -const config: UserConfig = { - plugins: [sveltekit()], - server: { - allowedHosts: true, - }, -}; -export default config; diff --git a/VisualQnA/visualqna.py b/VisualQnA/visualqna.py deleted file mode 100644 index 6d7fae1540..0000000000 --- a/VisualQnA/visualqna.py +++ /dev/null @@ -1,98 +0,0 @@ -# Copyright (C) 2024 Intel Corporation -# SPDX-License-Identifier: Apache-2.0 - -import os - -from comps import MegaServiceEndpoint, MicroService, ServiceOrchestrator, ServiceRoleType, ServiceType -from comps.cores.mega.utils import handle_message -from comps.cores.proto.api_protocol import ( - ChatCompletionRequest, - ChatCompletionResponse, - ChatCompletionResponseChoice, - ChatMessage, - UsageInfo, -) -from comps.cores.proto.docarray import LLMParams -from fastapi import Request -from fastapi.responses import StreamingResponse - -MEGA_SERVICE_PORT = int(os.getenv("MEGA_SERVICE_PORT", 8888)) -LVM_SERVICE_HOST_IP = os.getenv("LVM_SERVICE_HOST_IP", "0.0.0.0") -LVM_SERVICE_PORT = int(os.getenv("LLM_SERVICE_PORT", 9399)) - - -class VisualQnAService: - def __init__(self, host="0.0.0.0", port=8000): - self.host = host - self.port = port - self.megaservice = ServiceOrchestrator() - self.endpoint = str(MegaServiceEndpoint.VISUAL_QNA) - - def add_remote_service(self): - llm = MicroService( - name="lvm", - host=LVM_SERVICE_HOST_IP, - port=LVM_SERVICE_PORT, - endpoint="/v1/lvm", - use_remote_service=True, - service_type=ServiceType.LVM, - ) - self.megaservice.add(llm) - - async def handle_request(self, request: Request): - data = await request.json() - stream_opt = data.get("stream", False) - chat_request = ChatCompletionRequest.parse_obj(data) - prompt, images = handle_message(chat_request.messages) - parameters = LLMParams( - max_new_tokens=chat_request.max_tokens if chat_request.max_tokens else 1024, - top_k=chat_request.top_k if chat_request.top_k else 10, - top_p=chat_request.top_p if chat_request.top_p else 0.95, - temperature=chat_request.temperature if chat_request.temperature else 0.01, - frequency_penalty=chat_request.frequency_penalty if chat_request.frequency_penalty else 0.0, - presence_penalty=chat_request.presence_penalty if chat_request.presence_penalty else 0.0, - repetition_penalty=chat_request.repetition_penalty if chat_request.repetition_penalty else 1.03, - stream=stream_opt, - ) - result_dict, runtime_graph = await self.megaservice.schedule( - initial_inputs={"prompt": prompt, "image": images[0]}, llm_parameters=parameters - ) - for node, response in result_dict.items(): - # Here it suppose the last microservice in the megaservice is LVM. 
- if ( - isinstance(response, StreamingResponse) - and node == list(self.megaservice.services.keys())[-1] - and self.megaservice.services[node].service_type == ServiceType.LVM - ): - return response - last_node = runtime_graph.all_leaves()[-1] - response = result_dict[last_node]["text"] - choices = [] - usage = UsageInfo() - choices.append( - ChatCompletionResponseChoice( - index=0, - message=ChatMessage(role="assistant", content=response), - finish_reason="stop", - ) - ) - return ChatCompletionResponse(model="visualqna", choices=choices, usage=usage) - - def start(self): - self.service = MicroService( - self.__class__.__name__, - service_role=ServiceRoleType.MEGASERVICE, - host=self.host, - port=self.port, - endpoint=self.endpoint, - input_datatype=ChatCompletionRequest, - output_datatype=ChatCompletionResponse, - ) - self.service.add_route(self.endpoint, self.handle_request, methods=["POST"]) - self.service.start() - - -if __name__ == "__main__": - visualqna = VisualQnAService(port=MEGA_SERVICE_PORT) - visualqna.add_remote_service() - visualqna.start()