Skip to content

Commit fc7c3a7

Browse files
committed
sync with ec-rag 25.09
Signed-off-by: Yongbozzz <yongbo.zhu@intel.com>
1 parent 385b2d5 commit fc7c3a7

51 files changed

Lines changed: 1155 additions & 730 deletions

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

EdgeCraftRAG/Dockerfile.server

Lines changed: 16 additions & 27 deletions
Original file line numberDiff line numberDiff line change
@@ -1,49 +1,38 @@
11
FROM python:3.11-slim
22

33
SHELL ["/bin/bash", "-o", "pipefail", "-c"]
4-
5-
RUN apt-get update -y && apt-get install -y --no-install-recommends --fix-missing \
6-
libjemalloc-dev \
7-
libmagic1 \
8-
libglib2.0-0 \
9-
poppler-utils \
10-
tesseract-ocr
11-
12-
RUN apt-get update && apt-get install -y gnupg wget git
13-
RUN wget -qO - https://repositories.intel.com/gpu/intel-graphics.key | \
14-
gpg --yes --dearmor --output /usr/share/keyrings/intel-graphics.gpg
15-
RUN echo "deb [arch=amd64,i386 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy client" | \
16-
tee /etc/apt/sources.list.d/intel-gpu-jammy.list
17-
RUN apt-get update && apt-get install -y \
18-
intel-opencl-icd intel-level-zero-gpu \
19-
intel-level-zero-gpu-raytracing \
20-
intel-media-va-driver-non-free libmfx1 libmfxgen1 libvpl2 \
21-
libegl-mesa0 libegl1-mesa libegl1-mesa-dev libgbm1 libgl1-mesa-dev libgl1-mesa-dri \
22-
libglapi-mesa libgles2-mesa-dev libglx-mesa0 libigdgmm12 libxatracker2 mesa-va-drivers \
23-
mesa-vdpau-drivers mesa-vulkan-drivers va-driver-all vainfo hwinfo clinfo
4+
RUN apt-get update && apt-get install -y gnupg2 wget git
5+
RUN apt-get remove -y libze-intel-gpu1 libigc1 libigdfcl1 libze-dev || true; \
6+
   apt-get update; \
7+
   apt-get install -y curl
8+
RUN curl -sL 'https://keyserver.ubuntu.com/pks/lookup?fingerprint=on&op=get&search=0x0C0E6AF955CE463C03FC51574D098D70AFBE5E1F' | tee /etc/apt/trusted.gpg.d/driver.asc
9+
RUN echo -e "Types: deb\nURIs: https://ppa.launchpadcontent.net/kobuk-team/intel-graphics/ubuntu/\nSuites: plucky\nComponents: main\nSigned-By: /etc/apt/trusted.gpg.d/driver.asc" > /etc/apt/sources.list.d/driver.sources
10+
RUN apt-get update && apt-get install -y libze-intel-gpu1 libze1 intel-metrics-discovery intel-opencl-icd clinfo intel-gsc && apt-get install -y libze-dev intel-ocloc libze-intel-gpu-raytracing
2411

2512
RUN useradd -m -s /bin/bash user && \
26-
mkdir -p /home/user && \
27-
chown -R user /home/user/
13+
   mkdir -p /home/user && \
14+
   chown -R user /home/user/
2815

2916
RUN mkdir /templates && \
30-
chown -R user /templates
17+
   chown -R user /templates
3118
COPY ./edgecraftrag/prompt_template/default_prompt.txt /templates/
3219
RUN chown -R user /templates/default_prompt.txt
3320

3421
COPY ./edgecraftrag /home/user/edgecraftrag
3522

36-
RUN mkdir -p /home/user/ui_cache
23+
RUN mkdir -p /home/user/ui_cache
3724
ENV UI_UPLOAD_PATH=/home/user/ui_cache
3825

3926
USER user
4027

4128
WORKDIR /home/user/edgecraftrag
42-
RUN pip install --no-cache-dir --upgrade pip setuptools==70.0.0 && \
43-
pip install --no-cache-dir --extra-index-url https://download.pytorch.org/whl/cpu -r requirements.txt
29+
RUN pip3 install --no-cache-dir --upgrade setuptools==70.0.0 --break-system-packages && \
30+
   pip3 install --no-cache-dir --extra-index-url https://download.pytorch.org/whl/cpu -r requirements.txt --break-system-packages
31+
32+
RUN pip3 install --no-cache-dir docarray==0.40.0 --break-system-packages
4433

4534
WORKDIR /home/user/
4635
RUN git clone https://github.com/openvinotoolkit/openvino.genai.git genai
4736
ENV PYTHONPATH="$PYTHONPATH:/home/user/genai/tools/llm_bench"
4837

49-
ENTRYPOINT ["python", "-m", "edgecraftrag.server"]
38+
ENTRYPOINT ["python3", "-m", "edgecraftrag.server"]

EdgeCraftRAG/docker_compose/intel/gpu/arc/README.md

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -95,8 +95,7 @@ For more advanced env variables and configurations, please refer to [Prepare env
9595

9696
### 5. Deploy the Service on Intel GPU Using Docker Compose
9797

98-
set Milvus DB and chat history round for inference:
99-
98+
set Milvus DB and chat history round for inference:
10099
```bash
101100
# EC-RAG support Milvus as persistent database, by default milvus is disabled, you can choose to set MILVUS_ENABLED=1 to enable it
102101
export MILVUS_ENABLED=0
@@ -124,7 +123,7 @@ docker compose -f docker_compose/intel/gpu/arc/compose_vllm.yaml up -d
124123
#### option b. Deploy the Service on Arc B60 Using Docker Compose
125124

126125
```bash
127-
# Besides MILVUS_ENABLED and CHAT_HISTORY_ROUND, below environments are exposed for vLLM config, you can change them to your preference:
126+
# Besides MILVUS_ENABLED and CHAT_HISTORY_ROUND, below environments are exposed for vLLM config, you can change them to your preference:
128127
# export VLLM_SERVICE_PORT_B60=8086
129128
# export DTYPE=float16
130129
# export TP=1 # for multi GPU, you can change TP value

EdgeCraftRAG/docker_compose/intel/gpu/arc/compose_vllm_b60.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -183,4 +183,4 @@ services:
183183
-dp=$${DP}"
184184
networks:
185185
default:
186-
driver: bridge
186+
driver: bridge

EdgeCraftRAG/docs/API_Guide.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -219,4 +219,4 @@ curl -X POST http://${HOST_IP}:16010/v1/retrieval -H "Content-Type: application/
219219

220220
```bash
221221
curl -X POST http://${HOST_IP}:16011/v1/chatqna -H "Content-Type: application/json" -d '{"messages":"#REPLACE WITH YOUR QUESTION HERE#", "top_n":5, "max_tokens":512}' | jq '.'
222-
```
222+
```

EdgeCraftRAG/docs/Advanced_Setup.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -208,6 +208,6 @@ Model preparation is the same as vLLM inference section, please refer to [Prepar
208208

209209
This section is the same as default vLLM inference section, please refer to [Prepare env variables and configurations](../docker_compose/intel/gpu/arc/README.md#prepare-env-variables-and-configurations) and [Start Edge Craft RAG Services with Docker Compose](../docker_compose/intel/gpu/arc/README.md#deploy-the-service-on-arc-a770-using-docker-compose)
210210

211-
### 2. Access Kbadmin UI
211+
### 2. Access Kbadmin UI
212212

213213
please refer to [ChatQnA with Kbadmin in UI](./Explore_Edge_Craft_RAG.md#chatqna-with-kbadmin-in-ui)

EdgeCraftRAG/docs/Explore_Edge_Craft_RAG.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -34,7 +34,7 @@ After knowledge base creation, you can upload the documents for retrieval.
3434
Then, you can submit messages in the chat box in `Chat` page.
3535
![chat_with_rag](../assets/img/chatqna.png)
3636

37-
## ChatQnA with Kbadmin in UI
37+
## ChatQnA with Kbadmin in UI
3838

3939
### Kbadmin Pipeline
4040

@@ -52,4 +52,4 @@ Please select 'kbadmin' in `Type`and select kb name from the kbs you created in
5252
![upload_data](../assets/img/kbadmin_kb.png)
5353

5454
Then, you can submit messages in the chat box in `Chat` page.
55-
![chat_with_rag](../assets/img/chatqna.png)
55+
![chat_with_rag](../assets/img/chatqna.png)

EdgeCraftRAG/edgecraftrag/api/v1/chatqna.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -38,7 +38,7 @@ async def chatqna(request: ChatCompletionRequest):
3838
active_kb = ctx.knowledgemgr.get_active_knowledge_base()
3939
request.user = active_kb if active_kb else None
4040
if experience_kb:
41-
request.tool_choice = "auto" if experience_kb.experience_active else "none"
41+
request.tool_choice = 'auto' if experience_kb.experience_active else 'none'
4242
generator = ctx.get_pipeline_mgr().get_active_pipeline().generator
4343
if generator:
4444
request.model = generator.model_id
@@ -62,7 +62,7 @@ async def ragqna(request: ChatCompletionRequest):
6262
active_kb = ctx.knowledgemgr.get_active_knowledge_base()
6363
request.user = active_kb if active_kb else None
6464
if experience_kb:
65-
request.tool_choice = "auto" if experience_kb.experience_active else "none"
65+
request.tool_choice = 'auto' if experience_kb.experience_active else 'none'
6666
generator = ctx.get_pipeline_mgr().get_active_pipeline().generator
6767
if generator:
6868
request.model = generator.model_id

EdgeCraftRAG/edgecraftrag/api/v1/data.py

Lines changed: 46 additions & 23 deletions
Original file line numberDiff line numberDiff line change
@@ -13,88 +13,111 @@
1313

1414
# Upload a text or files
1515
@data_app.post(path="/v1/data")
16-
async def add_data(request: DataIn):
17-
pl = ctx.get_pipeline_mgr().get_active_pipeline()
16+
async def add_data(request: DataIn, docs_name: str = None):
17+
active_pl = ctx.get_pipeline_mgr().get_active_pipeline()
1818
docs = []
1919
if request.text is not None:
2020
docs.extend(ctx.get_file_mgr().add_text(text=request.text))
2121
if request.local_path is not None:
22-
docs.extend(ctx.get_file_mgr().add_files(docs=request.local_path))
22+
docs.extend(ctx.get_file_mgr().add_files(docs=request.local_path, docs_name=docs_name))
2323

2424
nodelist = ctx.get_pipeline_mgr().run_data_prepare(docs=docs)
25-
if pl.indexer.comp_subtype != "kbadmin_indexer":
25+
if active_pl.indexer.comp_subtype != "kbadmin_indexer":
2626
if nodelist is None or len(nodelist) == 0:
2727
raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail="File not found")
28-
ctx.get_node_mgr().add_nodes(pl.node_parser.idx, nodelist)
28+
ctx.get_node_mgr().add_nodes(active_pl.node_parser.idx, nodelist)
2929
return "Done"
3030

3131

3232
# Reindex all files
3333
@data_app.post(path="/v1/data/reindex")
3434
async def redindex_data():
3535
pl = ctx.get_pipeline_mgr().get_active_pipeline()
36-
36+
kb = ctx.get_knowledge_mgr().get_active_knowledge_base()
37+
if kb:
38+
kb_name = kb.name
39+
docs_name = kb_name + pl.name + str(pl.indexer.d)
40+
else:
41+
kb_name = None
42+
docs_name = None
3743
ctx.get_node_mgr().del_nodes_by_np_idx(pl.node_parser.idx)
38-
pl.indexer.reinitialize_indexer()
44+
pl.indexer.reinitialize_indexer(kb_name)
3945
pl.update_indexer_to_retriever()
4046

41-
all_docs = ctx.get_file_mgr().get_all_docs()
47+
all_docs = []
48+
docs_list = ctx.get_file_mgr().get_kb_files_by_name(docs_name)
49+
for docs_file in docs_list:
50+
all_docs.extend(docs_file.documents)
4251
nodelist = ctx.get_pipeline_mgr().run_data_prepare(docs=all_docs)
4352
if nodelist is not None and len(nodelist) > 0:
4453
ctx.get_node_mgr().add_nodes(pl.node_parser.idx, nodelist)
45-
4654
return "Done"
4755

4856

4957
# Upload files by a list of file_path
5058
@data_app.post(path="/v1/data/files")
5159
async def add_files(request: FilesIn):
5260
docs = []
61+
pl = ctx.get_pipeline_mgr().get_active_pipeline()
62+
kb = ctx.get_knowledge_mgr().get_active_knowledge_base()
63+
docs_name = kb.name + pl.name + str(pl.indexer.d)
5364
if request.local_paths is not None:
54-
docs.extend(ctx.get_file_mgr().add_files(docs=request.local_paths))
65+
docs.extend(ctx.get_file_mgr().add_files(docs=request.local_paths, docs_name=docs_name))
5566

5667
nodelist = ctx.get_pipeline_mgr().run_data_prepare(docs=docs)
5768
if nodelist is None or len(nodelist) == 0:
5869
raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail="File not found")
59-
pl = ctx.get_pipeline_mgr().get_active_pipeline()
6070
ctx.get_node_mgr().add_nodes(pl.node_parser.idx, nodelist)
6171
return "Done"
6272

6373

6474
# GET files
6575
@data_app.get(path="/v1/data/files")
6676
async def get_files():
67-
return ctx.get_file_mgr().get_files()
77+
return ctx.get_file_mgr().get_all_docs()
6878

6979

7080
# GET a file
7181
@data_app.get(path="/v1/data/files/{name}")
72-
async def get_file_docs(name):
73-
return ctx.get_file_mgr().get_file_by_name_or_id(name)
82+
async def get_kb_files_by_name(name):
83+
return ctx.get_file_mgr().get_kb_files_by_name(name)
7484

7585

7686
# DELETE a file
7787
@data_app.delete(path="/v1/data/files/{name}")
78-
async def delete_file(name):
79-
if ctx.get_file_mgr().del_file(name):
80-
pl = ctx.get_pipeline_mgr().get_active_pipeline()
81-
88+
async def delete_file(kb_name, file_path):
89+
pl = ctx.get_pipeline_mgr().get_active_pipeline()
90+
docs_name = kb_name + pl.name + str(pl.indexer.d)
91+
if ctx.get_file_mgr().del_file(docs_name, file_path):
8292
# Current solution: reindexing all docs after deleting one file
8393
# TODO: delete the nodes related to the file
8494
ctx.get_node_mgr().del_nodes_by_np_idx(pl.node_parser.idx)
85-
pl.indexer.reinitialize_indexer()
95+
pl.indexer.reinitialize_indexer(kb_name)
8696
pl.update_indexer_to_retriever()
87-
88-
all_docs = ctx.get_file_mgr().get_all_docs()
97+
all_docs = ctx.get_file_mgr().get_file_by_name(docs_name)
8998
nodelist = ctx.get_pipeline_mgr().run_data_prepare(docs=all_docs)
9099
if nodelist is not None and len(nodelist) > 0:
91100
ctx.get_node_mgr().add_nodes(pl.node_parser.idx, nodelist)
92101

102+
return "File is deleted"
103+
else:
104+
return "File not found"
105+
106+
# DELETE a file
107+
@data_app.delete(path="/v1/data/all_files/{name}")
108+
async def delete_all_file(name):
109+
if ctx.get_file_mgr().del_kb_file(name):
110+
pl = ctx.get_pipeline_mgr().get_active_pipeline()
111+
112+
# Current solution: reindexing all docs after deleting one file
113+
# TODO: delete the nodes related to the file
114+
ctx.get_node_mgr().del_nodes_by_np_idx(pl.node_parser.idx)
115+
pl.indexer.reinitialize_indexer()
116+
pl.update_indexer_to_retriever()
93117
return f"File {name} is deleted"
94118
else:
95119
return f"File {name} not found"
96120

97-
98121
# Upload & save a file from UI
99122
@data_app.post(path="/v1/data/file/{file_name}")
100123
async def upload_file(file_name: str, file: UploadFile = File(...)):
@@ -122,4 +145,4 @@ async def upload_file(file_name: str, file: UploadFile = File(...)):
122145
except Exception as e:
123146
raise HTTPException(
124147
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=f"Failed to upload file: {str(e)}"
125-
)
148+
)

0 commit comments

Comments
 (0)