diff --git a/RAGSDK/MainRepo/Dockerfile/ubuntu/Dockerfile b/RAGSDK/MainRepo/Dockerfile/ubuntu/Dockerfile
index a495a2c395f87ea201a09fa2d359a2dd1044828c..d821939466f0f375bcd2c2ee38a9858c23fde69f 100644
--- a/RAGSDK/MainRepo/Dockerfile/ubuntu/Dockerfile
+++ b/RAGSDK/MainRepo/Dockerfile/ubuntu/Dockerfile
@@ -68,14 +68,14 @@ ENV LD_LIBRARY_PATH=${OPENBLAS_INSTALL_PATH}/lib:$LD_LIBRARY_PATH
 
 # Install faiss
-ARG FAISS_INSTALL_PATH=/usr/local/faiss/faiss1.7.4
+ARG FAISS_INSTALL_PATH=/usr/local/faiss/faiss1.10.0
 RUN . /tmp/urls.conf && wget $FAISS_URL && \
-    tar -xf v1.7.4.tar.gz && \
-    cd faiss-1.7.4/faiss && \
-    sed -i "131 i virtual void search_with_filter (idx_t n, const float *x, idx_t k, float *distances, idx_t *lables, const void *mask = nullptr) const{}" Index.h && \
-    sed -i "38 i template IndexIDMapTemplate::IndexIDMapTemplate (IndexT *index, std::vector &ids): index (index), own_fields (false) { this->is_trained = index->is_trained; this->metric_type = index->metric_type; this->verbose = index->verbose; this->d = index->d; id_map = ids; }" IndexIDMap.cpp && \
-    sed -i "29 i explicit IndexIDMapTemplate (IndexT *index, std::vector &ids);" IndexIDMap.h && \
-    sed -i "199 i utils/sorting.h" CMakeLists.txt && \
+    tar -xf v1.10.0.tar.gz && \
+    cd faiss-1.10.0/faiss && \
+    sed -i "149 i virtual void search_with_filter (idx_t n, const float *x, idx_t k, float *distances, idx_t *lables, const void *mask = nullptr) const{}" Index.h && \
+    sed -i "49 i template IndexIDMapTemplate::IndexIDMapTemplate (IndexT *index, std::vector &ids): index (index), own_fields (false) { this->is_trained = index->is_trained; this->metric_type = index->metric_type; this->verbose = index->verbose; this->d = index->d; id_map = ids; }" IndexIDMap.cpp && \
+    sed -i "30 i explicit IndexIDMapTemplate (IndexT *index, std::vector &ids);" IndexIDMap.h && \
+    sed -i "217 i utils/sorting.h" CMakeLists.txt && \
     cd .. && cmake -B build . -DFAISS_ENABLE_GPU=OFF -DPython_EXECUTABLE=/usr/bin/python3 -DBUILD_TESTING=OFF -DBUILD_SHARED_LIBS=ON -DCMAKE_BUILD_TYPE=Release -DCMAKE_INSTALL_PREFIX=${FAISS_INSTALL_PATH} && \
     make -C build -j faiss && \
     make -C build -j swigfaiss && \
@@ -83,7 +83,7 @@ RUN . /tmp/urls.conf && wget $FAISS_URL && \
     cd ../../.. && make -C build install && \
     cd build/faiss/python && cp libfaiss_python_callbacks.so ${FAISS_INSTALL_PATH}/lib && \
     cd dist && \
-    pip3 install faiss-1.7.4*.whl
+    pip3 install faiss-1.10.0*.whl
 
 # Install index
 COPY ./package/Ascend-mindxsdk-mxindex*_linux-${ARCH}.run /tmp/
@@ -92,7 +92,7 @@ ENV MX_INDEX_MODELPATH=/home/ascend/modelpath
 RUN cd /usr/local/Ascend/mxIndex/ops && ./custom_opp_${ARCH}.run && mkdir -p /home/ascend/modelpath
 
 # Install ascendfaiss
-ARG FAISS_INSTALL_PATH=/usr/local/faiss/faiss1.7.4
+ARG FAISS_INSTALL_PATH=/usr/local/faiss/faiss1.10.0
 ARG MXINDEX_INSTALL_PATH=/usr/local/Ascend/mxIndex
 ARG PYTHON_HEADER=/usr/include/${PYTHON_VERSION}/
 ARG ASCEND_INSTALL_PATH=/usr/local/Ascend/ascend-toolkit/latest
@@ -111,7 +111,7 @@ RUN unzip master.zip && \
     cd dist && pip3 install ascendfaiss*.whl
 
-#ENV LD_LIBRARY_PATH=/usr/local/Ascend/mxIndex/lib:/usr/local/faiss/faiss1.7.4/lib:$LD_LIBRARY_PATH
+#ENV LD_LIBRARY_PATH=/usr/local/Ascend/mxIndex/lib:/usr/local/faiss/faiss1.10.0/lib:$LD_LIBRARY_PATH
 
 
 # Install torch_npu
@@ -134,7 +134,7 @@ RUN sed -i '$a\export PYTHONPATH=/root/.local/lib/$PYTHON_VERSION/site-packages/
     sed -i '$a\source /usr/local/Ascend/ascend-toolkit/set_env.sh' /root/.bashrc && \
     sed -i '$a\source /usr/local/Ascend/nnal/atb/set_env.sh' /root/.bashrc && \
     sed -i '$a\source /usr/local/Ascend/mxRag/script/set_env.sh' /root/.bashrc && \
-    sed -i '$a\export LD_LIBRARY_PATH=/usr/local/Ascend/mxIndex/lib:/usr/local/faiss/faiss1.7.4/lib:$LD_LIBRARY_PATH' /root/.bashrc && \
+    sed -i '$a\export LD_LIBRARY_PATH=/usr/local/Ascend/mxIndex/lib:/usr/local/faiss/faiss1.10.0/lib:$LD_LIBRARY_PATH' /root/.bashrc && \
     sed -i '$a\export PATH=/usr/local/bin:$PATH' /root/.bashrc && \
     sed -i 's/$PYTHON_VERSION/'"$PYTHON_VERSION"'/g' /root/.bashrc && \
     sed -i '$a\export LOGURU_FORMAT="{time:YYYY-MM-DD HH:mm:ss.SSS} | {level: <8} | {name}:{function}:{line} - {message!r}"' /root/.bashrc
@@ -156,7 +156,7 @@ RUN sed -i '$a\export PYTHONPATH=/home/HwHiAiUser/.local/lib/$PYTHON_VERSION/sit
     sed -i '$a\source /usr/local/Ascend/ascend-toolkit/set_env.sh' /home/HwHiAiUser/.bashrc && \
     sed -i '$a\source /usr/local/Ascend/nnal/atb/set_env.sh' /home/HwHiAiUser/.bashrc && \
     sed -i '$a\source /home/HwHiAiUser/Ascend/mxRag/script/set_env.sh' /home/HwHiAiUser/.bashrc && \
-    sed -i '$a\export LD_LIBRARY_PATH=/home/HwHiAiUser/Ascend/mxIndex/lib:/usr/local/faiss/faiss1.7.4/lib:$LD_LIBRARY_PATH' /home/HwHiAiUser/.bashrc && \
+    sed -i '$a\export LD_LIBRARY_PATH=/home/HwHiAiUser/Ascend/mxIndex/lib:/usr/local/faiss/faiss1.10.0/lib:$LD_LIBRARY_PATH' /home/HwHiAiUser/.bashrc && \
     sed -i '$a\export PATH=/usr/local/bin:$PATH' /home/HwHiAiUser/.bashrc && \
     sed -i 's/$PYTHON_VERSION/'"$PYTHON_VERSION"'/g' /home/HwHiAiUser/.bashrc && \
     sed -i '$a\export LOGURU_FORMAT="{time:YYYY-MM-DD HH:mm:ss.SSS} | {level: <8} | {name}:{function}:{line} - {message!r}"' /home/HwHiAiUser/.bashrc
diff --git a/RAGSDK/MainRepo/Dockerfile/ubuntu/urls.conf b/RAGSDK/MainRepo/Dockerfile/ubuntu/urls.conf
index ba90bb23b30be8fba19d21871427a7eef3ee9184..9dea52d6bd45d2b5a8f24608733ca180cbba899f 100644
--- a/RAGSDK/MainRepo/Dockerfile/ubuntu/urls.conf
+++ b/RAGSDK/MainRepo/Dockerfile/ubuntu/urls.conf
@@ -1,5 +1,5 @@
 PYPI_URL=https://bootstrap.pypa.io/get-pip.py
 CMAKE_URL=https://cmake.org/files/v3.24/cmake-3.24.3.tar.gz
 OPENBLAS_URL=https://github.com/OpenMathLib/OpenBLAS.git
-FAISS_URL=https://github.com/facebookresearch/faiss/archive/v1.7.4.tar.gz
+FAISS_URL=https://github.com/facebookresearch/faiss/archive/v1.10.0.tar.gz
 ASCENDFAISS_URL=https://gitee.com/ascend/mindsdk-referenceapps/repository/archive/master.zip
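The sed insertions above patch hard-coded line numbers in the faiss 1.10.0 sources, so they will silently break if the upstream headers shift again. Once the image is built, the patched wheel can be smoke-tested from Python; a minimal sketch (assuming the wheel installed into the image's default python3):

```
import numpy as np
import faiss  # the 1.10.0 wheel built above

# Build a tiny flat L2 index and run one query as a smoke test.
dim = 128
index = faiss.IndexFlatL2(dim)
xb = np.random.rand(100, dim).astype("float32")
index.add(xb)
distances, ids = index.search(xb[:1], k=5)
print(ids[0])  # the first hit should be the query vector itself
```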
diff --git a/RAGSDK/PocValidation/dify/README.md b/RAGSDK/PocValidation/dify/README.md
new file mode 100644
index 0000000000000000000000000000000000000000..e2c72a03a8efc7284f7dc9a78a312fcfb4c806ef
--- /dev/null
+++ b/RAGSDK/PocValidation/dify/README.md
@@ -0,0 +1,66 @@
+### Compatible versions
+dify: 0.15.3
+
+milvus: v2.5.0 or later
+
+streamlit
+
+### Usage steps
+
+1 Deploy the milvus service ([deployment guide](https://milvus.io/docs/zh/install_standalone-docker.md))
+
+2 Deploy the mis-tei embedding and reranker services ([deployment guide](https://www.hiascend.com/developer/ascendhub/detail/07a016975cc341f3a5ae131f2b52399d))
+
+3 To parse the images inside docx and pdf files and return illustrated (text-and-image) answers, also deploy a VLM model service ([deployment guide](https://www.hiascend.com/developer/ascendhub/detail/9eedc82e0c0644b2a2a9d0821ed5e7ad)) and an LLM service ([deployment guide](https://www.hiascend.com/developer/ascendhub/detail/125b5fb4e7184b8dabc3ae4b18c6ff99))
+
+4 Run dify_demo.py to start the service; run it with --help to see all options
+```
+python3 dify_demo.py
+```
+5 Upload, delete, and list documents through the HTTP endpoints
+
+6 The service can be attached to dify as an external knowledge base configured in the dify UI ([deployment guide](https://docs.dify.ai/zh-hans/guides/knowledge-base/connect-external-knowledge-base))
+
+7 Call the /query endpoint for Q&A tests. For illustrated answers, start the demo with --parse_image to enable image parsing. The LLM answer is written to response.md under the working directory; the snippet below renders it as a web page. Save the following code as st.py next to dify_demo.py:
+
+```
+import streamlit as st
+import re
+
+# Read the Markdown file
+with open("./response.md", "r", encoding="utf-8") as file:
+    markdown_text = file.read()
+
+# Render the Markdown content in the Streamlit app, handling embedded images
+def render_markdown_with_images(markdown_text):
+    # Match the Markdown image syntax ![alt text](image_url)
+    pattern = re.compile(r'!\[.*?\]\((.*?)\)')
+
+    # Position of the previous match
+    last_pos = 0
+
+    # Walk through all matches
+    for match in pattern.finditer(markdown_text):
+        # Render the text between the previous position and this match
+        st.markdown(markdown_text[last_pos:match.start()], unsafe_allow_html=True)
+
+        # Render the image
+        img_url = match.group(1)
+        st.image(img_url)
+
+        # Advance past this match
+        last_pos = match.end()
+
+    # Render the remaining text
+    st.markdown(markdown_text[last_pos:], unsafe_allow_html=True)
+
+# Call the function to render the content
+render_markdown_with_images(markdown_text)
+```
+
+This is only a simple display example; if security is a concern, enable HTTPS authentication.
+
+Start the web service with:
+```
+streamlit run st.py --server.address "<server IP>" --server.port <server port>
+```
\ No newline at end of file
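The demo below exposes plain HTTP endpoints, so the upload/list/query flow described in the README can be driven from a short client script. A minimal sketch (the host, port, file name, and question are assumptions; host and port match the demo's defaults):

```
import requests

BASE = "http://127.0.0.1:9098"  # assumed: dify_demo.py default host/port

# Upload a document into the knowledge base
with open("sample.docx", "rb") as f:
    resp = requests.post(f"{BASE}/uploadfile", files={"file": ("sample.docx", f)})
print(resp.status_code)

# List the documents currently in the knowledge base
print(requests.get(f"{BASE}/listfiles").json())

# Ask a question; the server also writes the answer to response.md
payload = {
    "knowledge_id": "test",  # matches the default --knowledge_name
    "query": "Summarize the uploaded document.",
    "retrieval_setting": {"top_k": 3, "score_threshold": 0.5},
}
print(requests.post(f"{BASE}/query", json=payload).json())
```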
diff --git a/RAGSDK/PocValidation/dify/dify_demo.py b/RAGSDK/PocValidation/dify/dify_demo.py
new file mode 100644
index 0000000000000000000000000000000000000000..391a5afd2589a8d8b6f0fa2acbce4becf8bcef46
--- /dev/null
+++ b/RAGSDK/PocValidation/dify/dify_demo.py
@@ -0,0 +1,711 @@
+import argparse
+import base64
+import io
+import json
+import os
+import sys
+import re
+import shutil
+from http import HTTPStatus
+from typing import Optional, List
+from pathlib import Path
+
+import docx
+import fitz
+import httpx
+import uvicorn
+from PIL import Image
+from fastapi import FastAPI, UploadFile
+from langchain_openai import ChatOpenAI
+from loguru import logger
+from openai import OpenAI
+from pydantic import BaseModel
+from pymilvus import MilvusClient
+from starlette.responses import JSONResponse
+
+from langchain_community.document_loaders import TextLoader
+from langchain_text_splitters import RecursiveCharacterTextSplitter
+from mx_rag.document import LoaderMng
+from mx_rag.document.loader import DocxLoader, PdfLoader
+from mx_rag.embedding.service import TEIEmbedding
+from mx_rag.knowledge import KnowledgeStore, KnowledgeDB
+from mx_rag.reranker.service import TEIReranker
+from mx_rag.retrievers import Retriever, FullTextRetriever
+from mx_rag.storage.document_store import MilvusDocstore
+from mx_rag.storage.vectorstore import MilvusDB
+from mx_rag.utils import ClientParam
+
+sys.tracebacklimit = 1000
+
+app = FastAPI()
+
+upload_file_dir = os.environ.get("UPLOAD_FILE_DIR", "/home/data")
+images_store_dir = os.environ.get("IMG_STORE_DIR", "/home/images")
+os.makedirs(upload_file_dir, exist_ok=True)
+
+img_to_text_prompt = '''Given an image containing a table or figure, please provide a structured and detailed
+description in Chinese with two levels of granularity:
+
+    Coarse-grained description:
+    - Summarize the overall content and purpose of the image.
+    - Briefly state what type of data or information is presented (e.g., comparison, trend, distribution).
+    - Mention the main topic or message conveyed by the table or figure.
+
+    Fine-grained description:
+    - Describe the specific details present in the image.
+    - For tables: list the column and row headers, units, and any notable values, patterns, or anomalies.
+    - For figures (e.g., plots, charts): explain the axes, data series, legends, and any significant trends, outliers,
+      or data points.
+    - Note any labels, captions, or annotations included in the image.
+    - Highlight specific examples or noteworthy details.
+
+    Deliver the description in a clear, organized, and reader-friendly manner, using bullet points or paragraphs
+    as appropriate. Answer in Chinese.'''
+
+text_infer_prompt = '''
+You are a helpful question-answering assistant. Your task is to generate an interleaved text and image response based on the provided question and quotes. Here's how to refine your process:
+
+1. **Evidence Selection**:
+   - From both text and image quotes, pinpoint those truly relevant for answering the question. Focus on significance and direct relevance.
+   - Each image quote is the description of the image.
+
+2. **Answer Construction**:
+   - Use Markdown to embed text and images in your response; avoid using obvious headings or divisions; ensure the response flows naturally and cohesively.
+   - Conclude with a direct and concise answer to the question in a simple and clear sentence.
+
+3. **Quote Citation**:
+   - Cite text by adding [index]; for example, a quote from the first text should be [1].
+   - Cite images using the format `![{conclusion}](image index)`; for the first image, use `![{conclusion}](image1)`. The {conclusion} should be a concise one-sentence summary of the image's content.
+   - The image citation must strictly follow `![{conclusion}](image index)`; do not simply state "See image1", "image1 shows", "[image1]" or "image1".
+   - Each image or text can only be quoted once.
+
+- Do not cite irrelevant quotes.
+- Compose a detailed and articulate interleaved answer to the question.
+- Ensure that your answer is logical, informative, and directly ties back to the evidence provided by the quotes.
+- The interleaved answer must contain both text and image responses.
+- Answer in Chinese.
+'''
+
+
+# Create the llm_chain client
+def create_llm_chain(base_url, model_name):
+    http_client = httpx.Client()
+    root_client = OpenAI(
+        base_url=base_url,
+        api_key="sk_fake",
+        http_client=http_client
+    )
+
+    client = root_client.chat.completions
+
+    llm = ChatOpenAI(
+        api_key="sk_fake",
+        client=client,
+        model_name=model_name,
+        temperature=0.5,
+        streaming=True,
+    )
+
+    return llm
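+
+
+# Illustrative usage of create_llm_chain (not executed here; the URL and model
+# name are placeholders matching the CLI defaults defined in main() below):
+#   llm = create_llm_chain("http://127.0.0.1:2025/openai/v1", "Qwen2.5-32B-Instruct")
+#   print(llm.invoke("hello").content)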
+
+
+def compose_text_messages(question, text_docs, img_docs):
+    # 2. Add the text quotes
+    user_message = "Text Quotes are:"
+    for i, doc in enumerate(text_docs):
+        user_message += f"\n[{i + 1}] {doc.page_content}"
+
+    # 3. Add the image quotes (VLM text or OCR text)
+    user_message += "\nImage Quotes are:"
+    for i, doc in enumerate(img_docs):
+        user_message += f"\nimage{i + 1} is described as: {doc.page_content}"
+    user_message += "\n\n"
+
+    # 4. Add the user question
+    user_message += f"The user question is: {question}"
+
+    return user_message
+
+
+# Extract all images from a docx file and store them under output_folder
+def extract_images_from_docx(image_out_dir, file_path):
+    # Open the document
+    doc = docx.Document(file_path)
+
+    output_folder = os.path.join(image_out_dir, os.path.basename(file_path))
+    # Create the output folder
+    if not os.path.exists(output_folder):
+        os.makedirs(output_folder)
+
+    # Walk the document relationships and save every image part
+    for rel in doc.part.rels.values():
+        if "image" in rel.target_ref:
+            image_part = rel.target_part
+            image_filename = os.path.basename(image_part.partname)
+            image_path = os.path.join(output_folder, image_filename)
+            with open(image_path, "wb") as image_file:
+                image_file.write(image_part.blob)
+
+    logger.info(f"extract images from {file_path} successfully")
+
+
+# Extract all images from a pdf file and store them under output_folder
+def extract_images_from_pdf(image_out_dir, file_path):
+    output_folder = os.path.join(image_out_dir, os.path.basename(file_path))
+    # Create the output folder
+    if not os.path.exists(output_folder):
+        os.makedirs(output_folder)
+
+    # Open the PDF file
+    pdf_document = fitz.open(file_path)
+
+    # Iterate over every page
+    for page_num in range(len(pdf_document)):
+        page = pdf_document.load_page(page_num)
+        image_list = page.get_images(full=True)
+
+        # Iterate over every image on the page
+        for img_index, img in enumerate(image_list):
+            xref = img[0]
+            base_image = pdf_document.extract_image(xref)
+            image_bytes = base_image["image"]
+            image_ext = base_image["ext"]
+
+            # Save the image
+            image_filename = f"image_{page_num + 1}_{img_index + 1}.{image_ext}"
+            image_path = f"{output_folder}/{image_filename}"
+            with open(image_path, "wb") as image_file:
+                image_file.write(image_bytes)
+
+    pdf_document.close()
+
+    logger.info(f"extract images from {file_path} successfully")
+
+
+# Get the embedding model object
+def get_embedding():
+    # Initialize the embedding client
+    return TEIEmbedding(url=os.environ.get("embedding_url"), client_param=ClientParam(use_http=True))
+
+
+# Get the vector store object
+def get_vector_store():
+    knowledge_name = os.environ.get("knowledge_name")
+    milvus_client = MilvusClient(os.environ.get("milvus_url"))
+    vector_store = MilvusDB.create(client=milvus_client,
+                                   x_dim=int(os.environ.get("embedding_dim")),
+                                   collection_name=f"{knowledge_name}_vector")
+    return vector_store
+
+
+# Get the chunk (text) store object
+def get_chunk_store():
+    knowledge_name = os.environ.get("knowledge_name")
+    milvus_client = MilvusClient(os.environ.get("milvus_url"))
+    return MilvusDocstore(milvus_client, collection_name=f"{knowledge_name}_chunk")
+
+
+# Get the knowledge base object
+def get_knowledge_db():
+    chunk_store = get_chunk_store()
+    user_id = "7d1d04c1-dd5f-43f8-bad5-99795f24bce6"
+    vector_store = get_vector_store()
+    knowledge_store = KnowledgeStore(db_path="./knowledge_store_sql.db")
+    knowledge_name = os.environ.get("knowledge_name")
+    knowledge_store.add_knowledge(knowledge_name, user_id=user_id)
+
+    # Initialize knowledge base management
+    knowledge_db = KnowledgeDB(knowledge_store=knowledge_store,
+                               chunk_store=chunk_store,
+                               vector_store=vector_store,
+                               knowledge_name=knowledge_name,
+                               white_paths=["/home"],
+                               user_id=user_id)
+
+    return knowledge_db
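+
+
+# Note on the storage layout (illustrative): get_knowledge_db() wires three
+# stores together: document metadata in the local SQLite file
+# knowledge_store_sql.db, chunk texts in the Milvus collection
+# "<knowledge_name>_chunk", and embeddings in "<knowledge_name>_vector".
+# Deleting a file (see /deletefile below) therefore has to touch all three.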
+
+
+# Get the document loader and splitter
+def get_document_loader_splitter(file_suffix):
+    # Initialize the document loading/splitting manager
+    loader_mng = LoaderMng()
+
+    # Register document loaders. The ones provided by mxrag or by langchain can be used,
+    # or a custom parser can be implemented against the
+    # langchain_community.document_loaders.base.BaseLoader interface.
+    loader_mng.register_loader(loader_class=TextLoader, file_types=[".txt", ".md"])
+    loader_mng.register_loader(loader_class=DocxLoader, file_types=[".docx"])
+    loader_mng.register_loader(loader_class=PdfLoader, file_types=[".pdf"])
+    # Register document splitters. A custom splitter can be implemented on top of the
+    # langchain_text_splitters.base.TextSplitter base class.
+    loader_mng.register_splitter(splitter_class=RecursiveCharacterTextSplitter,
+                                 file_types=[".docx", ".txt", ".md", ".pdf"],
+                                 splitter_params={"chunk_size": 750,
+                                                  "chunk_overlap": 150,
+                                                  "keep_separator": False
+                                                  }
+                                 )
+
+    # Look up the parser info (class and params) for the file suffix
+    loader_info = loader_mng.get_loader(file_suffix)
+    # Look up the splitter info (class and params) for the file suffix
+    splitter_info = loader_mng.get_splitter(file_suffix)
+
+    return loader_info, splitter_info
+
+
+# Retrieve similar chunks from the databases for a question
+def retrieve_similarity_docs(query, top_k, score_threshold):
+    # Get the embedding object
+    emb = get_embedding()
+    # Get the chunk and vector store objects
+    chunk_store = get_chunk_store()
+    vector_store = get_vector_store()
+
+    # Configure the dense (vector) retriever
+    dense_retriever = Retriever(vector_store=vector_store,
+                                document_store=chunk_store,
+                                embed_func=emb.embed_documents,
+                                k=top_k,
+                                score_threshold=score_threshold
+                                )
+
+    # Use the retriever to find the top_k chunks closest to the query in the vector store
+    dense_res = dense_retriever.invoke(query)
+
+    # Configure the full-text retriever, implemented as BM25 retrieval
+    full_text_retriever = FullTextRetriever(document_store=chunk_store, k=top_k)
+
+    full_text_res = full_text_retriever.invoke(query)
+
+    # Merge the retrieval results
+    docs = dense_res + full_text_res
+
+    # The two retrieval paths may return duplicate chunks; deduplicate them
+    contents = set()
+    new_docs = []
+    for doc in docs:
+        if doc.page_content not in contents:
+            new_docs.append(doc)
+            contents.add(doc.page_content)
+
+    logger.info("retrieve similarity chunks from knowledge successfully")
+    return new_docs
+
+
+def generate_answer(query, q_docs):
+    # Split the knowledge chunks into raw text and multi-granularity image-description text
+    text_docs = [doc for doc in q_docs if doc.metadata.get("type", "") == "text"]
+    img_docs = [doc for doc in q_docs if doc.metadata.get("type", "") == "image"]
+
+    text = compose_text_messages(query, text_docs, img_docs)
+
+    # Build the request messages
+    messages = [
+        {"role": "system", "content": text_infer_prompt},
+        {"role": "user", "content": text}
+    ]
+
+    # Configure the LLM client object
+    llm_chain = create_llm_chain(base_url=os.environ.get("llm_base_url"), model_name=os.environ.get("llm_model_name"))
+
+    response = ""
+    try:
+        response = llm_chain.invoke(messages).content
+        logger.info("generate answer by llm successfully")
+    except Exception as e:
+        logger.error(f"call llm invoke failed:{e}")
+
+    result = replace_image_paths(response, img_docs)
+
+    return result
+
+
+def replace_image_paths(text, image_docs):
+    """
+    Replace every imageN reference in the response with the matching image_path from image_docs.
+    """
+    if text == "":
+        return text
+
+    # Build the imageN -> image_path mapping
+    image_mapping = {}
+    for i, doc in enumerate(image_docs):
+        image_key = f"image{i + 1}"
+        image_path = doc.metadata.get("image_path", "")
+        image_mapping[image_key] = image_path
+
+    # Find every ![...](imageN) pattern and substitute the real path
+    def replace_match(match):
+        full_match = match.group(0)  # the full matched string
+        alt_text = match.group(1)    # the image caption text
+        image_ref = match.group(2)   # imageN
+
+        # Substitute when a matching image_path exists
+        if image_ref in image_mapping:
+            return f"![{alt_text}]({image_mapping[image_ref]})"
+        else:
+            # Otherwise keep the reference unchanged
+            return full_match
+
+    # Match the ![...](imageN) pattern
+    pattern = r'!\[([^\]]*)\]\((image\d+)\)'
+    updated_response = re.sub(pattern, replace_match, text)
+
+    logger.info("Image paths replacement completed")
+    return updated_response
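+
+
+# Illustrative example of the rewrite performed by replace_image_paths
+# (the path is a made-up placeholder):
+#   "... ![sales trend](image1) ..." ->
+#   "... ![sales trend](/home/images/report.docx/image_1_1.png) ..."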
logger.warning(f"----------- image:{image_path} size: ({width},{height}) too little, will be discarded") + return "" + + buffer = io.BytesIO() + if Path(image_path).suffix == ".png": + img = img.convert("RGB") + + if width > 1024 or height > 1024: + img = img.resize(size=(width // 2, height // 2)) + + img.save(buffer, format="JPEG") + img_str = base64.b64encode(buffer.getvalue()).decode('utf-8') + + # 构造请求消息 + messages = [ + { + "role": "user", + "content": [ + {"type": "text", "text": img_to_text_prompt}, + {"type": "image_url", "image_url": {"url": f"data:image;base64,{img_str}"}} + ] + } + ] + + vlm = create_llm_chain(base_url=os.environ.get("vlm_base_url"), model_name=os.environ.get("vlm_model_name")) + + try: + return vlm.invoke(messages).content + except Exception as e: + logger.error(f"call vlm invoke failed:{e}") + return "" + + +# 获取目录下的所有图片文件路径 +def find_images_files(directory, recursive=False): + base_path = Path(directory) + exts = ('.jpg', '.jpeg', ".png") + files = [] + + for ext in exts: + pattern = f'**/*{ext}' if recursive else f'*{ext}' + file_list = list(base_path.glob(pattern)) + files.extend(str(p) for p in file_list) + + return files + + +# 将图片目录下的所有有图片调用vlm进行多粒度理解述并保存到json文件中 +def extract_images_info_by_vlm(image_out_dir, file_name): + image_dir = os.path.join(image_out_dir, file_name) + + # 避免同一个文件中的所有图片重复调用vlm 提取信息,如果image_info.json如果存在,表示已经提取,不用再次提取,降低vlm算力 + if os.path.exists(os.path.join(image_dir, "image_info.json")): + logger.warning(f"all images in {image_dir} have been extracted, no need to repeat extraction") + return + + logger.info(f"start to extract images info in file [{file_name}] by vlm ...") + + image_files = find_images_files(image_dir) + info = [] + for image_file in image_files: + logger.debug(f"start to deal {[image_file]} by vlm") + res = extract_image_info_by_vlm(image_file) + if res: + info.append({"image_path": image_file, "image_description": res}) + + with open(os.path.join(image_dir, "image_info.json"), "w", encoding='utf-8') as f: + f.write(json.dumps(info, indent=4, ensure_ascii=False)) + + logger.info(f"extract images info successfully") + + +class RetrievalParam(BaseModel): + knowledge_id: str + query: str + retrieval_setting: Optional[dict] = {"top_k": 3, "score_threshold": 0.5} + + +@app.post("/dify/retrieval") +async def retrieve(arg: RetrievalParam): + logger.info(f"doing retrieval") + + top_k = int(arg.retrieval_setting.get("top_k", 3)) + score_threshold = arg.retrieval_setting.get("score_threshold", 3) + + text_reranker = TEIReranker(url=os.environ.get("reranker_url"), k=top_k, client_param=ClientParam(use_http=True)) + + q_docs = retrieve_similarity_docs(arg.query, top_k, score_threshold) + if text_reranker is not None and len(q_docs) > 0: + score = text_reranker.rerank(arg.query, [doc.page_content for doc in q_docs]) + q_docs = text_reranker.rerank_top_k(q_docs, score) + + records = [] + for doc in q_docs: + records.append({ + "content": doc.page_content, + "score": doc.metadata.get("score", 0), + "title": doc.metadata.get("source", ""), + "metadata": doc.metadata + }) + + return JSONResponse(content={"records": records}) + + +class QueryParam(BaseModel): + knowledge_id: str + query: str + retrieval_setting: Optional[dict] = {"top_k": 3, "score_threshold": 0.5} + + +@app.post("/query") +async def retrieve(arg: QueryParam): + logger.info(f"doing query") + + top_k = int(arg.retrieval_setting.get("top_k", 3)) + score_threshold = arg.retrieval_setting.get("score_threshold", 3) + q_docs = retrieve_similarity_docs(arg.query, top_k, 
+
+
+class QueryParam(BaseModel):
+    knowledge_id: str
+    query: str
+    retrieval_setting: Optional[dict] = {"top_k": 3, "score_threshold": 0.5}
+
+
+@app.post("/query")
+async def query(arg: QueryParam):
+    logger.info("doing query")
+
+    top_k = int(arg.retrieval_setting.get("top_k", 3))
+    score_threshold = arg.retrieval_setting.get("score_threshold", 0.5)
+    q_docs = retrieve_similarity_docs(arg.query, top_k, score_threshold)
+
+    text_reranker = TEIReranker(url=os.environ.get("reranker_url"), k=top_k, client_param=ClientParam(use_http=True))
+
+    if text_reranker is not None:
+        score = text_reranker.rerank(arg.query, [doc.page_content for doc in q_docs])
+        q_docs = text_reranker.rerank_top_k(q_docs, score)
+
+    response = generate_answer(arg.query, q_docs)
+
+    with open("response.md", "w", encoding="utf-8") as f:
+        f.write(response)
+
+    return JSONResponse(content=response)
+
+
+@app.post("/uploadfile")
+async def uploadfile(file: UploadFile):
+    logger.info(f"start to upload file: {file.filename}")
+
+    if not os.path.exists(upload_file_dir):
+        os.makedirs(upload_file_dir)
+
+    try:
+        contents = file.file.read()
+        file_path = os.path.join(upload_file_dir, file.filename)
+        with open(file_path, 'wb') as f:
+            f.write(contents)
+    except Exception as e:
+        logger.error(f"write file {file.filename} failed: {e}")
+        return JSONResponse(status_code=HTTPStatus.MISDIRECTED_REQUEST,
+                            content={"error_info": "Something went wrong"})
+    finally:
+        file.file.close()
+
+    file_obj = Path(file_path)
+
+    if os.environ["parse_image"] == 'True':
+        # Step 1: extract the images from the document into images_store_dir
+        if file_obj.suffix == ".docx":
+            extract_images_from_docx(images_store_dir, file_path)
+        if file_obj.suffix == ".pdf":
+            extract_images_from_pdf(images_store_dir, file_path)
+
+        # Step 2: run the VLM over every extracted image for multi-granularity
+        # understanding; the result is stored in images_store_dir/<file>/image_info.json
+        extract_images_info_by_vlm(images_store_dir, file.filename)
+
+    # Look up the loader and splitter classes for the file type
+    loader_info, splitter_info = get_document_loader_splitter(file_obj.suffix)
+
+    # Get the embedding object
+    emb = get_embedding()
+    # Get the knowledge base management object
+    knowledge_db = get_knowledge_db()
+
+    file_base_name = os.path.basename(file_path)
+
+    # Check whether this file has already been ingested
+    if knowledge_db.check_document_exist(file_base_name):
+        logger.warning(f"file {file_base_name} exists in knowledge db")
+        return JSONResponse(content={"info": f"file {file_base_name} already exists in the knowledge base"})
+
+    # Create the file parser and splitter
+    loader = loader_info.loader_class(file_path=file_obj.as_posix(), **loader_info.loader_params)
+    splitter = splitter_info.splitter_class(**splitter_info.splitter_params)
+    # Parse and split the file
+    docs = loader.load_and_split(splitter)
+
+    # Collect the chunk contents and their metadata
+    texts = [doc.page_content for doc in docs if doc.page_content]
+    meta_data = [{**doc.metadata, "type": "text"} for doc in docs if doc.page_content]
+
+    if file_obj.suffix in [".docx", ".pdf"]:
+        # Directory holding the images extracted from this file
+        file_image_out_dir = os.path.join(images_store_dir, file_base_name)
+
+        # Read the multi-granularity image descriptions
+        try:
+            with open(os.path.join(file_image_out_dir, "image_info.json"), "r", encoding='utf-8') as f:
+                images_description = json.load(f)
+        except Exception as e:
+            logger.warning(f"read image info failed: {e}")
+            images_description = []
+
+        for description in images_description:
+            texts.append(description["image_description"])
+            meta_data.append({"type": "image",
+                              "source": file_path,
+                              "image_path": description.get("image_path")
+                              })
+
+    # Store everything in the chunk and vector databases
+    knowledge_db.add_file(file_obj, texts, {"dense": emb.embed_documents}, meta_data)
+
+    logger.info(f"upload file {file.filename} to knowledge successfully")
+
+    return JSONResponse(content={"info": f"upload file:{file.filename} successfully"})
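+
+
+# Illustrative shape of the records ingested above (values are placeholders):
+#   text chunk:  {"source": "/home/data/report.docx", "type": "text"}
+#   image chunk: {"type": "image", "source": "/home/data/report.docx",
+#                 "image_path": "/home/images/report.docx/image_1_1.png"}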
+
+
+class DeleteFileParam(BaseModel):
+    file_name: str
+
+
+@app.post("/deletefile")
+async def deletefile(file: DeleteFileParam):
+    logger.info(f"start to delete file:{file.file_name}")
+    try:
+        # Delete the document's records from the databases
+        knowledge_db = get_knowledge_db()
+        knowledge_db.delete_file(file.file_name)
+
+        # Delete the file stored during upload
+        os.remove(os.path.join(upload_file_dir, file.file_name))
+
+        # Delete the images extracted from the file
+        shutil.rmtree(os.path.join(images_store_dir, file.file_name))
+
+    except Exception as e:
+        logger.error(f"delete file [{file.file_name}] failed: {e}")
+        return JSONResponse(content=f"delete file [{file.file_name}] failed: {e}")
+
+    return JSONResponse(content=f"delete file [{file.file_name}] successfully")
+
+
+@app.delete("/deleteallfiles")
+async def deleteallfiles():
+    logger.info("start to delete all files")
+    knowledge_db = get_knowledge_db()
+
+    knowledge_db.delete_all()
+
+    vector_store = get_vector_store()
+    chunk_store = get_chunk_store()
+
+    vector_store.drop_collection()
+    chunk_store.drop_collection()
+
+    # Delete the uploaded source files
+    try:
+        shutil.rmtree(upload_file_dir)
+    except Exception as e:
+        logger.info(f"delete {upload_file_dir} failed: {e}")
+
+    return JSONResponse(content="delete all files successfully")
+
+
+@app.get("/listfiles")
+async def listfiles():
+    logger.info("start to list all files")
+    knowledge_db = get_knowledge_db()
+    docs = knowledge_db.get_all_documents()
+    files = [doc.document_name for doc in docs]
+    return JSONResponse(content=files)
+
+
+class QueryFileContentParam(BaseModel):
+    file_name: str
+
+
+@app.post("/query_file_content")
+async def query_file_content(file: QueryFileContentParam):
+    logger.info(f"start to query file:{file.file_name}")
+
+    doc_id = 0
+    knowledge_db = get_knowledge_db()
+    documents = knowledge_db.get_all_documents()
+    for doc in documents:
+        if doc.document_name == file.file_name:
+            doc_id = doc.document_id
+            break
+    if not doc_id:
+        logger.error(f"there is no {file.file_name} in db")
+        return JSONResponse(content="query file content failed")
+
+    chunk_store = get_chunk_store()
+    chunks = chunk_store.search_by_document_id(doc_id)
+    return JSONResponse(content=[{"page_content": chunk.page_content, "metadata": chunk.metadata} for chunk in chunks])
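+
+
+# Illustrative request/response for the endpoint above (file name is a placeholder):
+#   POST /query_file_content  {"file_name": "report.docx"}
+#   -> [{"page_content": "...", "metadata": {"type": "text", ...}}, ...]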
parser.add_argument("--milvus_url", type=str, default="http://127.0.0.1:19530", help="milvus数据库服务地址") + parser.add_argument("--knowledge_name", type=str, default="test", + help="设置知识库名") + parser.add_argument("--parse_image", action='store_true', help="是否解析图片信息") + + args = parser.parse_args().__dict__ + os.environ["embedding_dim"] = str(args.pop('embedding_dim')) + os.environ["llm_base_url"] = args.pop('llm_base_url') + os.environ["vlm_base_url"] = args.pop('vlm_base_url') + os.environ["llm_model_name"] = args.pop('llm_model_name') + os.environ["vlm_model_name"] = args.pop('vlm_model_name') + os.environ["milvus_url"] = args.pop('milvus_url') + os.environ["embedding_url"] = args.pop('embedding_url') + os.environ["reranker_url"] = args.pop('reranker_url') + os.environ["knowledge_name"] = args.pop('knowledge_name') + os.environ["parse_image"] = str(args.pop('parse_image')) + + uvicorn.run(app, host=args.get("host"), + port=int(args.get("port")), + ssl_keyfile=args.get("ssl_keyfile", None), + ssl_certfile=args.get("ssl_certfile", None), + ssl_keyfile_password=args.get("ssl_keyfile_password", None), + ssl_ca_certs=args.get("ssl_ca_certs", None), + ssl_cert_reqs=args.get("ssl_cert_reqs", None)) + + +if __name__ == "__main__": + main()