From efa63a870aac068d1c3b6edc27bfd26f83f38c4d Mon Sep 17 00:00:00 2001
From: tanxing <eternaldwellers@gmail.com>
Date: Thu, 14 Aug 2025 14:23:58 +0800
Subject: [PATCH 1/3] =?UTF-8?q?fix:=20=E5=89=8D=E7=AB=AF=E5=8A=A0=E8=BD=BD?=
 =?UTF-8?q?=E6=9C=AC=E5=9C=B0=E6=96=87=E4=BB=B6=E6=97=B6=E4=BF=AE=E6=94=B9?=
 =?UTF-8?q?=E4=B8=BA=E9=BB=98=E8=AE=A4force=5Frebuild=20chore:=20=E8=B0=83?=
 =?UTF-8?q?=E6=95=B4=E6=8F=90=E7=A4=BA=E8=AF=8D=20chore:=20=E8=B0=83?=
 =?UTF-8?q?=E6=95=B4=E5=90=91=E9=87=8F=E6=A3=80=E7=B4=A2=E7=9A=84top=5Fk?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 deepsearcher/agent/deep_search.py      | 49 ++++++++------
 deepsearcher/templates/html/index.html |  4 +-
 deepsearcher/templates/index.html      | 88 --------------------------
 deepsearcher/vector_db/milvus.py       |  4 +-
 main.py                                |  6 +-
 5 files changed, 38 insertions(+), 113 deletions(-)
 delete mode 100644 deepsearcher/templates/index.html
diff --git a/deepsearcher/agent/deep_search.py b/deepsearcher/agent/deep_search.py
index 3d6fdb6..9a5d75a 100644
--- a/deepsearcher/agent/deep_search.py
+++ b/deepsearcher/agent/deep_search.py
@@ -23,9 +23,11 @@ COLLECTION_ROUTE_PROMPT = """
 
 SUB_QUERY_PROMPT = """
 为了能够全面的回答这个问题，请你尝试把原本的问题拆分或扩展为几个子问题
-不可以太多，但是也不可以太少，请根据问题复杂程度来决定子问题的数量
+请你使用自顶向下和自底向上两种方向来思考如何拆分问题
+子问题的数量不可以太多，但是也不可以太少，应当保证问题的回答全面性，请根据问题复杂程度来决定子问题的数量
 如果原问题本身非常简单，没有必要进行拆分，则保留输出原问题本身
-需要保证每个子问题都具体、清晰、不可分（原子性），最终返回一个字符串列表
+需要保证每个子问题都具体、清晰、不可分（原子性，即不可以再包含更细分的子问题），子问题中不要包含"请你回答"、"请你总结"、"请你分析"等祈使类型词语
+你需要最终返回一个字符串列表
 
 原问题: {original_query}
 
@@ -49,8 +51,8 @@ SUB_QUERY_PROMPT = """
 
 
 RERANK_PROMPT = """
-根据当前的问题和获取到的文档片段
-请你对当前获取到的文档是否能帮助回答这个问题（直接或间接，全面或部分，都可以）给出一个快速判断
+根据当前的问题和获取到的文档片段（文档片段包裹都在<reference></reference>和<chunk></chunk>标签中并有对应的id）
+请你对当前获取到的文档是否能帮助回答这个问题（直接或间接、全面或部分，都可以）给出一个快速判断
 对于每一个文档片段，你只应该返回"YES"或者"NO"（需要注意顺序和数量）
 
 问题: {query}
@@ -58,17 +60,18 @@ RERANK_PROMPT = """
 检索到的文档片段:
 {chunks}
 
-例如，给定4个chunks（实际检索到的文档片段不一定是4个），返回: ["YES", "NO", "YES", "YES"]
+例如，假如给出4个chunks（实际检索到的文档片段不一定是这么多），返回4个"YES"或者"NO"（注意这只是一个示例，不代表实际判断）: ["YES", "NO", "YES", "YES"]
 使用的语言与问题相同
 你需要返回的是 a python list of str without any addtional content:
 """
 
 
 REFLECT_PROMPT = """
-根据原问题和子问题，以及获取到的文档片段，请你决定是否要生成更多的问题。
-如果已经获得的文档片段没能覆盖所有的子问题，这意味着这些文档无法被检索到。
-你可以尝试生成相似但些许不同的问题来尝试重新检索，但是也可以根据获得到的文档片段进行批评思考，生成新的问题来保证原问题的回答的准确和全面
-如果没有真的必要继续研究（取决于你的判断），返回一个空列表
+根据原问题和子问题，以及获取到的文档片段，请你决定是否要生成更多的问题，这些问题将被用于后续的思考和搜索。
+你应该根据已经获得到的文档片段进行批评思考，生成其他新的问题来保证原问题的回答的准确和全面。
+如果已经获得的文档片段没能覆盖所有的子问题，这意味着有关这些问题的文档无法被检索到，你应该根据你自己的知识补充思考。
+需要保证每个新的问题都具体、清晰、不可分（原子性）并且不可以和之前的问题重复，新的问题中不要包含"请你回答"、"请你总结"、"请你分析"等祈使类型词语
+如果没有真的必要继续研究（取决于你的判断），返回一个空列表。
 
 原问题: {original_query}
 
@@ -83,24 +86,34 @@ REFLECT_PROMPT = """
 
 
 SUMMARY_PROMPT = """
-你是一个内容分析专家，请你根据提供的问题和检索到的信息生成详尽的长文回答。
-如果检索到的信息不足以回答问题或者必须添加额外信息才能能回答，你应该使用你的知识来进行补充，
-这种情况下，你自己提供的信息需要使用例如"your knowledge here[^0]"引用，注意，这里的"[^0]"的序号0是固定的，表示你的知识，下文当中有文末引用的例子
-同时，你应该根据提供的信息生成文内引用和文末参考资料列表，来自文档切片的reference引用从[^1]开始
-如果多个片段是相同的来源或者一个片段可以回答多个问题，文内引用可以引用多次，但文末只引用一次来源，即文末的引用列表中不能有重复的来源。
+你是一个内容分析专家，请你根据提供的问题和检索到的信息生成详尽的、有逻辑的长文回答。
+同时，你应该根据提供的信息生成文内引用和文末参考资料列表，使用markdown脚注。
+如果检索到的信息不足以回答问题或者必须添加额外信息才能回答，你应该使用你的知识来进行补充，
+这种情况下，你自己提供的信息需要使用例如"your knowledge here[^0]"引用。
+注意，这里的"[^0]"的序号0是固定的，表示你的知识，文末引用使用"[^0]: AI 生成",
+来自<chunk><reference>的引用序号从[^1]开始，来源需要与前文<reference>中的href一致，不需要对每个<chunk>分配一个引用，而是相同<reference>的<chunk>共用一个引用
+另外，如果回答的内容文内引用需要引用多个<reference>，请添加多个[^index]到句尾。
+如果多个片段是相同的来源或者一个片段可以回答多个问题，文内引用可以引用多次，但文末只引用一次来源，即文末的引用列表中不能有重复。
 
 例子:
 <EXAMPLE>
 
-文内引用示例（使用markdown脚注）:
+文内引用示例:
 "XGBoost是非常强大的集成学习模型[^2]"
-(必须使用 "[^index]"，这里的index是对应的<reference>的id)
 
 
-文末引用示例 (需要与前文reference的href一致，不需要对每个chunk分配一个引用，而是每一个referecen共用一个引用):
-[^0]: AI Generated
+文末引用示例:
+正确例子：
+[^0]: AI 生成
+[^1]: files/docs/machine_learning.md
 [^2]: files/docs/chap_001_003_models.md
 
+错误例子：
+[^0]: AI 生成
+[^1]: files/docs/machine_learning.md
+[^2]: files/docs/chap_001_003_models.md
+[^3]: files/docs/chap_001_003_models.md（错误，这是重复引用）
+
 </EXAMPLE>
 
 原问题: {original_query}
diff --git a/deepsearcher/templates/html/index.html b/deepsearcher/templates/html/index.html
index f9591d0..00a7803 100644
--- a/deepsearcher/templates/html/index.html
+++ b/deepsearcher/templates/html/index.html
@@ -33,7 +33,7 @@
             </div>
 
             <div class="card">
-                <h2 class="card-title">网站内容加载</h2>
+                <h2 class="card-title">网站加载</h2>
                 <div class="form-group">
                     <label for="websiteUrls">网站URL（多个URL用逗号分隔）</label>
                     <input type="text" id="websiteUrls" placeholder="例如: https://example.com/page1,https://example.com/page2">
@@ -46,7 +46,7 @@
                     <label for="webCollectionDesc">集合描述（可选）</label>
                     <textarea id="webCollectionDesc" rows="2" placeholder="例如: 来自网站的内容"></textarea>
                 </div>
-                <button id="loadWebsiteBtn">加载网站内容</button>
+                <button id="loadWebsiteBtn">加载网站</button>
                 <div id="webLoadStatus" class="status"></div>
             </div>
 
diff --git a/deepsearcher/templates/index.html b/deepsearcher/templates/index.html
deleted file mode 100644
index 20af32f..0000000
--- a/deepsearcher/templates/index.html
+++ /dev/null
@@ -1,88 +0,0 @@
-<!DOCTYPE html>
-<html lang="zh">
-<head>
-    <meta charset="UTF-8">
-    <meta name="viewport" content="width=device-width, initial-scale=1.0">
-    <title>DeepSearcher - 智能搜索系统</title>
-    <link rel="stylesheet" href="static/css/styles.css">
-</head>
-<body>
-    <div class="container">
-        <header>
-            <h1>DeepSearcher 智能搜索系统</h1>
-            <p class="app-description">基于大型语言模型和向量数据库的企业知识管理系统，支持私有数据搜索和在线内容整合，提供准确答案和综合报告。</p>
-        </header>
-
-        <main>
-            <div class="card">
-                <h2 class="card-title">文件加载</h2>
-                <div class="form-group">
-                    <label for="filePaths">文件路径（多个路径用逗号分隔）</label>
-                    <input type="text" id="filePaths" placeholder="例如: /path/to/file1.pdf,/path/to/file2.txt">
-                </div>
-                <div class="form-group">
-                    <label for="collectionName">集合名称</label>
-                    <input type="text" id="collectionName" placeholder="例如: my_collection">
-                </div>
-                <div class="form-group">
-                    <label for="collectionDesc">集合描述</label>
-                    <textarea id="collectionDesc" rows="2" placeholder="例如: 这是一个测试集合"></textarea>
-                </div>
-                <button id="loadFilesBtn">加载文件</button>
-                <div id="loadStatus" class="status"></div>
-            </div>
-
-            <div class="card">
-                <h2 class="card-title">网站加载</h2>
-                <div class="form-group">
-                    <label for="websiteUrls">网站URL（多个URL用逗号分隔）</label>
-                    <input type="text" id="websiteUrls" placeholder="例如: https://example.com/page1,https://example.com/page2">
-                </div>
-                <div class="form-group">
-                    <label for="webCollectionName">集合名称</label>
-                    <input type="text" id="webCollectionName" placeholder="例如: web_collection">
-                </div>
-                <div class="form-group">
-                    <label for="webCollectionDesc">集合描述</label>
-                    <textarea id="webCollectionDesc" rows="2" placeholder="例如: 来自网站的内容"></textarea>
-                </div>
-                <button id="loadWebsiteBtn">加载网站</button>
-                <div id="webLoadStatus" class="status"></div>
-            </div>
-
-            <div class="card">
-                <h2 class="card-title">智能查询</h2>
-                <div class="form-group">
-                    <label for="queryText">请输入您的问题</label>
-                    <textarea id="queryText" rows="3" placeholder="例如: 请生成一份关于人工智能发展趋势的报告"></textarea>
-                </div>
-                <div class="form-group">
-                    <label for="maxIter">最大迭代次数 (1-10)</label>
-                    <input type="number" id="maxIter" min="1" max="10" value="3">
-                </div>
-                <button id="queryBtn">执行查询</button>
-                <button id="clearMessagesBtn" style="margin-left: 10px; background-color: var(--text-secondary);">清空消息</button>
-                <div id="queryStatus" class="status"></div>
-                
-                <div id="queryResult" class="result-container">
-                    <h3>查询结果:</h3>
-                    <div class="query-result" id="resultText"></div>
-                </div>
-                
-                <div id="processResult" class="result-container">
-                    <h3>处理过程:</h3>
-                    <div id="messageStream" class="message-stream">
-                        <div class="message-container" id="messageContainer"></div>
-                    </div>
-                </div>
-            </div>
-        </main>
-
-        <footer>
-            <p>DeepSearcher © 2025 | 企业知识管理与智能问答系统</p>
-        </footer>
-    </div>
-
-    <script src="static/js/app.js"></script>
-</body>
-</html>
\ No newline at end of file
diff --git a/deepsearcher/vector_db/milvus.py b/deepsearcher/vector_db/milvus.py
index 720bef9..2376b22 100644
--- a/deepsearcher/vector_db/milvus.py
+++ b/deepsearcher/vector_db/milvus.py
@@ -152,7 +152,7 @@ class Milvus(BaseVectorDB):
         self,
         collection: str,
         vector: np.ndarray | list[float],
-        top_k: int = 3,
+        top_k: int = 4,
         query_text: str = None,
         *args,
         **kwargs,
@@ -163,7 +163,7 @@ class Milvus(BaseVectorDB):
         Args:
             collection (Optional[str]): Collection name. If None, uses default_collection.
             vector (Union[np.array, List[float]]): Query vector for similarity search.
-            top_k (int, optional): Number of results to return. Defaults to 5.
+            top_k (int, optional): Number of results to return. Defaults to 4.
             query_text (Optional[str], optional): Original query text for hybrid search. Defaults to None.
             *args: Variable length argument list.
             **kwargs: Arbitrary keyword arguments.
diff --git a/main.py b/main.py
index e9e5eda..d30f423 100644
--- a/main.py
+++ b/main.py
@@ -112,7 +112,7 @@ def load_files(
         examples=[256],
     ),
     force_rebuild: bool = Body(
-        False,
+        True,
         description="Whether to force rebuild the collection if it already exists.",
         examples=[False],
     ),
@@ -141,7 +141,7 @@ def load_files(
             batch_size=batch_size if batch_size is not None else 8,
             force_rebuild=force_rebuild,
         )
-        return {"message": "Files loaded successfully."}
+        return {"message": "成功加载文档"}
     except Exception as e:
         raise HTTPException(status_code=500, detail=str(e))
 
@@ -198,7 +198,7 @@ def load_website(
             batch_size=batch_size if batch_size is not None else 8,
             force_rebuild=force_rebuild,
         )
-        return {"message": "Website loaded successfully."}
+        return {"message": "成功加载网址"}
     except Exception as e:
         raise HTTPException(status_code=500, detail=str(e))
 

From 7ae94654efaf359d1178ee2b2da249c11077e2b4 Mon Sep 17 00:00:00 2001
From: tanxing <eternaldwellers@gmail.com>
Date: Thu, 14 Aug 2025 18:03:45 +0800
Subject: [PATCH 2/3] =?UTF-8?q?chore:=20=E4=BC=98=E5=8C=96=E5=9B=9E?=
 =?UTF-8?q?=E7=AD=94=E7=94=9F=E6=88=90=20chore:=20=E4=BC=98=E5=8C=96milvus?=
 =?UTF-8?q?=E9=85=8D=E7=BD=AE=20chore:=20=E4=BC=98=E5=8C=96HTML=E6=A8=A1?=
 =?UTF-8?q?=E6=9D=BF=20refactor:=20=E4=BC=98=E5=8C=96=E5=8F=82=E6=95=B0?=
 =?UTF-8?q?=E4=BC=A0=E9=80=92?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 deepsearcher/agent/deep_search.py       | 55 ++++++++++++++-----------
 deepsearcher/config.yaml                |  6 +--
 deepsearcher/llm/openai_llm.py          |  4 +-
 deepsearcher/online_query.py            |  3 +-
 deepsearcher/templates/html/index.html  |  4 +-
 deepsearcher/templates/static/js/app.js |  4 +-
 docs/intro_docs/milvus_benchmark.md     | 16 ++++---
 main.py                                 |  8 ++--
 test.py                                 |  4 +-
 9 files changed, 59 insertions(+), 45 deletions(-)

diff --git a/deepsearcher/agent/deep_search.py b/deepsearcher/agent/deep_search.py
index 9a5d75a..0e35e77 100644
--- a/deepsearcher/agent/deep_search.py
+++ b/deepsearcher/agent/deep_search.py
@@ -38,9 +38,10 @@ SUB_QUERY_PROMPT = """
 示例输出（例子中的数量不是要求）:
 [
     "什么是机器学习?",
-    "机器学习的使用目的是什么?",
-    "机器学习和深度学习的区别是什么？",
-    "机器学习的历史演进过程？"
+    "机器学习的使用目的",
+    "机器学习的常用算法",
+    "机器学习的历史演进过程",
+    "机器学习和深度学习的区别是什么？"
 ]
 
 </EXAMPLE>
@@ -51,16 +52,16 @@ SUB_QUERY_PROMPT = """
 
 
 RERANK_PROMPT = """
-根据当前的问题和获取到的文档片段（文档片段包裹都在<reference></reference>和<chunk></chunk>标签中并有对应的id）
-请你对当前获取到的文档是否能帮助回答这个问题（直接或间接、全面或部分，都可以）给出一个快速判断
-对于每一个文档片段，你只应该返回"YES"或者"NO"（需要注意顺序和数量）
+根据当前的问题和获取到的文档片段（文档片段包裹都在<reference></reference>和<chunk></chunk>标签中并有对应的连续的id）
+请你对当前获取到的文档片段是否能帮助回答这个问题（直接或间接、全面或部分，都可以，但需要有实际有效内容）给出一个快速判断
+对于每一个文档片段，你只应该返回"True"或者"False"（需要注意顺序和数量）
 
 问题: {query}
 
 检索到的文档片段:
 {chunks}
 
-例如，假如给出4个chunks（实际检索到的文档片段不一定是这么多），返回4个"YES"或者"NO"（注意这只是一个示例，不代表实际判断）: ["YES", "NO", "YES", "YES"]
+例如，假如给出4个chunks（实际检索到的文档片段不一定是这么多），返回4个"True"或者"False"（注意这只是一个示例，不代表实际判断）: ["True", "False", "True", "True"]
 使用的语言与问题相同
 你需要返回的是 a python list of str without any addtional content:
 """
@@ -68,7 +69,7 @@ RERANK_PROMPT = """
 
 REFLECT_PROMPT = """
 根据原问题和子问题，以及获取到的文档片段，请你决定是否要生成更多的问题，这些问题将被用于后续的思考和搜索。
-你应该根据已经获得到的文档片段进行批评思考，生成其他新的问题来保证原问题的回答的准确和全面。
+你应该根据已经获得到的文档片段进行批评思考，生成其他新的问题来保证原问题的回答的准确和全面，请你使用自顶向下和自底向上两种方向来思考如何生成新问题。
 如果已经获得的文档片段没能覆盖所有的子问题，这意味着有关这些问题的文档无法被检索到，你应该根据你自己的知识补充思考。
 需要保证每个新的问题都具体、清晰、不可分（原子性）并且不可以和之前的问题重复，新的问题中不要包含"请你回答"、"请你总结"、"请你分析"等祈使类型词语
 如果没有真的必要继续研究（取决于你的判断），返回一个空列表。
@@ -86,12 +87,13 @@ REFLECT_PROMPT = """
 
 
 SUMMARY_PROMPT = """
-你是一个内容分析专家，请你根据提供的问题和检索到的信息生成详尽的、有逻辑的长文回答。
+你是一个内容分析专家，请你根据提供的问题和检索到的信息，生成详细、层次分明、尽可能长的回答。
+如果检索到的信息不足以回答问题，你应该使用你的知识来进行扩展补充。
+注意，不要一个子问题一个子问题的回答，而是应该仔细分析子问题之间的关系、子问题和原问题之间的关系。
 同时，你应该根据提供的信息生成文内引用和文末参考资料列表，使用markdown脚注。
-如果检索到的信息不足以回答问题或者必须添加额外信息才能回答，你应该使用你的知识来进行补充，
-这种情况下，你自己提供的信息需要使用例如"your knowledge here[^0]"引用。
+对于你自己提供的信息，需要使用"your knowledge here[^0]"的形式引用。
 注意，这里的"[^0]"的序号0是固定的，表示你的知识，文末引用使用"[^0]: AI 生成",
-来自<chunk><reference>的引用序号从[^1]开始，来源需要与前文<reference>中的href一致，不需要对每个<chunk>分配一个引用，而是相同<reference>的<chunk>共用一个引用
+来自<chunk><reference>的引用序号从[^1]开始，来源需要与前文<reference>中的"href"一致，不需要对每个<chunk>分配一个引用，而是相同<reference>的<chunk>共用一个引用
 另外，如果回答的内容文内引用需要引用多个<reference>，请添加多个[^index]到句尾。
 如果多个片段是相同的来源或者一个片段可以回答多个问题，文内引用可以引用多次，但文末只引用一次来源，即文末的引用列表中不能有重复。
 
@@ -110,9 +112,10 @@ SUMMARY_PROMPT = """
 
 错误例子：
 [^0]: AI 生成
-[^1]: files/docs/machine_learning.md
-[^2]: files/docs/chap_001_003_models.md
+[^1]: files/docs/chap_001_003_models.md
+[^2]: files/docs/machine_learning.md
 [^3]: files/docs/chap_001_003_models.md（错误，这是重复引用）
+[^4]: files/docs/machine_learning.md（错误，这也是重复引用）
 
 </EXAMPLE>
 
@@ -275,14 +278,14 @@ class DeepSearch(BaseAgent):
                 relevance_list = self.llm.literal_eval(content)
                 if not isinstance(relevance_list, list):
                     raise ValueError("Response is not a list")
-            except (ValueError, SyntaxError):
+            except Exception as _:
                 # Fallback: if parsing fails, treat all chunks as relevant
                 log.color_print(f"Warning: Failed to parse relevance response. Treating all chunks as relevant. Response was: {content}")
-                relevance_list = ["YES"] * len(retrieved_results)
+                relevance_list = ["True"] * len(retrieved_results)
 
             # Ensure we have enough relevance judgments for all chunks
             while len(relevance_list) < len(retrieved_results):
-                relevance_list.append("YES")  # Default to relevant if no judgment provided
+                relevance_list.append("True")  # Default to relevant if no judgment provided
 
             # Filter relevant chunks based on LLM response
             accepted_chunk_num = 0
@@ -291,9 +294,9 @@ class DeepSearch(BaseAgent):
                 # Check if we have a relevance judgment for this chunk
                 is_relevant = (
                     i < len(relevance_list) and
-                    "YES" in relevance_list[i].upper() and
-                    "NO" not in relevance_list[i].upper()) if i < len(relevance_list
-                ) else True
+                    "True" in relevance_list[i] and
+                    "False" not in relevance_list[i]
+                ) if i < len(relevance_list) else True
 
                 if is_relevant:
                     all_retrieved_results.append(retrieved_result)
@@ -427,12 +430,16 @@ class DeepSearch(BaseAgent):
         chunks = []
         chunk_count = 0
         for i, reference in enumerate(references):
-            formated = f"<reference id='{i + 1}' href='{reference}'>\n" + "".join(
+            formated = "".join(
                 [
-                    f"<chunk id='{j + 1 + chunk_count}'>\n{chunk}\n</chunk id='{j + 1 + chunk_count}'>\n"
-                    for j, chunk in enumerate(references[reference])
+                    (
+                        f"<reference id='{i + 1}' href='{reference}'>" +
+                        f"<chunk id='{j + 1 + chunk_count}'>\n{chunk}\n</chunk id='{j + 1 + chunk_count}'>" +
+                        f"</reference id='{i + 1}'>\n"
+                    )
+                        for j, chunk in enumerate(references[reference])
                 ]
-            ) + f"</reference id='{i + 1}'>\n"
+            )
             print(formated)
             chunks.append(formated)
             chunk_count += len(references[reference])
diff --git a/deepsearcher/config.yaml b/deepsearcher/config.yaml
index fef4343..e560153 100644
--- a/deepsearcher/config.yaml
+++ b/deepsearcher/config.yaml
@@ -2,7 +2,7 @@ provide_settings:
   llm:
     provider: "OpenAILLM"
     config:
-      model: "Qwen/Qwen3-30B-A3B-Thinking-2507"
+      model: "Qwen/Qwen3-32B"
       api_key: "sk-fpzwvagjkhwysjsozfybvtjzongatcwqdihdxzuijnfdrjzt"
       base_url: "https://api.siliconflow.cn/v1"
 
@@ -83,5 +83,5 @@ query_settings:
   max_iter: 3
 
 load_settings:
-  chunk_size: 1024
-  chunk_overlap: 512
+  chunk_size: 4096
+  chunk_overlap: 1024
diff --git a/deepsearcher/llm/openai_llm.py b/deepsearcher/llm/openai_llm.py
index 1af6046..e5edf6d 100644
--- a/deepsearcher/llm/openai_llm.py
+++ b/deepsearcher/llm/openai_llm.py
@@ -48,9 +48,9 @@ class OpenAILLM(BaseLLM):
             model=self.model,
             messages=messages,
             stream=True,
-            temperature=0.6,
+            temperature=0.7,
             top_p=0.8,
-            presence_penalty=1.2
+            presence_penalty=1.3
         ) as stream:
             # stream到控制台测试
             content = ""
diff --git a/deepsearcher/online_query.py b/deepsearcher/online_query.py
index 096124a..48203a5 100644
--- a/deepsearcher/online_query.py
+++ b/deepsearcher/online_query.py
@@ -3,7 +3,7 @@ from deepsearcher import configuration
 from deepsearcher.vector_db.base import RetrievalResult
 
 
-def query(original_query: str, max_iter: int | None = None) -> tuple[str, list[RetrievalResult]]:
+def query(original_query: str, **kwargs) -> tuple[str, list[RetrievalResult]]:
     """
     Query the knowledge base with a question and get an answer.
 
@@ -20,6 +20,7 @@ def query(original_query: str, max_iter: int | None = None) -> tuple[str, list[R
             - A list of retrieval results that were used to generate the answer
     """
     default_searcher = configuration.default_searcher
+    max_iter = kwargs.get("max_iter", 3)
     return default_searcher.query(original_query, max_iter=max_iter)
 
 
diff --git a/deepsearcher/templates/html/index.html b/deepsearcher/templates/html/index.html
index 00a7803..c716062 100644
--- a/deepsearcher/templates/html/index.html
+++ b/deepsearcher/templates/html/index.html
@@ -10,7 +10,7 @@
     <div class="container">
         <header>
             <h1>DeepSearcher 智能搜索系统</h1>
-            <p class="app-description">基于大型语言模型和向量数据库的企业知识管理系统，支持私有数据搜索和在线内容整合，提供准确答案和综合报告。</p>
+            <p class="app-description">基于大型语言模型和向量数据库的知识管理系统，支持私有数据搜索和在线内容整合，提供准确答案和综合报告。</p>
         </header>
 
         <main>
@@ -54,7 +54,7 @@
                 <h2 class="card-title">智能查询</h2>
                 <div class="form-group">
                     <label for="queryText">请输入您的问题</label>
-                    <textarea id="queryText" rows="3" placeholder="例如: 请生成一份关于人工智能发展趋势的报告"></textarea>
+                    <textarea id="queryText" rows="3" placeholder="例如: 请生成一份关于Milvus向量数据库的详细报告"></textarea>
                 </div>
                 <div class="form-group">
                     <label for="maxIter">最大迭代次数 (1-10)</label>
diff --git a/deepsearcher/templates/static/js/app.js b/deepsearcher/templates/static/js/app.js
index d13cbd2..8a750cb 100644
--- a/deepsearcher/templates/static/js/app.js
+++ b/deepsearcher/templates/static/js/app.js
@@ -250,7 +250,7 @@ document.getElementById('loadFilesBtn').addEventListener('click', async function
     const filePaths = filePathsInput.split(',').map(path => path.trim()).filter(path => path);
     
     setButtonLoading(button, true);
-    showStatus('loadStatus', '正在加载文件...', 'loading');
+    showStatus('loadStatus', ' 正在加载文件...', 'loading');
     hideResult();
     hideProcessResult();
     
@@ -330,7 +330,7 @@ document.getElementById('loadWebsiteBtn').addEventListener('click', async functi
     const urls = urlsInput.split(',').map(url => url.trim()).filter(url => url);
     
     setButtonLoading(button, true);
-    showStatus('webLoadStatus', '正在加载网站内容...', 'loading');
+    showStatus('webLoadStatus', ' 正在加载网站...', 'loading');
     hideResult();
     hideProcessResult();
     
diff --git a/docs/intro_docs/milvus_benchmark.md b/docs/intro_docs/milvus_benchmark.md
index 66bdefd..b1e24e5 100644
--- a/docs/intro_docs/milvus_benchmark.md
+++ b/docs/intro_docs/milvus_benchmark.md
@@ -24,7 +24,13 @@
 
 
 
-<details style="box-sizing: inherit; margin: 8px 0px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline; display: block; line-height: 1.4em; color: rgb(25, 25, 25); font-family: Geist, Inter, &quot;Geist Mono&quot;, SourceCodePro, &quot;serif&quot;; font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal; font-weight: 400; letter-spacing: normal; orphans: 2; text-align: start; text-indent: 0px; text-transform: none; widows: 2; word-spacing: 0px; -webkit-text-stroke-width: 0px; white-space: normal; background-color: rgb(255, 255, 255); text-decoration-thickness: initial; text-decoration-style: initial; text-decoration-color: initial;"><summary style="box-sizing: inherit; margin: 0px 0px 8px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline; cursor: pointer; color: rgb(25, 25, 25);">点击查看测试中使用的术语详情</summary><table class="terminology" style="box-sizing: inherit; margin: 24px 0px; padding: 0px; border: 1px solid rgb(236, 236, 238); font-size: 16px; vertical-align: baseline; border-collapse: collapse; border-spacing: 0px; overflow-x: auto; width: 886px; border-radius: 12px; display: block; hyphens: none;"><thead style="box-sizing: inherit; margin: 0px; padding: 12px; border-width: 0px 0px 1px; border-top-style: initial; border-right-style: initial; border-bottom-style: solid; border-left-style: initial; border-top-color: initial; border-right-color: initial; border-bottom-color: rgb(238, 238, 238); border-left-color: initial; border-image: initial; font-size: 16px; vertical-align: baseline; line-height: 22px; text-align: left; min-width: 100%; width: calc(-32px + 100vw);"><tr style="box-sizing: inherit; margin: 0px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline;"><th style="box-sizing: inherit; margin: 0px; padding: 10px 20px; border-width: 0px 1px 0px 0px; border-top-style: initial; border-right-style: solid; border-bottom-style: initial; border-left-style: initial; border-top-color: 
initial; border-right-color: rgb(236, 236, 238); border-bottom-color: initial; border-left-color: initial; border-image: initial; font-size: 16px; vertical-align: baseline; line-height: 1.5; font-weight: 600; text-align: left !important;"></th><th style="box-sizing: inherit; margin: 0px; padding: 10px 20px; border: 0px; font-size: 16px; vertical-align: baseline; line-height: 1.5; font-weight: 600; text-align: left !important;"></th></tr></thead><tbody style="box-sizing: inherit; margin: 0px; padding: 12px; border: 0px; font-size: 14px; vertical-align: baseline; line-height: 1.4em; text-align: left; font-weight: 400;"><tr style="box-sizing: inherit; margin: 0px; padding: 0px; border-width: 0px 0px 1px; border-top-style: initial; border-right-style: initial; border-bottom-style: solid; border-left-style: initial; border-top-color: initial; border-right-color: initial; border-bottom-color: rgb(236, 236, 238); border-left-color: initial; border-image: initial; font-size: 14px; vertical-align: baseline;"><td style="box-sizing: inherit; margin: 0px; padding: 10px 20px; border-width: 0px 1px 0px 0px; border-top-style: initial; border-right-style: solid; border-bottom-style: initial; border-left-style: initial; border-top-color: initial; border-right-color: rgb(236, 236, 238); border-bottom-color: initial; border-left-color: initial; border-image: initial; font-size: 14px; vertical-align: text-top; line-height: 1.5; width: calc(-32px + 100vw); font-weight: 500; color: rgb(102, 113, 118); text-align: left !important;"></td><td style="box-sizing: inherit; margin: 0px; padding: 10px 20px; border: 0px; font-size: 14px; vertical-align: text-top; line-height: 1.5; width: calc(-32px + 100vw); font-weight: 500; color: rgb(102, 113, 118); text-align: left !important;"></td></tr><tr style="box-sizing: inherit; margin: 0px; padding: 0px; border-width: 0px 0px 1px; border-top-style: initial; border-right-style: initial; border-bottom-style: solid; border-left-style: initial; 
border-top-color: initial; border-right-color: initial; border-bottom-color: rgb(236, 236, 238); border-left-color: initial; border-image: initial; font-size: 14px; vertical-align: baseline;"><td style="box-sizing: inherit; margin: 0px; padding: 10px 20px; border-width: 0px 1px 0px 0px; border-top-style: initial; border-right-style: solid; border-bottom-style: initial; border-left-style: initial; border-top-color: initial; border-right-color: rgb(236, 236, 238); border-bottom-color: initial; border-left-color: initial; border-image: initial; font-size: 14px; vertical-align: text-top; line-height: 1.5; width: calc(-32px + 100vw); font-weight: 500; color: rgb(102, 113, 118); text-align: left !important;"></td><td style="box-sizing: inherit; margin: 0px; padding: 10px 20px; border: 0px; font-size: 14px; vertical-align: text-top; line-height: 1.5; width: calc(-32px + 100vw); font-weight: 500; color: rgb(102, 113, 118); text-align: left !important;"></td></tr><tr style="box-sizing: inherit; margin: 0px; padding: 0px; border-width: 0px 0px 1px; border-top-style: initial; border-right-style: initial; border-bottom-style: solid; border-left-style: initial; border-top-color: initial; border-right-color: initial; border-bottom-color: rgb(236, 236, 238); border-left-color: initial; border-image: initial; font-size: 14px; vertical-align: baseline;"><td style="box-sizing: inherit; margin: 0px; padding: 10px 20px; border-width: 0px 1px 0px 0px; border-top-style: initial; border-right-style: solid; border-bottom-style: initial; border-left-style: initial; border-top-color: initial; border-right-color: rgb(236, 236, 238); border-bottom-color: initial; border-left-color: initial; border-image: initial; font-size: 14px; vertical-align: text-top; line-height: 1.5; width: calc(-32px + 100vw); font-weight: 500; color: rgb(102, 113, 118); text-align: left !important;"></td><td style="box-sizing: inherit; margin: 0px; padding: 10px 20px; border: 0px; font-size: 14px; vertical-align: 
text-top; line-height: 1.5; width: calc(-32px + 100vw); font-weight: 500; color: rgb(102, 113, 118); text-align: left !important;"><a href="https://milvus.io/docs/v2.2.x/index.md" style="box-sizing: inherit; margin: 0px; padding: 0px; border: 0px; font-size: 14px; vertical-align: baseline; text-decoration: none; color: rgb(102, 113, 118); text-underline-position: from-font; transition: background-color 0.1s linear; hyphens: none; font-weight: 400;"></a></td></tr><tr style="box-sizing: inherit; margin: 0px; padding: 0px; border-width: 0px 0px 1px; border-top-style: initial; border-right-style: initial; border-bottom-style: solid; border-left-style: initial; border-top-color: initial; border-right-color: initial; border-bottom-color: rgb(236, 236, 238); border-left-color: initial; border-image: initial; font-size: 14px; vertical-align: baseline;"><td style="box-sizing: inherit; margin: 0px; padding: 10px 20px; border-width: 0px 1px 0px 0px; border-top-style: initial; border-right-style: solid; border-bottom-style: initial; border-left-style: initial; border-top-color: initial; border-right-color: rgb(236, 236, 238); border-bottom-color: initial; border-left-color: initial; border-image: initial; font-size: 14px; vertical-align: text-top; line-height: 1.5; width: calc(-32px + 100vw); font-weight: 500; color: rgb(102, 113, 118); text-align: left !important;"></td><td style="box-sizing: inherit; margin: 0px; padding: 10px 20px; border: 0px; font-size: 14px; vertical-align: text-top; line-height: 1.5; width: calc(-32px + 100vw); font-weight: 500; color: rgb(102, 113, 118); text-align: left !important;"></td></tr><tr style="box-sizing: inherit; margin: 0px; padding: 0px; border-width: 0px 0px 1px; border-top-style: initial; border-right-style: initial; border-bottom-style: solid; border-left-style: initial; border-top-color: initial; border-right-color: initial; border-bottom-color: rgb(236, 236, 238); border-left-color: initial; border-image: initial; font-size: 14px; 
vertical-align: baseline;"><td style="box-sizing: inherit; margin: 0px; padding: 10px 20px; border-width: 0px 1px 0px 0px; border-top-style: initial; border-right-style: solid; border-bottom-style: initial; border-left-style: initial; border-top-color: initial; border-right-color: rgb(236, 236, 238); border-bottom-color: initial; border-left-color: initial; border-image: initial; font-size: 14px; vertical-align: text-top; line-height: 1.5; width: calc(-32px + 100vw); font-weight: 500; color: rgb(102, 113, 118); text-align: left !important;"></td><td style="box-sizing: inherit; margin: 0px; padding: 10px 20px; border: 0px; font-size: 14px; vertical-align: text-top; line-height: 1.5; width: calc(-32px + 100vw); font-weight: 500; color: rgb(102, 113, 118); text-align: left !important;"></td></tr></tbody></table></details>
+| 术语 | 说明                                                         |
+| ---- | ------------------------------------------------------------ |
+| nq   | 一次搜索请求中要搜索的向量数量                               |
+| topk | 搜索请求中每个向量（以 nq 为单位）的最近向量数               |
+| ef   | [HNSW 索引](https://milvus.io/docs/v2.2.x/index.md)特有的搜索参数 |
+| RT   | 从发送请求到接收响应的响应时间                               |
+| QPS  | 每秒成功处理的搜索请求数                                     |
 
 
 
@@ -76,7 +82,7 @@
 
 
 
-<details style="box-sizing: inherit; margin: 8px 0px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline; display: block; line-height: 1.4em; color: rgb(25, 25, 25); font-family: Geist, Inter, &quot;Geist Mono&quot;, SourceCodePro, &quot;serif&quot;; font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal; font-weight: 400; letter-spacing: normal; orphans: 2; text-align: start; text-indent: 0px; text-transform: none; widows: 2; word-spacing: 0px; -webkit-text-stroke-width: 0px; white-space: normal; background-color: rgb(255, 255, 255); text-decoration-thickness: initial; text-decoration-style: initial; text-decoration-color: initial;"><summary style="box-sizing: inherit; margin: 0px 0px 8px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline; cursor: pointer; color: rgb(25, 25, 25);"><b style="box-sizing: inherit; margin: 0px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline;">服务器配置（群集）</b></summary><code translate="no" style="box-sizing: inherit; margin: 0px; padding: 0px 8px; border: 0px; font-size: 14px; vertical-align: baseline; line-height: 1.4rem; font-family: SourceCodePro; background-color: rgb(208, 215, 220); border-radius: 4px; color: rgb(0, 19, 26); display: inline-block; font-weight: 600;"></code></details>
+`queryNode: {replicas: 1, resources: {limits: {cpu: "12.0", memory: 8Gi}, requests: {cpu: "12.0", memory: 8Gi}}}`
 
 
 
@@ -93,7 +99,7 @@
 
 
 
-<details style="box-sizing: inherit; margin: 8px 0px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline; display: block; line-height: 1.4em; color: rgb(25, 25, 25); font-family: Geist, Inter, &quot;Geist Mono&quot;, SourceCodePro, &quot;serif&quot;; font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal; font-weight: 400; letter-spacing: normal; orphans: 2; text-align: start; text-indent: 0px; text-transform: none; widows: 2; word-spacing: 0px; -webkit-text-stroke-width: 0px; white-space: normal; background-color: rgb(255, 255, 255); text-decoration-thickness: initial; text-decoration-style: initial; text-decoration-color: initial;"><summary style="box-sizing: inherit; margin: 0px 0px 8px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline; cursor: pointer; color: rgb(25, 25, 25);"><b style="box-sizing: inherit; margin: 0px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline;">服务器配置（单机）</b></summary><code translate="no" style="box-sizing: inherit; margin: 0px; padding: 0px 8px; border: 0px; font-size: 14px; vertical-align: baseline; line-height: 1.4rem; font-family: SourceCodePro; background-color: rgb(208, 215, 220); border-radius: 4px; color: rgb(0, 19, 26); display: inline-block; font-weight: 600;"></code></details>
+```yaml standalone: replicas: 1 resources: limits: cpu: "12.0" memory: 16Gi requests: cpu: "12.0" memory: 16Gi```
 
 
 
@@ -112,7 +118,7 @@
 
 
 
-<details style="box-sizing: inherit; margin: 8px 0px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline; display: block; line-height: 1.4em; color: rgb(25, 25, 25); font-family: Geist, Inter, &quot;Geist Mono&quot;, SourceCodePro, &quot;serif&quot;; font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal; font-weight: 400; letter-spacing: normal; orphans: 2; text-align: start; text-indent: 0px; text-transform: none; widows: 2; word-spacing: 0px; -webkit-text-stroke-width: 0px; white-space: normal; background-color: rgb(255, 255, 255); text-decoration-thickness: initial; text-decoration-style: initial; text-decoration-color: initial;"><summary style="box-sizing: inherit; margin: 0px 0px 8px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline; cursor: pointer; color: rgb(25, 25, 25);"><b style="box-sizing: inherit; margin: 0px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline;">服务器配置（群集）</b></summary><code translate="no" style="box-sizing: inherit; margin: 0px; padding: 0px 8px; border: 0px; font-size: 14px; vertical-align: baseline; line-height: 1.4rem; font-family: SourceCodePro; background-color: rgb(208, 215, 220); border-radius: 4px; color: rgb(0, 19, 26); display: inline-block; font-weight: 600;"></code></details>
+```yaml queryNode: replicas: 1 resources: limits: cpu: "8.0" /"12.0" /"16.0" /"32.0" memory: 8Gi requests: cpu: "8.0" /"12.0" /"16.0" /"32.0" memory: 8Gi```
 
 
 
@@ -135,7 +141,7 @@
 
 
 
-<details style="box-sizing: inherit; margin: 8px 0px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline; display: block; line-height: 1.4em; color: rgb(25, 25, 25); font-family: Geist, Inter, &quot;Geist Mono&quot;, SourceCodePro, &quot;serif&quot;; font-style: normal; font-variant-ligatures: normal; font-variant-caps: normal; font-weight: 400; letter-spacing: normal; orphans: 2; text-align: start; text-indent: 0px; text-transform: none; widows: 2; word-spacing: 0px; -webkit-text-stroke-width: 0px; white-space: normal; background-color: rgb(255, 255, 255); text-decoration-thickness: initial; text-decoration-style: initial; text-decoration-color: initial;"><summary style="box-sizing: inherit; margin: 0px 0px 8px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline; cursor: pointer; color: rgb(25, 25, 25);"><b style="box-sizing: inherit; margin: 0px; padding: 0px; border: 0px; font-size: 16px; vertical-align: baseline;">服务器配置（群集）</b></summary><code translate="no" style="box-sizing: inherit; margin: 0px; padding: 0px 8px; border: 0px; font-size: 14px; vertical-align: baseline; line-height: 1.4rem; font-family: SourceCodePro; background-color: rgb(208, 215, 220); border-radius: 4px; color: rgb(0, 19, 26); display: inline-block; font-weight: 600;"></code></details>
+```yaml queryNode: replicas: 1 / 2 / 4 / 8 resources: limits: cpu: "8.0" memory: 8Gi requests: cpu: "8.0" memory: 8Gi```
 
 
 
diff --git a/main.py b/main.py
index d30f423..a1a76b0 100644
--- a/main.py
+++ b/main.py
@@ -141,7 +141,7 @@ def load_files(
             batch_size=batch_size if batch_size is not None else 8,
             force_rebuild=force_rebuild,
         )
-        return {"message": "成功加载文档"}
+        return {"message": "成功加载"}
     except Exception as e:
         raise HTTPException(status_code=500, detail=str(e))
 
@@ -198,7 +198,7 @@ def load_website(
             batch_size=batch_size if batch_size is not None else 8,
             force_rebuild=force_rebuild,
         )
-        return {"message": "成功加载网址"}
+        return {"message": "成功加载"}
     except Exception as e:
         raise HTTPException(status_code=500, detail=str(e))
 
@@ -234,7 +234,7 @@ def perform_query(
         # 清空之前的消息
         message_stream = get_message_stream()
         message_stream.clear_messages()
-        result_text, _ = query(original_query, max_iter)
+        result_text, _ = query(original_query, max_iter=max_iter)
 
         return {
             "result": result_text,
@@ -297,7 +297,7 @@ async def perform_query_stream(
             def run_query():
                 try:
                     print(f"Starting query: {original_query} with max_iter: {max_iter}")
-                    result_text, retrieval_results = query(original_query, max_iter)
+                    result_text, retrieval_results = query(original_query, max_iter=max_iter)
                     print(f"Query completed with result length: {len(result_text) if result_text else 0}")
                     print(f"Retrieved {len(retrieval_results) if retrieval_results else 0} documents")
                     return result_text, None
diff --git a/test.py b/test.py
index 171e4c8..72f45d0 100644
--- a/test.py
+++ b/test.py
@@ -16,7 +16,7 @@ load_from_local_files(
     paths_or_directory="docs",
     collection_name="default",
     collection_description="a general collection for all documents",
-    force_rebuild=True, batch_size=8
+    force_rebuild=True, batch_size=16
 )
 
 
@@ -25,4 +25,4 @@ load_from_local_files(
 # load_from_website(urls=website_url)
 
 # Query
-result = query("Write a comprehensive report about Milvus.") # Your question here
+result = query("Write a comprehensive report about Milvus.", max_iter=2) # Your question here

From f063a2d72f5e36f39994eb1446e95309bd5a14d3 Mon Sep 17 00:00:00 2001
From: tanxing <eternaldwellers@gmail.com>
Date: Fri, 15 Aug 2025 10:55:45 +0800
Subject: [PATCH 3/3] =?UTF-8?q?fix:=20=E7=A7=BB=E9=99=A4=E5=A4=9A=E4=BD=99?=
 =?UTF-8?q?=E7=9A=84=E9=9D=9E=E6=B5=81=E5=BC=8F=E6=B6=88=E6=81=AF=E6=8E=A5?=
 =?UTF-8?q?=E5=8F=A3=20refactor:=20=E8=B0=83=E6=95=B4=E5=8F=82=E8=80=83?=
 =?UTF-8?q?=E6=96=87=E7=8C=AE=E7=9A=84=E7=94=9F=E6=88=90=E6=96=B9=E6=B3=95?=
 =?UTF-8?q?=20=20=20=20=20=E7=8E=B0=E5=9C=A8=E6=98=AF=E7=94=9F=E6=88=90?=
 =?UTF-8?q?=E5=9B=BA=E5=AE=9A=E7=9A=84=E5=8F=82=E8=80=83=E6=96=87=E7=8C=AE?=
 =?UTF-8?q?=E8=A1=A8=EF=BC=8C=E8=80=8C=E4=B8=8D=E6=98=AFAI=E8=87=AA?=
 =?UTF-8?q?=E5=8A=A8=E7=94=9F=E6=88=90=20chore:=20=E8=B0=83=E6=95=B4?=
 =?UTF-8?q?=E6=8F=90=E7=A4=BA=E8=AF=8D=E5=92=8CLLM=E9=85=8D=E7=BD=AE=20cho?=
 =?UTF-8?q?re:=20=E8=B0=83=E6=95=B4=E5=89=8D=E7=AB=AF=E6=A0=B7=E5=BC=8F?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 deepsearcher/agent/deep_search.py       | 72 +++++++++++--------------
 deepsearcher/config.yaml                |  2 +-
 deepsearcher/llm/openai_llm.py          |  6 +--
 deepsearcher/templates/html/index.html  | 20 +++----
 deepsearcher/templates/static/js/app.js |  2 +-
 main.py                                 | 41 --------------
 test.py                                 |  2 +-
 7 files changed, 46 insertions(+), 99 deletions(-)

diff --git a/deepsearcher/agent/deep_search.py b/deepsearcher/agent/deep_search.py
index 0e35e77..860c225 100644
--- a/deepsearcher/agent/deep_search.py
+++ b/deepsearcher/agent/deep_search.py
@@ -63,7 +63,7 @@ RERANK_PROMPT = """
 
 例如，假如给出4个chunks（实际检索到的文档片段不一定是这么多），返回4个"True"或者"False"（注意这只是一个示例，不代表实际判断）: ["True", "False", "True", "True"]
 使用的语言与问题相同
-你需要返回的是 a python list of str without any addtional content:
+你需要返回的是 a python list of str(bool) without any additional content:
 """
 
 
@@ -87,35 +87,19 @@ REFLECT_PROMPT = """
 
 
 SUMMARY_PROMPT = """
-你是一个内容分析专家，请你根据提供的问题和检索到的信息，生成详细、层次分明、尽可能长的回答。
+你是一个内容分析专家
+请你综合已经提出的问题和检索到的信息，以原问题为中心，生成详细准确、层次分明、尽可能长的回答。
 如果检索到的信息不足以回答问题，你应该使用你的知识来进行扩展补充。
-注意，不要一个子问题一个子问题的回答，而是应该仔细分析子问题之间的关系、子问题和原问题之间的关系。
-同时，你应该根据提供的信息生成文内引用和文末参考资料列表，使用markdown脚注。
-如果你自己提供的信息需要使用"your knowledge here[^0]"引用。
-注意，这里的"[^0]"的序号0是固定的，表示你的知识，文末引用使用"[^0]: AI 生成",
-来自<chunk><reference>的引用序号从[^1]开始，来源需要与前文<reference>中的"href"一致，不需要对每个<chunk>分配一个引用，而是相同<reference>的<chunk>共用一个引用
+注意，不要逐个回答问题，而是应该综合所有问题和信息，生成一个完整的回答。
+同时，你应该根据提供的信息生成文内引用"[^index]"(markdown文内引用)。
+如果你自己提供的信息需要使用"[^0]"引用，即你提供的信息使用固定index=0。
+来自<chunk><reference>的引用序号[^index]从index=1开始，来源需要与前文<reference>中的"href"一致
+不需要对每个<chunk>分配一个引用，而是相同<reference>的<chunk>共用一个引用。
 另外，如果回答的内容文内引用需要引用多个<reference>，请添加多个[^index]到句尾。
-如果多个片段是相同的来源或者一个片段可以回答多个问题，文内引用可以引用多次，但文末只引用一次来源，即文末的引用列表中不能有重复。
 
-例子:
 <EXAMPLE>
 
-文内引用示例:
-"XGBoost是非常强大的集成学习模型[^2]"
-
-
-文末引用示例:
-正确例子：
-[^0]: AI 生成
-[^1]: files/docs/machine_learning.md
-[^2]: files/docs/chap_001_003_models.md
-
-错误例子：
-[^0]: AI 生成
-[^1]: files/docs/chap_001_003_models.md
-[^2]: files/docs/machine_learning.md
-[^3]: files/docs/chap_001_003_models.md（错误，这是重复引用）
-[^5]: files/docs/machine_learning.md（错误，也这是重复引用）
+"XGBoost是非常强大的集成学习模型。[^1]但是XGBoost的缺点是计算复杂度高，需要大量的计算资源。[^0]"
 
 </EXAMPLE>
 
@@ -257,7 +241,7 @@ class DeepSearch(BaseAgent):
                 continue
 
             # Format all chunks for batch processing
-            chunks = self._format_chunks(retrieved_results)
+            chunks, _ = self._format_chunks(retrieved_results)
 
             # Batch process all chunks with a single LLM call
             content = self.llm.chat(
@@ -312,7 +296,7 @@ class DeepSearch(BaseAgent):
     def _generate_more_sub_queries(
         self, original_query: str, all_sub_queries: list[str], all_retrieved_results: list[RetrievalResult]
     ) -> list[str]:
-        chunks = self._format_chunks(all_retrieved_results)
+        chunks, _ = self._format_chunks(all_retrieved_results)
         reflect_prompt = REFLECT_PROMPT.format(
             original_query=original_query,
             all_sub_queries=all_sub_queries,
@@ -410,7 +394,7 @@ class DeepSearch(BaseAgent):
         if not all_retrieved_results or len(all_retrieved_results) == 0:
             send_info(f"'{original_query}'没能找到更多信息！")
             return "", []
-        chunks = self._format_chunks(all_retrieved_results)
+        chunks, refs = self._format_chunks(all_retrieved_results)
         send_info(f"正在总结 {len(all_retrieved_results)} 个查找到的文档片段")
         summary_prompt = SUMMARY_PROMPT.format(
             original_query=original_query,
@@ -418,29 +402,33 @@ class DeepSearch(BaseAgent):
             chunks=chunks
         )
         response = self.llm.chat([{"role": "user", "content": summary_prompt}])
-        final_answer = self.llm.remove_think(response)
-        send_answer(final_answer)
-        return self.llm.remove_think(response), all_retrieved_results
+        response = self.llm.remove_think(response) + refs
+        send_answer(response)
+        return response, all_retrieved_results
 
-    def _format_chunks(self, retrieved_results: list[RetrievalResult]):
+    def _format_chunks(self, retrieved_results: list[RetrievalResult]) -> tuple[str, str]:
         # 以referecen为key，把chunk放到字典中
-        references = defaultdict(list)
+        ref_dict = defaultdict(list)
         for result in retrieved_results:
-            references[result.reference].append(result.text)
-        chunks = []
+            ref_dict[result.reference].append(result.text)
+        formated_chunks = []
+        formated_refs = ["\n\n[^0]: AI 生成\n"]
         chunk_count = 0
-        for i, reference in enumerate(references):
-            formated = "".join(
+        for i, reference in enumerate(ref_dict):
+            formated_chunk = "".join(
                 [
                     (
                         f"<reference id='{i + 1}' href='{reference}'>" +
                         f"<chunk id='{j + 1 + chunk_count}'>\n{chunk}\n</chunk id='{j + 1 + chunk_count}'>" +
                         f"</reference id='{i + 1}'>\n"
                     )
-                        for j, chunk in enumerate(references[reference])
+                        for j, chunk in enumerate(ref_dict[reference])
                 ]
             )
-            print(formated)
-            chunks.append(formated)
-            chunk_count += len(references[reference])
-        return "".join(chunks)
+            print(formated_chunk)
+            formated_chunks.append(formated_chunk)
+            chunk_count += len(ref_dict[reference])
+            formated_refs.append(f"[^{i + 1}]: " + str(reference) + "\n")
+        formated_chunks = "".join(formated_chunks)
+        formated_refs = "".join(formated_refs)
+        return formated_chunks, formated_refs
diff --git a/deepsearcher/config.yaml b/deepsearcher/config.yaml
index e560153..5b59538 100644
--- a/deepsearcher/config.yaml
+++ b/deepsearcher/config.yaml
@@ -83,5 +83,5 @@ query_settings:
   max_iter: 3
 
 load_settings:
-  chunk_size: 4096
+  chunk_size: 2048
   chunk_overlap: 1024
diff --git a/deepsearcher/llm/openai_llm.py b/deepsearcher/llm/openai_llm.py
index e5edf6d..eacf374 100644
--- a/deepsearcher/llm/openai_llm.py
+++ b/deepsearcher/llm/openai_llm.py
@@ -48,9 +48,9 @@ class OpenAILLM(BaseLLM):
             model=self.model,
             messages=messages,
             stream=True,
-            temperature=0.7,
-            top_p=0.8,
-            presence_penalty=1.3
+            temperature=0.8,
+            top_p=0.9,
+            presence_penalty=1.4
         ) as stream:
             # stream到控制台测试
             content = ""
diff --git a/deepsearcher/templates/html/index.html b/deepsearcher/templates/html/index.html
index c716062..fa53db4 100644
--- a/deepsearcher/templates/html/index.html
+++ b/deepsearcher/templates/html/index.html
@@ -9,7 +9,7 @@
 <body>
     <div class="container">
         <header>
-            <h1>DeepSearcher 智能搜索系统</h1>
+            <h1>DeepSearcher 智能深度搜索系统</h1>
             <p class="app-description">基于大型语言模型和向量数据库的知识管理系统，支持私有数据搜索和在线内容整合，提供准确答案和综合报告。</p>
         </header>
 
@@ -21,12 +21,12 @@
                     <input type="text" id="filePaths" placeholder="例如: /path/to/file1.pdf,/path/to/file2.txt">
                 </div>
                 <div class="form-group">
-                    <label for="collectionName">集合名称（可选）</label>
-                    <input type="text" id="collectionName" placeholder="例如: my_collection">
+                    <label for="collectionName">集合名称</label>
+                    <input type="text" id="collectionName" placeholder="例如: default">
                 </div>
                 <div class="form-group">
-                    <label for="collectionDesc">集合描述（可选）</label>
-                    <textarea id="collectionDesc" rows="2" placeholder="例如: 这是一个测试集合"></textarea>
+                    <label for="collectionDesc">集合描述</label>
+                    <textarea id="collectionDesc" rows="2" placeholder="例如: This is a general collection for all queries"></textarea>
                 </div>
                 <button id="loadFilesBtn">加载文件</button>
                 <div id="loadStatus" class="status"></div>
@@ -39,12 +39,12 @@
                     <input type="text" id="websiteUrls" placeholder="例如: https://example.com/page1,https://example.com/page2">
                 </div>
                 <div class="form-group">
-                    <label for="webCollectionName">集合名称（可选）</label>
-                    <input type="text" id="webCollectionName" placeholder="例如: web_collection">
+                    <label for="webCollectionName">集合名称</label>
+                    <input type="text" id="webCollectionName" placeholder="例如: default">
                 </div>
                 <div class="form-group">
-                    <label for="webCollectionDesc">集合描述（可选）</label>
-                    <textarea id="webCollectionDesc" rows="2" placeholder="例如: 来自网站的内容"></textarea>
+                    <label for="webCollectionDesc">集合描述</label>
+                    <textarea id="webCollectionDesc" rows="2" placeholder="例如: This is a general collection for all queries"></textarea>
                 </div>
                 <button id="loadWebsiteBtn">加载网站</button>
                 <div id="webLoadStatus" class="status"></div>
@@ -79,7 +79,7 @@
         </main>
 
         <footer>
-            <p>DeepSearcher © 2025 | 企业知识管理与智能问答系统</p>
+            <p>DeepSearcher © 2025 | 智能深度搜索系统</p>
         </footer>
     </div>
 
diff --git a/deepsearcher/templates/static/js/app.js b/deepsearcher/templates/static/js/app.js
index 8a750cb..2feb279 100644
--- a/deepsearcher/templates/static/js/app.js
+++ b/deepsearcher/templates/static/js/app.js
@@ -199,7 +199,7 @@ function handleStreamMessage(data) {
                 // 处理answer类型，显示查询结果
                 console.log('Processing answer message:', message.content.substring(0, 100) + '...');
                 // 将结果内容显示在结果区域
-                if (message.content && message.content !== "==== FINAL ANSWER====") {
+                if (message.content) {
                     document.getElementById('resultText').textContent = message.content;
                     showResult();
                 }
diff --git a/main.py b/main.py
index a1a76b0..4b34478 100644
--- a/main.py
+++ b/main.py
@@ -203,47 +203,6 @@ def load_website(
         raise HTTPException(status_code=500, detail=str(e))
 
 
-@app.get("/query/")
-def perform_query(
-    original_query: str = Query(
-        ...,
-        description="Your question here.",
-        examples=["Write a report about Milvus."],
-    ),
-    max_iter: int = Query(
-        3,
-        description="The maximum number of iterations for reflection.",
-        ge=1,
-        examples=[3],
-    ),
-):
-    """
-    Perform a query against the loaded data.
-
-    Args:
-        original_query (str): The user's question or query.
-        max_iter (int, optional): Maximum number of iterations for reflection. Defaults to 3.
-
-    Returns:
-        dict: A dictionary containing the query result and token consumption.
-
-    Raises:
-        HTTPException: If the query fails.
-    """
-    try:
-        # 清空之前的消息
-        message_stream = get_message_stream()
-        message_stream.clear_messages()
-        result_text, _ = query(original_query, max_iter=max_iter)
-
-        return {
-            "result": result_text,
-            "messages": message_stream.get_messages_as_dicts()
-        }
-    except Exception as e:
-        raise HTTPException(status_code=500, detail=str(e))
-
-
 @app.get("/query-stream/")
 async def perform_query_stream(
     original_query: str = Query(
diff --git a/test.py b/test.py
index 72f45d0..29cff4e 100644
--- a/test.py
+++ b/test.py
@@ -25,4 +25,4 @@ load_from_local_files(
 # load_from_website(urls=website_url)
 
 # Query
-result = query("Write a comprehensive report about Milvus.", max_iter=2) # Your question here
+result = query("Write a comprehensive report about Milvus.", max_iter=1) # Your question here