From e1850d5c4eec37c44b016eebe095922657d0448e Mon Sep 17 00:00:00 2001 From: Jiang <33757498+hijzy@users.noreply.github.com> Date: Fri, 13 Feb 2026 15:43:23 +0800 Subject: [PATCH 1/2] fix: add full text search for neo4j db (#1095) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * feat: add full_text_search for neo4j * test: 改回去 --------- Co-authored-by: CaralHsi --- src/memos/graph_dbs/neo4j.py | 20 ++++++++++++++ src/memos/graph_dbs/neo4j_community.py | 20 ++++++++++++++ .../tree_text_memory/retrieve/searcher.py | 26 ++++++++++++------- 3 files changed, 56 insertions(+), 10 deletions(-) diff --git a/src/memos/graph_dbs/neo4j.py b/src/memos/graph_dbs/neo4j.py index 23ce2408b..746051187 100644 --- a/src/memos/graph_dbs/neo4j.py +++ b/src/memos/graph_dbs/neo4j.py @@ -928,6 +928,26 @@ def search_by_embedding( return records + def search_by_fulltext( + self, + query_words: list[str], + top_k: int = 10, + scope: str | None = None, + status: str | None = None, + threshold: float | None = None, + search_filter: dict | None = None, + user_name: str | None = None, + filter: dict | None = None, + knowledgebase_ids: list[str] | None = None, + tsquery_config: str | None = None, + **kwargs, + ) -> list[dict]: + """ + TODO: implement keyword search for Neo4j, to stay compatible with TreeTextMemory's keyword/fulltext recall path. + For now this returns an empty list, so switching to Neo4j does not fail at runtime because the method is missing. 
+ """ + return [] + def get_by_metadata( self, filters: list[dict[str, Any]], diff --git a/src/memos/graph_dbs/neo4j_community.py b/src/memos/graph_dbs/neo4j_community.py index e34313fa2..cae7d6ca5 100644 --- a/src/memos/graph_dbs/neo4j_community.py +++ b/src/memos/graph_dbs/neo4j_community.py @@ -382,6 +382,26 @@ def search_by_embedding( return filtered_results + def search_by_fulltext( + self, + query_words: list[str], + top_k: int = 10, + scope: str | None = None, + status: str | None = None, + threshold: float | None = None, + search_filter: dict | None = None, + user_name: str | None = None, + filter: dict | None = None, + knowledgebase_ids: list[str] | None = None, + tsquery_config: str | None = None, + **kwargs, + ) -> list[dict]: + """ + TODO: implement keyword search for Neo4j Community, to stay compatible with TreeTextMemory's keyword/fulltext recall path. + For now this returns an empty list, so switching to Neo4j does not fail at runtime because the method is missing. + """ + return [] + def _normalize_date_string(self, date_str: str) -> str: """ Normalize date string to ISO 8601 format for Neo4j datetime() function. 
diff --git a/src/memos/memories/textual/tree_text_memory/retrieve/searcher.py b/src/memos/memories/textual/tree_text_memory/retrieve/searcher.py index f00efccb6..c8e7acc25 100644 --- a/src/memos/memories/textual/tree_text_memory/retrieve/searcher.py +++ b/src/memos/memories/textual/tree_text_memory/retrieve/searcher.py @@ -511,16 +511,22 @@ def _retrieve_from_keyword( id_to_score: dict[str, float] = {} for scope in scopes: - hits = self.graph_store.search_by_fulltext( - query_words=tsquery_terms, - top_k=top_k * 2, - status="activated", - scope=scope, - search_filter=None, - filter=search_filter, - user_name=user_name, - tsquery_config="jiebaqry", - ) + try: + hits = self.graph_store.search_by_fulltext( + query_words=tsquery_terms, + top_k=top_k * 2, + status="activated", + scope=scope, + search_filter=None, + filter=search_filter, + user_name=user_name, + tsquery_config="jiebaqry", + ) + except Exception as e:  # best-effort: a failed scope contributes no hits + logger.warning( + f"[PATH-KEYWORD] search_by_fulltext failed, scope={scope}, user_name={user_name}, error={e!r}" + ) + hits = [] for h in hits or []: hid = str(h.get("id") or "").strip().strip("'\"") if not hid: From 5b937614882b3e0f4ee6724738353496cc59a9f1 Mon Sep 17 00:00:00 2001 From: Jiang <33757498+hijzy@users.noreply.github.com> Date: Sat, 14 Feb 2026 10:16:57 +0800 Subject: [PATCH 2/2] fix: Add toggle for fulltext retrieval path (#1096) feat: Add toggle for fulltext retrieval path (FULLTEXT_CALL), default off --- src/memos/api/config.py | 2 ++ .../tree_text_memory/retrieve/searcher.py | 28 ++++++++++--------- 2 files changed, 17 insertions(+), 13 deletions(-) diff --git a/src/memos/api/config.py b/src/memos/api/config.py index d2dd19266..65049b0c2 100644 --- a/src/memos/api/config.py +++ b/src/memos/api/config.py @@ -1014,6 +1014,7 @@ def create_user_config(user_name: str, user_id: str) -> tuple["MOSConfig", "Gene "fast_graph": bool(os.getenv("FAST_GRAPH", "false") == "true"), "bm25": bool(os.getenv("BM25_CALL", "false") == "true"), "cot": 
bool(os.getenv("VEC_COT_CALL", "false") == "true"), + "fulltext": bool(os.getenv("FULLTEXT_CALL", "false") == "true"), }, "include_embedding": bool( os.getenv("INCLUDE_EMBEDDING", "false") == "true" @@ -1096,6 +1097,7 @@ def get_default_cube_config() -> "GeneralMemCubeConfig | None": "fast_graph": bool(os.getenv("FAST_GRAPH", "false") == "true"), "bm25": bool(os.getenv("BM25_CALL", "false") == "true"), "cot": bool(os.getenv("VEC_COT_CALL", "false") == "true"), + "fulltext": bool(os.getenv("FULLTEXT_CALL", "false") == "true"), }, "mode": os.getenv("ASYNC_MODE", "sync"), "include_embedding": bool( diff --git a/src/memos/memories/textual/tree_text_memory/retrieve/searcher.py b/src/memos/memories/textual/tree_text_memory/retrieve/searcher.py index f00efccb6..da6b1e32a 100644 --- a/src/memos/memories/textual/tree_text_memory/retrieve/searcher.py +++ b/src/memos/memories/textual/tree_text_memory/retrieve/searcher.py @@ -67,6 +67,7 @@ def __init__( self.internet_retriever = internet_retriever self.vec_cot = search_strategy.get("cot", False) if search_strategy else False self.use_fast_graph = search_strategy.get("fast_graph", False) if search_strategy else False + self.use_fulltext = search_strategy.get("fulltext", False) if search_strategy else False self.manual_close_internet = manual_close_internet self.tokenizer = tokenizer self._usage_executor = ContextThreadPoolExecutor(max_workers=4, thread_name_prefix="usage") @@ -380,20 +381,21 @@ def _retrieve_paths( user_name, ) ) - tasks.append( - executor.submit( - self._retrieve_from_keyword, - query, - parsed_goal, - query_embedding, - top_k, - memory_type, - search_filter, - search_priority, - user_name, - id_filter, + if self.use_fulltext: + tasks.append( + executor.submit( + self._retrieve_from_keyword, + query, + parsed_goal, + query_embedding, + top_k, + memory_type, + search_filter, + search_priority, + user_name, + id_filter, + ) ) - ) if search_tool_memory: tasks.append( executor.submit(