浏览代码

fix: improve document filtering in full text search(elasticsearch) (#22683)

tags/1.7.0
uply23333 3 个月前
父节点
当前提交
ab012fe1a2
没有帐户链接到提交者的电子邮件
共有 1 个文件被更改,包括 9 次插入2 次删除
  1. 9
    2
      api/core/rag/datasource/vdb/elasticsearch/elasticsearch_vector.py

+ 9
- 2
api/core/rag/datasource/vdb/elasticsearch/elasticsearch_vector.py 查看文件

@@ -147,10 +147,17 @@ class ElasticSearchVector(BaseVector):
return docs

def search_by_full_text(self, query: str, **kwargs: Any) -> list[Document]:
query_str = {"match": {Field.CONTENT_KEY.value: query}}
query_str: dict[str, Any] = {"match": {Field.CONTENT_KEY.value: query}}
document_ids_filter = kwargs.get("document_ids_filter")

if document_ids_filter:
query_str["filter"] = {"terms": {"metadata.document_id": document_ids_filter}} # type: ignore
query_str = {
"bool": {
"must": {"match": {Field.CONTENT_KEY.value: query}},
"filter": {"terms": {"metadata.document_id": document_ids_filter}},
}
}

results = self._client.search(index=self._collection_name, query=query_str, size=kwargs.get("top_k", 4))
docs = []
for hit in results["hits"]["hits"]:

正在加载...
取消
保存