浏览代码

Update comments (#4569)

### What problem does this PR solve?

Add license statement.

### Type of change

- [x] Refactoring

Signed-off-by: Jin Hai <haijin.chn@gmail.com>
tags/v0.16.0
Jin Hai 9 个月前
父节点
当前提交
3894de895b
没有帐户链接到提交者的电子邮件
共有 86 个文件被更改,包括 1034 次插入145 次删除
  1. 16
    0
      agent/__init__.py
  2. 16
    0
      agent/component/__init__.py
  3. 1
    1
      agent/settings.py
  4. 16
    0
      api/__init__.py
  5. 16
    0
      api/utils/t_crypt.py
  6. 16
    0
      api/utils/web_utils.py
  7. 16
    0
      deepdoc/__init__.py
  8. 3
    0
      deepdoc/parser/__init__.py
  9. 3
    0
      deepdoc/parser/docx_parser.py
  10. 3
    0
      deepdoc/parser/excel_parser.py
  11. 4
    0
      deepdoc/parser/html_parser.py
  12. 16
    0
      deepdoc/parser/json_parser.py
  13. 4
    0
      deepdoc/parser/markdown_parser.py
  14. 3
    0
      deepdoc/parser/pdf_parser.py
  15. 4
    0
      deepdoc/parser/ppt_parser.py
  16. 3
    0
      deepdoc/parser/resume/__init__.py
  17. 15
    0
      deepdoc/parser/resume/entities/__init__.py
  18. 3
    0
      deepdoc/parser/resume/entities/corporations.py
  19. 3
    0
      deepdoc/parser/resume/entities/degrees.py
  20. 3
    0
      deepdoc/parser/resume/entities/industries.py
  21. 4
    0
      deepdoc/parser/resume/entities/regions.py
  22. 3
    0
      deepdoc/parser/resume/entities/schools.py
  23. 3
    0
      deepdoc/parser/resume/step_one.py
  24. 4
    0
      deepdoc/parser/resume/step_two.py
  25. 4
    0
      deepdoc/parser/txt_parser.py
  26. 3
    0
      deepdoc/parser/utils.py
  27. 3
    0
      deepdoc/vision/__init__.py
  28. 4
    0
      deepdoc/vision/layout_recognizer.py
  29. 3
    0
      deepdoc/vision/ocr.py
  30. 3
    0
      deepdoc/vision/postprocess.py
  31. 3
    0
      deepdoc/vision/recognizer.py
  32. 3
    0
      deepdoc/vision/seeit.py
  33. 3
    0
      deepdoc/vision/t_ocr.py
  34. 4
    0
      deepdoc/vision/t_recognizer.py
  35. 3
    0
      deepdoc/vision/table_structure_recognizer.py
  36. 16
    0
      intergrations/chatgpt-on-wechat/plugins/__init__.py
  37. 16
    0
      intergrations/chatgpt-on-wechat/plugins/ragflow_chat.py
  38. 16
    0
      rag/__init__.py
  39. 15
    0
      rag/app/__init__.py
  40. 4
    0
      rag/app/audio.py
  41. 4
    0
      rag/app/book.py
  42. 3
    0
      rag/app/email.py
  43. 16
    0
      rag/app/knowledge_graph.py
  44. 4
    0
      rag/app/laws.py
  45. 1
    1
      rag/app/manual.py
  46. 4
    0
      rag/app/naive.py
  47. 4
    0
      rag/app/one.py
  48. 4
    0
      rag/app/paper.py
  49. 4
    0
      rag/app/picture.py
  50. 4
    0
      rag/app/presentation.py
  51. 4
    0
      rag/app/qa.py
  52. 4
    0
      rag/app/resume.py
  53. 4
    0
      rag/app/table.py
  54. 4
    0
      rag/app/tag.py
  55. 16
    0
      rag/svr/jina_server.py
  56. 16
    0
      rag/utils/azure_sas_conn.py
  57. 16
    0
      rag/utils/azure_spn_conn.py
  58. 16
    0
      rag/utils/doc_store_conn.py
  59. 16
    0
      rag/utils/es_conn.py
  60. 16
    0
      rag/utils/infinity_conn.py
  61. 16
    0
      rag/utils/minio_conn.py
  62. 16
    0
      rag/utils/redis_conn.py
  63. 16
    0
      rag/utils/s3_conn.py
  64. 16
    0
      rag/utils/storage_factory.py
  65. 17
    1
      sdk/python/hello_ragflow.py
  66. 16
    0
      sdk/python/ragflow_sdk/__init__.py
  67. 15
    0
      sdk/python/ragflow_sdk/modules/__init__.py
  68. 16
    0
      sdk/python/ragflow_sdk/modules/agent.py
  69. 16
    0
      sdk/python/ragflow_sdk/modules/base.py
  70. 21
    5
      sdk/python/ragflow_sdk/modules/chat.py
  71. 19
    6
      sdk/python/ragflow_sdk/modules/chunk.py
  72. 34
    15
      sdk/python/ragflow_sdk/modules/dataset.py
  73. 26
    12
      sdk/python/ragflow_sdk/modules/document.py
  74. 28
    11
      sdk/python/ragflow_sdk/modules/session.py
  75. 30
    8
      sdk/python/test/conftest.py
  76. 16
    0
      sdk/python/test/test_frontend_api/common.py
  77. 16
    0
      sdk/python/test/test_frontend_api/get_email.py
  78. 18
    2
      sdk/python/test/test_frontend_api/test_dataset.py
  79. 18
    1
      sdk/python/test/test_sdk_api/common.py
  80. 18
    2
      sdk/python/test/test_sdk_api/get_email.py
  81. 22
    5
      sdk/python/test/test_sdk_api/t_agent.py
  82. 20
    4
      sdk/python/test/test_sdk_api/t_chat.py
  83. 32
    12
      sdk/python/test/test_sdk_api/t_chunk.py
  84. 24
    3
      sdk/python/test/test_sdk_api/t_dataset.py
  85. 73
    41
      sdk/python/test/test_sdk_api/t_document.py
  86. 34
    15
      sdk/python/test/test_sdk_api/t_session.py

+ 16
- 0
agent/__init__.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from beartype.claw import beartype_this_package from beartype.claw import beartype_this_package
beartype_this_package() beartype_this_package()

+ 16
- 0
agent/component/__init__.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import importlib import importlib
from .begin import Begin, BeginParam from .begin import Begin, BeginParam
from .generate import Generate, GenerateParam from .generate import Generate, GenerateParam

+ 1
- 1
agent/settings.py 查看文件

# #
# Copyright 2019 The FATE Authors. All Rights Reserved.
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
# #
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.

+ 16
- 0
api/__init__.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from beartype.claw import beartype_this_package from beartype.claw import beartype_this_package
beartype_this_package() beartype_this_package()

+ 16
- 0
api/utils/t_crypt.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import base64 import base64
import os import os
import sys import sys

+ 16
- 0
api/utils/web_utils.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import re import re
import socket import socket
from urllib.parse import urlparse from urllib.parse import urlparse

+ 16
- 0
deepdoc/__init__.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from beartype.claw import beartype_this_package from beartype.claw import beartype_this_package
beartype_this_package() beartype_this_package()

+ 3
- 0
deepdoc/parser/__init__.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 3
- 0
deepdoc/parser/docx_parser.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 3
- 0
deepdoc/parser/excel_parser.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 4
- 0
deepdoc/parser/html_parser.py 查看文件

# -*- coding: utf-8 -*- # -*- coding: utf-8 -*-
#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

from rag.nlp import find_codec from rag.nlp import find_codec
import readability import readability
import html_text import html_text

+ 16
- 0
deepdoc/parser/json_parser.py 查看文件

# -*- coding: utf-8 -*- # -*- coding: utf-8 -*-
#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

# The following documents are mainly referenced, and only adaptation modifications have been made # The following documents are mainly referenced, and only adaptation modifications have been made
# from https://github.com/langchain-ai/langchain/blob/master/libs/text-splitters/langchain_text_splitters/json.py # from https://github.com/langchain-ai/langchain/blob/master/libs/text-splitters/langchain_text_splitters/json.py



+ 4
- 0
deepdoc/parser/markdown_parser.py 查看文件

# -*- coding: utf-8 -*- # -*- coding: utf-8 -*-
#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import re import re


class RAGFlowMarkdownParser: class RAGFlowMarkdownParser:

+ 3
- 0
deepdoc/parser/pdf_parser.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 4
- 0
deepdoc/parser/ppt_parser.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import logging import logging
from io import BytesIO from io import BytesIO
from pptx import Presentation from pptx import Presentation

+ 3
- 0
deepdoc/parser/resume/__init__.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 15
- 0
deepdoc/parser/resume/entities/__init__.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

+ 3
- 0
deepdoc/parser/resume/entities/corporations.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 3
- 0
deepdoc/parser/resume/entities/degrees.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 3
- 0
deepdoc/parser/resume/entities/industries.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 4
- 0
deepdoc/parser/resume/entities/regions.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import re import re


TBL = { TBL = {

+ 3
- 0
deepdoc/parser/resume/entities/schools.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 3
- 0
deepdoc/parser/resume/step_one.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 4
- 0
deepdoc/parser/resume/step_two.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import logging import logging
import re import re
import copy import copy

+ 4
- 0
deepdoc/parser/txt_parser.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import re import re


from deepdoc.parser.utils import get_text from deepdoc.parser.utils import get_text

+ 3
- 0
deepdoc/parser/utils.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 3
- 0
deepdoc/vision/__init__.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 4
- 0
deepdoc/vision/layout_recognizer.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import os import os
import re import re
from collections import Counter from collections import Counter

+ 3
- 0
deepdoc/vision/ocr.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 3
- 0
deepdoc/vision/postprocess.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 3
- 0
deepdoc/vision/recognizer.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 3
- 0
deepdoc/vision/seeit.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 3
- 0
deepdoc/vision/t_ocr.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 4
- 0
deepdoc/vision/t_recognizer.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import logging import logging
import os import os
import sys import sys

+ 3
- 0
deepdoc/vision/table_structure_recognizer.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 16
- 0
intergrations/chatgpt-on-wechat/plugins/__init__.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from beartype.claw import beartype_this_package from beartype.claw import beartype_this_package
beartype_this_package() beartype_this_package()



+ 16
- 0
intergrations/chatgpt-on-wechat/plugins/ragflow_chat.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import logging import logging
import requests import requests
from bridge.context import ContextType # Import Context, ContextType from bridge.context import ContextType # Import Context, ContextType

+ 16
- 0
rag/__init__.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from beartype.claw import beartype_this_package from beartype.claw import beartype_this_package
beartype_this_package() beartype_this_package()

+ 15
- 0
rag/app/__init__.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

+ 4
- 0
rag/app/audio.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import re import re


from api.db import LLMType from api.db import LLMType

+ 4
- 0
rag/app/book.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import logging import logging
from tika import parser from tika import parser
import re import re

+ 3
- 0
rag/app/email.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at

+ 16
- 0
rag/app/knowledge_graph.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import re import re


from graphrag.index import build_knowledge_graph_chunks from graphrag.index import build_knowledge_graph_chunks

+ 4
- 0
rag/app/laws.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import logging import logging
from tika import parser from tika import parser
import re import re

+ 1
- 1
rag/app/manual.py 查看文件

# #
# Copyright 2024 The InfiniFlow Authors. All Rights Reserved.
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
# #
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.

+ 4
- 0
rag/app/naive.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import logging import logging
from tika import parser from tika import parser
from io import BytesIO from io import BytesIO

+ 4
- 0
rag/app/one.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import logging import logging
from tika import parser from tika import parser
from io import BytesIO from io import BytesIO

+ 4
- 0
rag/app/paper.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import logging import logging
import copy import copy
import re import re

+ 4
- 0
rag/app/picture.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import io import io


import numpy as np import numpy as np

+ 4
- 0
rag/app/presentation.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import copy import copy
import re import re
from io import BytesIO from io import BytesIO

+ 4
- 0
rag/app/qa.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import logging import logging
import re import re
import csv import csv

+ 4
- 0
rag/app/resume.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import logging import logging
import base64 import base64
import datetime import datetime

+ 4
- 0
rag/app/table.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import copy import copy
import re import re
from io import BytesIO from io import BytesIO

+ 4
- 0
rag/app/tag.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License"); # Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License. # you may not use this file except in compliance with the License.
# You may obtain a copy of the License at # You may obtain a copy of the License at
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
# #

import re import re
import csv import csv
from copy import deepcopy from copy import deepcopy

+ 16
- 0
rag/svr/jina_server.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from jina import Deployment from jina import Deployment
from docarray import BaseDoc from docarray import BaseDoc
from jina import Executor, requests from jina import Executor, requests

+ 16
- 0
rag/utils/azure_sas_conn.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import logging import logging
import os import os
import time import time

+ 16
- 0
rag/utils/azure_spn_conn.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import logging import logging
import os import os
import time import time

+ 16
- 0
rag/utils/doc_store_conn.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from abc import ABC, abstractmethod from abc import ABC, abstractmethod
from dataclasses import dataclass from dataclasses import dataclass
import numpy as np import numpy as np

+ 16
- 0
rag/utils/es_conn.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import logging import logging
import re import re
import json import json

+ 16
- 0
rag/utils/infinity_conn.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import logging import logging
import os import os
import re import re

+ 16
- 0
rag/utils/minio_conn.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import logging import logging
import time import time
from minio import Minio from minio import Minio

+ 16
- 0
rag/utils/redis_conn.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import logging import logging
import json import json



+ 16
- 0
rag/utils/s3_conn.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import logging import logging
import boto3 import boto3
from botocore.exceptions import ClientError from botocore.exceptions import ClientError

+ 16
- 0
rag/utils/storage_factory.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import os import os
from enum import Enum from enum import Enum



+ 17
- 1
sdk/python/hello_ragflow.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import ragflow_sdk import ragflow_sdk


print(ragflow_sdk.__version__)
print(ragflow_sdk.__version__)

+ 16
- 0
sdk/python/ragflow_sdk/__init__.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from beartype.claw import beartype_this_package from beartype.claw import beartype_this_package
beartype_this_package() beartype_this_package()



+ 15
- 0
sdk/python/ragflow_sdk/modules/__init__.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

+ 16
- 0
sdk/python/ragflow_sdk/modules/agent.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from .base import Base from .base import Base
from .session import Session from .session import Session
import requests import requests

+ 16
- 0
sdk/python/ragflow_sdk/modules/base.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

class Base(object): class Base(object):
def __init__(self, rag, res_dict): def __init__(self, rag, res_dict):
self.rag = rag self.rag = rag

+ 21
- 5
sdk/python/ragflow_sdk/modules/chat.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#



from .base import Base from .base import Base
from .session import Session from .session import Session


def update(self, update_message: dict): def update(self, update_message: dict):
res = self.put(f'/chats/{self.id}', res = self.put(f'/chats/{self.id}',
update_message)
update_message)
res = res.json() res = res.json()
if res.get("code") != 0: if res.get("code") != 0:
raise Exception(res["message"]) raise Exception(res["message"])



def create_session(self, name: str = "New session") -> Session: def create_session(self, name: str = "New session") -> Session:
res = self.post(f"/chats/{self.id}/sessions", {"name": name}) res = self.post(f"/chats/{self.id}/sessions", {"name": name})
res = res.json() res = res.json()
return Session(self.rag, res['data']) return Session(self.rag, res['data'])
raise Exception(res["message"]) raise Exception(res["message"])


def list_sessions(self,page: int = 1, page_size: int = 30, orderby: str = "create_time", desc: bool = True,
def list_sessions(self, page: int = 1, page_size: int = 30, orderby: str = "create_time", desc: bool = True,
id: str = None, name: str = None) -> list[Session]: id: str = None, name: str = None) -> list[Session]:
res = self.get(f'/chats/{self.id}/sessions',{"page": page, "page_size": page_size, "orderby": orderby, "desc": desc, "id": id, "name": name} )
res = self.get(f'/chats/{self.id}/sessions',
{"page": page, "page_size": page_size, "orderby": orderby, "desc": desc, "id": id, "name": name})
res = res.json() res = res.json()
if res.get("code") == 0: if res.get("code") == 0:
result_list = [] result_list = []
return result_list return result_list
raise Exception(res["message"]) raise Exception(res["message"])


def delete_sessions(self,ids: list[str] | None = None):
def delete_sessions(self, ids: list[str] | None = None):
res = self.rm(f"/chats/{self.id}/sessions", {"ids": ids}) res = self.rm(f"/chats/{self.id}/sessions", {"ids": ids})
res = res.json() res = res.json()
if res.get("code") != 0: if res.get("code") != 0:

+ 19
- 6
sdk/python/ragflow_sdk/modules/chunk.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from .base import Base from .base import Base




res_dict.pop(k) res_dict.pop(k)
super().__init__(rag, res_dict) super().__init__(rag, res_dict)



def update(self,update_message:dict):
res = self.put(f"/datasets/{self.dataset_id}/documents/{self.document_id}/chunks/{self.id}",update_message)
def update(self, update_message: dict):
res = self.put(f"/datasets/{self.dataset_id}/documents/{self.document_id}/chunks/{self.id}", update_message)
res = res.json() res = res.json()
if res.get("code") != 0 :
if res.get("code") != 0:
raise Exception(res["message"]) raise Exception(res["message"])



+ 34
- 15
sdk/python/ragflow_sdk/modules/dataset.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from .document import Document from .document import Document


from .base import Base from .base import Base


def update(self, update_message: dict): def update(self, update_message: dict):
res = self.put(f'/datasets/{self.id}', res = self.put(f'/datasets/{self.id}',
update_message)
update_message)
res = res.json() res = res.json()
if res.get("code") != 0: if res.get("code") != 0:
raise Exception(res["message"]) raise Exception(res["message"])


def upload_documents(self,document_list: list[dict]):
def upload_documents(self, document_list: list[dict]):
url = f"/datasets/{self.id}/documents" url = f"/datasets/{self.id}/documents"
files = [("file",(ele["display_name"],ele["blob"])) for ele in document_list]
res = self.post(path=url,json=None,files=files)
files = [("file", (ele["display_name"], ele["blob"])) for ele in document_list]
res = self.post(path=url, json=None, files=files)
res = res.json() res = res.json()
if res.get("code") == 0: if res.get("code") == 0:
doc_list=[]
doc_list = []
for doc in res["data"]: for doc in res["data"]:
document = Document(self.rag,doc)
document = Document(self.rag, doc)
doc_list.append(document) doc_list.append(document)
return doc_list return doc_list
raise Exception(res.get("message")) raise Exception(res.get("message"))


def list_documents(self, id: str | None = None, keywords: str | None = None, page: int = 1, page_size: int = 30, orderby: str = "create_time", desc: bool = True):
res = self.get(f"/datasets/{self.id}/documents",params={"id": id,"keywords": keywords,"page": page,"page_size": page_size,"orderby": orderby,"desc": desc})
def list_documents(self, id: str | None = None, keywords: str | None = None, page: int = 1, page_size: int = 30,
orderby: str = "create_time", desc: bool = True):
res = self.get(f"/datasets/{self.id}/documents",
params={"id": id, "keywords": keywords, "page": page, "page_size": page_size, "orderby": orderby,
"desc": desc})
res = res.json() res = res.json()
documents = [] documents = []
if res.get("code") == 0: if res.get("code") == 0:
for document in res["data"].get("docs"): for document in res["data"].get("docs"):
documents.append(Document(self.rag,document))
documents.append(Document(self.rag, document))
return documents return documents
raise Exception(res["message"]) raise Exception(res["message"])


def delete_documents(self,ids: list[str] | None = None):
res = self.rm(f"/datasets/{self.id}/documents",{"ids":ids})
def delete_documents(self, ids: list[str] | None = None):
res = self.rm(f"/datasets/{self.id}/documents", {"ids": ids})
res = res.json() res = res.json()
if res.get("code") != 0: if res.get("code") != 0:
raise Exception(res["message"]) raise Exception(res["message"])


def async_parse_documents(self,document_ids):
res = self.post(f"/datasets/{self.id}/chunks",{"document_ids":document_ids})
def async_parse_documents(self, document_ids):
res = self.post(f"/datasets/{self.id}/chunks", {"document_ids": document_ids})
res = res.json() res = res.json()
if res.get("code") != 0: if res.get("code") != 0:
raise Exception(res.get("message")) raise Exception(res.get("message"))


def async_cancel_parse_documents(self,document_ids):
res = self.rm(f"/datasets/{self.id}/chunks",{"document_ids":document_ids})
def async_cancel_parse_documents(self, document_ids):
res = self.rm(f"/datasets/{self.id}/chunks", {"document_ids": document_ids})
res = res.json() res = res.json()
if res.get("code") != 0: if res.get("code") != 0:
raise Exception(res.get("message")) raise Exception(res.get("message"))

+ 26
- 12
sdk/python/ragflow_sdk/modules/document.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import json import json
from .base import Base from .base import Base
from .chunk import Chunk from .chunk import Chunk
res_dict.pop(k) res_dict.pop(k)
super().__init__(rag, res_dict) super().__init__(rag, res_dict)



def update(self, update_message: dict): def update(self, update_message: dict):
res = self.put(f'/datasets/{self.dataset_id}/documents/{self.id}', res = self.put(f'/datasets/{self.dataset_id}/documents/{self.id}',
update_message) update_message)
except json.JSONDecodeError: except json.JSONDecodeError:
return res.content return res.content



def list_chunks(self,page=1, page_size=30, keywords=""):
data={"keywords": keywords,"page":page,"page_size":page_size}
def list_chunks(self, page=1, page_size=30, keywords=""):
data = {"keywords": keywords, "page": page, "page_size": page_size}
res = self.get(f'/datasets/{self.dataset_id}/documents/{self.id}/chunks', data) res = self.get(f'/datasets/{self.dataset_id}/documents/{self.id}/chunks', data)
res = res.json() res = res.json()
if res.get("code") == 0: if res.get("code") == 0:
chunks=[]
chunks = []
for data in res["data"].get("chunks"): for data in res["data"].get("chunks"):
chunk = Chunk(self.rag,data)
chunk = Chunk(self.rag, data)
chunks.append(chunk) chunks.append(chunk)
return chunks return chunks
raise Exception(res.get("message")) raise Exception(res.get("message"))


def add_chunk(self, content: str, important_keywords: list[str] = [], questions: list[str] = []): def add_chunk(self, content: str, important_keywords: list[str] = [], questions: list[str] = []):
res = self.post(f'/datasets/{self.dataset_id}/documents/{self.id}/chunks', res = self.post(f'/datasets/{self.dataset_id}/documents/{self.id}/chunks',
{"content":content,"important_keywords":important_keywords, "questions": questions})
{"content": content, "important_keywords": important_keywords, "questions": questions})
res = res.json() res = res.json()
if res.get("code") == 0: if res.get("code") == 0:
return Chunk(self.rag,res["data"].get("chunk"))
return Chunk(self.rag, res["data"].get("chunk"))
raise Exception(res.get("message")) raise Exception(res.get("message"))


def delete_chunks(self,ids:list[str] | None = None):
res = self.rm(f"/datasets/{self.dataset_id}/documents/{self.id}/chunks",{"chunk_ids":ids})
def delete_chunks(self, ids: list[str] | None = None):
res = self.rm(f"/datasets/{self.dataset_id}/documents/{self.id}/chunks", {"chunk_ids": ids})
res = res.json() res = res.json()
if res.get("code")!=0:
raise Exception(res.get("message"))
if res.get("code") != 0:
raise Exception(res.get("message"))

+ 28
- 11
sdk/python/ragflow_sdk/modules/session.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import json import json


from .base import Base from .base import Base
self.id = None self.id = None
self.name = "New session" self.name = "New session"
self.messages = [{"role": "assistant", "content": "Hi! I am your assistant,can I help you?"}] self.messages = [{"role": "assistant", "content": "Hi! I am your assistant,can I help you?"}]
for key,value in res_dict.items():
if key =="chat_id" and value is not None:
for key, value in res_dict.items():
if key == "chat_id" and value is not None:
self.chat_id = None self.chat_id = None
self.__session_type = "chat" self.__session_type = "chat"
if key == "agent_id" and value is not None: if key == "agent_id" and value is not None:
self.__session_type = "agent" self.__session_type = "agent"
super().__init__(rag, res_dict) super().__init__(rag, res_dict)


def ask(self, question="",stream=True,**kwargs):
def ask(self, question="", stream=True, **kwargs):
if self.__session_type == "agent": if self.__session_type == "agent":
res=self._ask_agent(question,stream)
res = self._ask_agent(question, stream)
elif self.__session_type == "chat": elif self.__session_type == "chat":
res=self._ask_chat(question,stream,**kwargs)
res = self._ask_chat(question, stream, **kwargs)
for line in res.iter_lines(): for line in res.iter_lines():
line = line.decode("utf-8") line = line.decode("utf-8")
if line.startswith("{"): if line.startswith("{"):
message = Message(self.rag, temp_dict) message = Message(self.rag, temp_dict)
yield message yield message


def _ask_chat(self, question: str, stream: bool,**kwargs):
json_data={"question": question, "stream": True,"session_id":self.id}
def _ask_chat(self, question: str, stream: bool, **kwargs):
json_data = {"question": question, "stream": True, "session_id": self.id}
json_data.update(kwargs) json_data.update(kwargs)
res = self.post(f"/chats/{self.chat_id}/completions", res = self.post(f"/chats/{self.chat_id}/completions",
json_data, stream=stream) json_data, stream=stream)
return res return res


def _ask_agent(self,question:str,stream:bool):
def _ask_agent(self, question: str, stream: bool):
res = self.post(f"/agents/{self.agent_id}/completions", res = self.post(f"/agents/{self.agent_id}/completions",
{"question": question, "stream": True,"session_id":self.id}, stream=stream)
{"question": question, "stream": True, "session_id": self.id}, stream=stream)
return res return res


def update(self,update_message):
def update(self, update_message):
res = self.put(f"/chats/{self.chat_id}/sessions/{self.id}", res = self.put(f"/chats/{self.chat_id}/sessions/{self.id}",
update_message)
update_message)
res = res.json() res = res.json()
if res.get("code") != 0: if res.get("code") != 0:
raise Exception(res.get("message")) raise Exception(res.get("message"))



class Message(Base): class Message(Base):
def __init__(self, rag, res_dict): def __init__(self, rag, res_dict):
self.content = "Hi! I am your assistant,can I help you?" self.content = "Hi! I am your assistant,can I help you?"

+ 30
- 8
sdk/python/test/conftest.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import os import os
import pytest import pytest
import requests import requests



HOST_ADDRESS = os.getenv('HOST_ADDRESS', 'http://127.0.0.1:9380') HOST_ADDRESS = os.getenv('HOST_ADDRESS', 'http://127.0.0.1:9380')



# def generate_random_email(): # def generate_random_email():
# return 'user_' + ''.join(random.choices(string.ascii_lowercase + string.digits, k=8))+'@1.com' # return 'user_' + ''.join(random.choices(string.ascii_lowercase + string.digits, k=8))+'@1.com'


def generate_email(): def generate_email():
return 'user_123@1.com' return 'user_123@1.com'



EMAIL = generate_email() EMAIL = generate_email()
# password is "123" # password is "123"
PASSWORD='''ctAseGvejiaSWWZ88T/m4FQVOpQyUvP+x7sXtdv3feqZACiQleuewkUi35E16wSd5C5QcnkkcV9cYc8TKPTRZlxappDuirxghxoOvFcJxFU4ixLsD
PASSWORD = '''ctAseGvejiaSWWZ88T/m4FQVOpQyUvP+x7sXtdv3feqZACiQleuewkUi35E16wSd5C5QcnkkcV9cYc8TKPTRZlxappDuirxghxoOvFcJxFU4ixLsD
fN33jCHRoDUW81IH9zjij/vaw8IbVyb6vuwg6MX6inOEBRRzVbRYxXOu1wkWY6SsI8X70oF9aeLFp/PzQpjoe/YbSqpTq8qqrmHzn9vO+yvyYyvmDsphXe fN33jCHRoDUW81IH9zjij/vaw8IbVyb6vuwg6MX6inOEBRRzVbRYxXOu1wkWY6SsI8X70oF9aeLFp/PzQpjoe/YbSqpTq8qqrmHzn9vO+yvyYyvmDsphXe
X8f7fp9c7vUsfOCkM+gHY3PadG+QHa7KI7mzTKgUTZImK6BZtfRBATDTthEUbbaTewY4H0MnWiCeeDhcbeQao6cFy1To8pE3RpmxnGnS8BsBn8w==''' X8f7fp9c7vUsfOCkM+gHY3PadG+QHa7KI7mzTKgUTZImK6BZtfRBATDTthEUbbaTewY4H0MnWiCeeDhcbeQao6cFy1To8pE3RpmxnGnS8BsBn8w=='''



def register(): def register():
url = HOST_ADDRESS + "/v1/user/register" url = HOST_ADDRESS + "/v1/user/register"
name = "user" name = "user"
register_data = {"email":EMAIL,"nickname":name,"password":PASSWORD}
res = requests.post(url=url,json=register_data)
register_data = {"email": EMAIL, "nickname": name, "password": PASSWORD}
res = requests.post(url=url, json=register_data)
res = res.json() res = res.json()
if res.get("code") != 0: if res.get("code") != 0:
raise Exception(res.get("message")) raise Exception(res.get("message"))



def login(): def login():
url = HOST_ADDRESS + "/v1/user/login" url = HOST_ADDRESS + "/v1/user/login"
login_data = {"email":EMAIL,"password":PASSWORD}
response=requests.post(url=url,json=login_data)
login_data = {"email": EMAIL, "password": PASSWORD}
response = requests.post(url=url, json=login_data)
res = response.json() res = response.json()
if res.get("code")!=0:
if res.get("code") != 0:
raise Exception(res.get("message")) raise Exception(res.get("message"))
auth = response.headers["Authorization"] auth = response.headers["Authorization"]
return auth return auth



@pytest.fixture(scope="session") @pytest.fixture(scope="session")
def get_api_key_fixture(): def get_api_key_fixture():
try: try:
auth = login() auth = login()
url = HOST_ADDRESS + "/v1/system/new_token" url = HOST_ADDRESS + "/v1/system/new_token"
auth = {"Authorization": auth} auth = {"Authorization": auth}
response = requests.post(url=url,headers=auth)
response = requests.post(url=url, headers=auth)
res = response.json() res = response.json()
if res.get("code") != 0: if res.get("code") != 0:
raise Exception(res.get("message")) raise Exception(res.get("message"))
return res["data"].get("token") return res["data"].get("token")



@pytest.fixture(scope="session") @pytest.fixture(scope="session")
def get_auth(): def get_auth():
try: try:
auth = login() auth = login()
return auth return auth



@pytest.fixture(scope="session") @pytest.fixture(scope="session")
def get_email(): def get_email():
return EMAIL return EMAIL

+ 16
- 0
sdk/python/test/test_frontend_api/common.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import os import os
import requests import requests



+ 16
- 0
sdk/python/test/test_frontend_api/get_email.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

def test_get_email(get_email): def test_get_email(get_email):
print("\nEmail account:",flush=True) print("\nEmail account:",flush=True)
print(f"{get_email}\n",flush=True) print(f"{get_email}\n",flush=True)

+ 18
- 2
sdk/python/test/test_frontend_api/test_dataset.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from common import create_dataset, list_dataset, rm_dataset, update_dataset, DATASET_NAME_LIMIT from common import create_dataset, list_dataset, rm_dataset, update_dataset, DATASET_NAME_LIMIT
import re import re
import random import random
print(f"found {len(dataset_list)} datasets") print(f"found {len(dataset_list)} datasets")
dataset_id = dataset_list[0] dataset_id = dataset_list[0]


json_req = {"kb_id": dataset_id, "name": "test_update_dataset", "description": "test", "permission": "me", "parser_id": "presentation",
json_req = {"kb_id": dataset_id, "name": "test_update_dataset", "description": "test", "permission": "me",
"parser_id": "presentation",
"language": "spanish"} "language": "spanish"}
res = update_dataset(get_auth, json_req) res = update_dataset(get_auth, json_req)
assert res.get("code") == 0, f"{res.get('message')}" assert res.get("code") == 0, f"{res.get('message')}"
res = rm_dataset(get_auth, dataset_id) res = rm_dataset(get_auth, dataset_id)
assert res.get("code") == 0, f"{res.get('message')}" assert res.get("code") == 0, f"{res.get('message')}"
print(f"{len(dataset_list)} datasets are deleted") print(f"{len(dataset_list)} datasets are deleted")


+ 18
- 1
sdk/python/test/test_sdk_api/common.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import os import os
HOST_ADDRESS=os.getenv('HOST_ADDRESS', 'http://127.0.0.1:9380')

HOST_ADDRESS = os.getenv('HOST_ADDRESS', 'http://127.0.0.1:9380')

+ 18
- 2
sdk/python/test/test_sdk_api/get_email.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

def test_get_email(get_email): def test_get_email(get_email):
print("\nEmail account:",flush=True)
print(f"{get_email}\n",flush=True)
print("\nEmail account:", flush=True)
print(f"{get_email}\n", flush=True)

+ 22
- 5
sdk/python/test/test_sdk_api/t_agent.py 查看文件

from ragflow_sdk import RAGFlow,Agent
#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from ragflow_sdk import RAGFlow, Agent
from common import HOST_ADDRESS from common import HOST_ADDRESS
import pytest import pytest



@pytest.mark.skip(reason="") @pytest.mark.skip(reason="")
def test_list_agents_with_success(get_api_key_fixture): def test_list_agents_with_success(get_api_key_fixture):
API_KEY=get_api_key_fixture
rag = RAGFlow(API_KEY,HOST_ADDRESS)
API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS)
rag.list_agents() rag.list_agents()




def test_converse_with_agent_with_success(get_api_key_fixture): def test_converse_with_agent_with_success(get_api_key_fixture):
API_KEY = "ragflow-BkOGNhYjIyN2JiODExZWY5MzVhMDI0Mm" API_KEY = "ragflow-BkOGNhYjIyN2JiODExZWY5MzVhMDI0Mm"
agent_id = "ebfada2eb2bc11ef968a0242ac120006" agent_id = "ebfada2eb2bc11ef968a0242ac120006"
rag = RAGFlow(API_KEY,HOST_ADDRESS)
rag = RAGFlow(API_KEY, HOST_ADDRESS)
lang = "Chinese" lang = "Chinese"
file = "How is the weather tomorrow?" file = "How is the weather tomorrow?"
Agent.ask(agent_id=agent_id,rag=rag,lang=lang,file=file)
Agent.ask(agent_id=agent_id, rag=rag, lang=lang, file=file)

+ 20
- 4
sdk/python/test/test_sdk_api/t_chat.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from ragflow_sdk import RAGFlow from ragflow_sdk import RAGFlow
from common import HOST_ADDRESS from common import HOST_ADDRESS



def test_create_chat_with_name(get_api_key_fixture): def test_create_chat_with_name(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
display_name = "ragflow.txt" display_name = "ragflow.txt"
with open("test_data/ragflow.txt", "rb") as file: with open("test_data/ragflow.txt", "rb") as file:
blob = file.read() blob = file.read()
document = {"display_name":display_name,"blob":blob}
document = {"display_name": display_name, "blob": blob}
documents = [] documents = []
documents.append(document) documents.append(document)
docs= kb.upload_documents(documents)
docs = kb.upload_documents(documents)
for doc in docs: for doc in docs:
doc.add_chunk("This is a test to add chunk") doc.add_chunk("This is a test to add chunk")
rag.create_chat("test_create_chat", dataset_ids=[kb.id]) rag.create_chat("test_create_chat", dataset_ids=[kb.id])
chat = rag.create_chat("test_delete_chat", dataset_ids=[kb.id]) chat = rag.create_chat("test_delete_chat", dataset_ids=[kb.id])
rag.delete_chats(ids=[chat.id]) rag.delete_chats(ids=[chat.id])



def test_list_chats_with_success(get_api_key_fixture): def test_list_chats_with_success(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
rag.create_chat("test_list_1", dataset_ids=[kb.id]) rag.create_chat("test_list_1", dataset_ids=[kb.id])
rag.create_chat("test_list_2", dataset_ids=[kb.id]) rag.create_chat("test_list_2", dataset_ids=[kb.id])
rag.list_chats() rag.list_chats()



+ 32
- 12
sdk/python/test/test_sdk_api/t_chunk.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from ragflow_sdk import RAGFlow from ragflow_sdk import RAGFlow
from common import HOST_ADDRESS from common import HOST_ADDRESS
from time import sleep from time import sleep



def test_parse_document_with_txt(get_api_key_fixture): def test_parse_document_with_txt(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_parse_document") ds = rag.create_dataset(name="test_parse_document")
name = 'ragflow_test.txt' name = 'ragflow_test.txt'
with open("test_data/ragflow_test.txt", "rb") as file :
with open("test_data/ragflow_test.txt", "rb") as file:
blob = file.read() blob = file.read()
docs = ds.upload_documents([{"display_name": name, "blob": blob}]) docs = ds.upload_documents([{"display_name": name, "blob": blob}])
doc = docs[0] doc = docs[0]
raise Exception("Run time ERROR: Document parsing did not complete in time.") raise Exception("Run time ERROR: Document parsing did not complete in time.")
''' '''



def test_parse_and_cancel_document(get_api_key_fixture): def test_parse_and_cancel_document(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_parse_and_cancel_document") ds = rag.create_dataset(name="test_parse_and_cancel_document")
name = 'ragflow_test.txt' name = 'ragflow_test.txt'
with open("test_data/ragflow_test.txt", "rb") as file :
with open("test_data/ragflow_test.txt", "rb") as file:
blob = file.read() blob = file.read()
docs=ds.upload_documents([{"display_name": name, "blob": blob}])
docs = ds.upload_documents([{"display_name": name, "blob": blob}])
doc = docs[0] doc = docs[0]
ds.async_parse_documents(document_ids=[doc.id]) ds.async_parse_documents(document_ids=[doc.id])
sleep(1) sleep(1)
raise Exception("Run time ERROR: Bulk document parsing did not complete in time.") raise Exception("Run time ERROR: Bulk document parsing did not complete in time.")
''' '''



def test_list_chunks_with_success(get_api_key_fixture): def test_list_chunks_with_success(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
{'display_name': f'chunk_{i}.txt', 'blob': chunk} for i, chunk in enumerate(chunks) {'display_name': f'chunk_{i}.txt', 'blob': chunk} for i, chunk in enumerate(chunks)
] ]
''' '''
documents =[{"display_name":"test_list_chunks_with_success.txt","blob":blob}]
documents = [{"display_name": "test_list_chunks_with_success.txt", "blob": blob}]
docs = ds.upload_documents(documents) docs = ds.upload_documents(documents)
ids = [doc.id for doc in docs] ids = [doc.id for doc in docs]
ds.async_parse_documents(ids) ds.async_parse_documents(ids)
{'display_name': f'chunk_{i}.txt', 'blob': chunk} for i, chunk in enumerate(chunks) {'display_name': f'chunk_{i}.txt', 'blob': chunk} for i, chunk in enumerate(chunks)
] ]
''' '''
documents =[{"display_name":"test_list_chunks_with_success.txt","blob":blob}]
documents = [{"display_name": "test_list_chunks_with_success.txt", "blob": blob}]
docs = ds.upload_documents(documents) docs = ds.upload_documents(documents)
doc = docs[0] doc = docs[0]
doc.add_chunk(content="This is a chunk addition test") doc.add_chunk(content="This is a chunk addition test")
{'display_name': f'chunk_{i}.txt', 'blob': chunk} for i, chunk in enumerate(chunks) {'display_name': f'chunk_{i}.txt', 'blob': chunk} for i, chunk in enumerate(chunks)
] ]
''' '''
documents =[{"display_name":"test_delete_chunk_with_success.txt","blob":blob}]
documents = [{"display_name": "test_delete_chunk_with_success.txt", "blob": blob}]
docs = ds.upload_documents(documents) docs = ds.upload_documents(documents)
doc = docs[0] doc = docs[0]
chunk = doc.add_chunk(content="This is a chunk addition test") chunk = doc.add_chunk(content="This is a chunk addition test")
{'display_name': f'chunk_{i}.txt', 'blob': chunk} for i, chunk in enumerate(chunks) {'display_name': f'chunk_{i}.txt', 'blob': chunk} for i, chunk in enumerate(chunks)
] ]
''' '''
documents =[{"display_name":"test_update_chunk_content_with_success.txt","blob":blob}]
documents = [{"display_name": "test_update_chunk_content_with_success.txt", "blob": blob}]
docs = ds.upload_documents(documents) docs = ds.upload_documents(documents)
doc = docs[0] doc = docs[0]
chunk = doc.add_chunk(content="This is a chunk addition test") chunk = doc.add_chunk(content="This is a chunk addition test")
# For Elasticsearch, the chunk is not searchable in shot time (~2s). # For Elasticsearch, the chunk is not searchable in shot time (~2s).
sleep(3) sleep(3)
chunk.update({"content":"This is a updated content"})
chunk.update({"content": "This is a updated content"})



def test_update_chunk_available(get_api_key_fixture): def test_update_chunk_available(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
{'display_name': f'chunk_{i}.txt', 'blob': chunk} for i, chunk in enumerate(chunks) {'display_name': f'chunk_{i}.txt', 'blob': chunk} for i, chunk in enumerate(chunks)
] ]
''' '''
documents =[{"display_name":"test_update_chunk_available_with_success.txt","blob":blob}]
documents = [{"display_name": "test_update_chunk_available_with_success.txt", "blob": blob}]
docs = ds.upload_documents(documents) docs = ds.upload_documents(documents)
doc = docs[0] doc = docs[0]
chunk = doc.add_chunk(content="This is a chunk addition test") chunk = doc.add_chunk(content="This is a chunk addition test")
# For Elasticsearch, the chunk is not searchable in shot time (~2s). # For Elasticsearch, the chunk is not searchable in shot time (~2s).
sleep(3) sleep(3)
chunk.update({"available":0})
chunk.update({"available": 0})




def test_retrieve_chunks(get_api_key_fixture): def test_retrieve_chunks(get_api_key_fixture):
{'display_name': f'chunk_{i}.txt', 'blob': chunk} for i, chunk in enumerate(chunks) {'display_name': f'chunk_{i}.txt', 'blob': chunk} for i, chunk in enumerate(chunks)
] ]
''' '''
documents =[{"display_name":"test_retrieve_chunks.txt","blob":blob}]
documents = [{"display_name": "test_retrieve_chunks.txt", "blob": blob}]
docs = ds.upload_documents(documents) docs = ds.upload_documents(documents)
doc = docs[0] doc = docs[0]
doc.add_chunk(content="This is a chunk addition test") doc.add_chunk(content="This is a chunk addition test")
rag.retrieve(dataset_ids=[ds.id],document_ids=[doc.id])
rag.retrieve(dataset_ids=[ds.id], document_ids=[doc.id])
rag.delete_datasets(ids=[ds.id]) rag.delete_datasets(ids=[ds.id])


# test different parameters for the retrieval # test different parameters for the retrieval

+ 24
- 3
sdk/python/test/test_sdk_api/t_dataset.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from ragflow_sdk import RAGFlow from ragflow_sdk import RAGFlow
import random import random
import pytest import pytest
from common import HOST_ADDRESS from common import HOST_ADDRESS



def test_create_dataset_with_name(get_api_key_fixture): def test_create_dataset_with_name(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
rag.create_dataset("test_create_dataset_with_name") rag.create_dataset("test_create_dataset_with_name")



def test_create_dataset_with_duplicated_name(get_api_key_fixture): def test_create_dataset_with_duplicated_name(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
rag.create_dataset("test_create_dataset_with_duplicated_name") rag.create_dataset("test_create_dataset_with_duplicated_name")
assert str(exc_info.value) == "Duplicated dataset name in creating dataset." assert str(exc_info.value) == "Duplicated dataset name in creating dataset."



def test_create_dataset_with_random_chunk_method(get_api_key_fixture): def test_create_dataset_with_random_chunk_method(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
valid_chunk_methods = ["naive","manual","qa","table","paper","book","laws","presentation","picture","one","knowledge_graph","email"]
valid_chunk_methods = ["naive", "manual", "qa", "table", "paper", "book", "laws", "presentation", "picture", "one",
"knowledge_graph", "email"]
random_chunk_method = random.choice(valid_chunk_methods) random_chunk_method = random.choice(valid_chunk_methods)
rag.create_dataset("test_create_dataset_with_random_chunk_method",chunk_method=random_chunk_method)
rag.create_dataset("test_create_dataset_with_random_chunk_method", chunk_method=random_chunk_method)



def test_create_dataset_with_invalid_parameter(get_api_key_fixture): def test_create_dataset_with_invalid_parameter(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
"knowledge_graph", "email", "tag"] "knowledge_graph", "email", "tag"]
chunk_method = "invalid_chunk_method" chunk_method = "invalid_chunk_method"
with pytest.raises(Exception) as exc_info: with pytest.raises(Exception) as exc_info:
rag.create_dataset("test_create_dataset_with_invalid_chunk_method",chunk_method=chunk_method)
rag.create_dataset("test_create_dataset_with_invalid_chunk_method", chunk_method=chunk_method)
assert str(exc_info.value) == f"'{chunk_method}' is not in {valid_chunk_methods}" assert str(exc_info.value) == f"'{chunk_method}' is not in {valid_chunk_methods}"





+ 73
- 41
sdk/python/test/test_sdk_api/t_document.py 查看文件

#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from ragflow_sdk import RAGFlow from ragflow_sdk import RAGFlow
from common import HOST_ADDRESS from common import HOST_ADDRESS
import pytest import pytest



def test_upload_document_with_success(get_api_key_fixture): def test_upload_document_with_success(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_upload_document") ds = rag.create_dataset(name="test_upload_document")
blob = b"Sample document content for test." blob = b"Sample document content for test."
with open("test_data/ragflow.txt", "rb") as file: with open("test_data/ragflow.txt", "rb") as file:
blob_2=file.read()
blob_2 = file.read()
document_infos = [] document_infos = []
document_infos.append({"display_name": "test_1.txt","blob": blob})
document_infos.append({"display_name": "test_2.txt","blob": blob_2})
document_infos.append({"display_name": "test_1.txt", "blob": blob})
document_infos.append({"display_name": "test_2.txt", "blob": blob_2})
ds.upload_documents(document_infos) ds.upload_documents(document_infos)




rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_update_document") ds = rag.create_dataset(name="test_update_document")
blob = b"Sample document content for test." blob = b"Sample document content for test."
document_infos=[{"display_name":"test.txt","blob":blob}]
docs=ds.upload_documents(document_infos)
document_infos = [{"display_name": "test.txt", "blob": blob}]
docs = ds.upload_documents(document_infos)
doc = docs[0] doc = docs[0]
doc.update({"chunk_method": "manual", "name": "manual.txt"}) doc.update({"chunk_method": "manual", "name": "manual.txt"})


rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_download_document") ds = rag.create_dataset(name="test_download_document")
blob = b"Sample document content for test." blob = b"Sample document content for test."
document_infos=[{"display_name": "test_1.txt","blob": blob}]
docs=ds.upload_documents(document_infos)
document_infos = [{"display_name": "test_1.txt", "blob": blob}]
docs = ds.upload_documents(document_infos)
doc = docs[0] doc = docs[0]
with open("test_download.txt","wb+") as file:
with open("test_download.txt", "wb+") as file:
file.write(doc.download()) file.write(doc.download())




rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_list_documents") ds = rag.create_dataset(name="test_list_documents")
blob = b"Sample document content for test." blob = b"Sample document content for test."
document_infos = [{"display_name": "test.txt","blob":blob}]
document_infos = [{"display_name": "test.txt", "blob": blob}]
ds.upload_documents(document_infos) ds.upload_documents(document_infos)
ds.list_documents(keywords="test", page=1, page_size=12) ds.list_documents(keywords="test", page=1, page_size=12)


ds = rag.create_dataset(name="test_delete_documents") ds = rag.create_dataset(name="test_delete_documents")
name = "test_delete_documents.txt" name = "test_delete_documents.txt"
blob = b"Sample document content for test." blob = b"Sample document content for test."
document_infos=[{"display_name": name, "blob": blob}]
document_infos = [{"display_name": name, "blob": blob}]
docs = ds.upload_documents(document_infos) docs = ds.upload_documents(document_infos)
ds.delete_documents([docs[0].id]) ds.delete_documents([docs[0].id])



# upload and parse the document with different in different parse method. # upload and parse the document with different in different parse method.
def test_upload_and_parse_pdf_documents_with_general_parse_method(get_api_key_fixture): def test_upload_and_parse_pdf_documents_with_general_parse_method(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_pdf_document") ds = rag.create_dataset(name="test_pdf_document")
with open("test_data/test.pdf", "rb") as file: with open("test_data/test.pdf", "rb") as file:
blob=file.read()
document_infos = [{"display_name": "test.pdf","blob": blob}]
docs=ds.upload_documents(document_infos)
blob = file.read()
document_infos = [{"display_name": "test.pdf", "blob": blob}]
docs = ds.upload_documents(document_infos)
doc = docs[0] doc = docs[0]
ds.async_parse_documents([doc.id]) ds.async_parse_documents([doc.id])



def test_upload_and_parse_docx_documents_with_general_parse_method(get_api_key_fixture): def test_upload_and_parse_docx_documents_with_general_parse_method(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_docx_document") ds = rag.create_dataset(name="test_docx_document")
with open("test_data/test.docx", "rb") as file: with open("test_data/test.docx", "rb") as file:
blob=file.read()
document_infos = [{"display_name": "test.docx","blob": blob}]
docs=ds.upload_documents(document_infos)
blob = file.read()
document_infos = [{"display_name": "test.docx", "blob": blob}]
docs = ds.upload_documents(document_infos)
doc = docs[0] doc = docs[0]
ds.async_parse_documents([doc.id]) ds.async_parse_documents([doc.id])


def test_upload_and_parse_excel_documents_with_general_parse_method(get_api_key_fixture): def test_upload_and_parse_excel_documents_with_general_parse_method(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_excel_document") ds = rag.create_dataset(name="test_excel_document")
with open("test_data/test.xlsx", "rb") as file: with open("test_data/test.xlsx", "rb") as file:
blob=file.read()
document_infos = [{"display_name": "test.xlsx","blob": blob}]
docs=ds.upload_documents(document_infos)
blob = file.read()
document_infos = [{"display_name": "test.xlsx", "blob": blob}]
docs = ds.upload_documents(document_infos)
doc = docs[0] doc = docs[0]
ds.async_parse_documents([doc.id]) ds.async_parse_documents([doc.id])


def test_upload_and_parse_ppt_documents_with_general_parse_method(get_api_key_fixture): def test_upload_and_parse_ppt_documents_with_general_parse_method(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_ppt_document") ds = rag.create_dataset(name="test_ppt_document")
with open("test_data/test.ppt", "rb") as file: with open("test_data/test.ppt", "rb") as file:
blob=file.read()
document_infos = [{"display_name": "test.ppt","blob": blob}]
docs=ds.upload_documents(document_infos)
blob = file.read()
document_infos = [{"display_name": "test.ppt", "blob": blob}]
docs = ds.upload_documents(document_infos)
doc = docs[0] doc = docs[0]
ds.async_parse_documents([doc.id]) ds.async_parse_documents([doc.id])


def test_upload_and_parse_image_documents_with_general_parse_method(get_api_key_fixture): def test_upload_and_parse_image_documents_with_general_parse_method(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_image_document") ds = rag.create_dataset(name="test_image_document")
with open("test_data/test.jpg", "rb") as file: with open("test_data/test.jpg", "rb") as file:
blob=file.read()
document_infos = [{"display_name": "test.jpg","blob": blob}]
docs=ds.upload_documents(document_infos)
blob = file.read()
document_infos = [{"display_name": "test.jpg", "blob": blob}]
docs = ds.upload_documents(document_infos)
doc = docs[0] doc = docs[0]
ds.async_parse_documents([doc.id]) ds.async_parse_documents([doc.id])


def test_upload_and_parse_txt_documents_with_general_parse_method(get_api_key_fixture): def test_upload_and_parse_txt_documents_with_general_parse_method(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_txt_document") ds = rag.create_dataset(name="test_txt_document")
with open("test_data/test.txt", "rb") as file: with open("test_data/test.txt", "rb") as file:
blob=file.read()
document_infos = [{"display_name": "test.txt","blob": blob}]
docs=ds.upload_documents(document_infos)
blob = file.read()
document_infos = [{"display_name": "test.txt", "blob": blob}]
docs = ds.upload_documents(document_infos)
doc = docs[0] doc = docs[0]
ds.async_parse_documents([doc.id]) ds.async_parse_documents([doc.id])


def test_upload_and_parse_md_documents_with_general_parse_method(get_api_key_fixture): def test_upload_and_parse_md_documents_with_general_parse_method(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_md_document") ds = rag.create_dataset(name="test_md_document")
with open("test_data/test.md", "rb") as file: with open("test_data/test.md", "rb") as file:
blob=file.read()
document_infos = [{"display_name": "test.md","blob": blob}]
docs=ds.upload_documents(document_infos)
blob = file.read()
document_infos = [{"display_name": "test.md", "blob": blob}]
docs = ds.upload_documents(document_infos)
doc = docs[0] doc = docs[0]
ds.async_parse_documents([doc.id]) ds.async_parse_documents([doc.id])



def test_upload_and_parse_json_documents_with_general_parse_method(get_api_key_fixture): def test_upload_and_parse_json_documents_with_general_parse_method(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_json_document") ds = rag.create_dataset(name="test_json_document")
with open("test_data/test.json", "rb") as file: with open("test_data/test.json", "rb") as file:
blob=file.read()
document_infos = [{"display_name": "test.json","blob": blob}]
docs=ds.upload_documents(document_infos)
blob = file.read()
document_infos = [{"display_name": "test.json", "blob": blob}]
docs = ds.upload_documents(document_infos)
doc = docs[0] doc = docs[0]
ds.async_parse_documents([doc.id]) ds.async_parse_documents([doc.id])



@pytest.mark.skip(reason="") @pytest.mark.skip(reason="")
def test_upload_and_parse_eml_documents_with_general_parse_method(get_api_key_fixture): def test_upload_and_parse_eml_documents_with_general_parse_method(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_eml_document") ds = rag.create_dataset(name="test_eml_document")
with open("test_data/test.eml", "rb") as file: with open("test_data/test.eml", "rb") as file:
blob=file.read()
document_infos = [{"display_name": "test.eml","blob": blob}]
docs=ds.upload_documents(document_infos)
blob = file.read()
document_infos = [{"display_name": "test.eml", "blob": blob}]
docs = ds.upload_documents(document_infos)
doc = docs[0] doc = docs[0]
ds.async_parse_documents([doc.id]) ds.async_parse_documents([doc.id])



def test_upload_and_parse_html_documents_with_general_parse_method(get_api_key_fixture): def test_upload_and_parse_html_documents_with_general_parse_method(get_api_key_fixture):
API_KEY = get_api_key_fixture API_KEY = get_api_key_fixture
rag = RAGFlow(API_KEY, HOST_ADDRESS) rag = RAGFlow(API_KEY, HOST_ADDRESS)
ds = rag.create_dataset(name="test_html_document") ds = rag.create_dataset(name="test_html_document")
with open("test_data/test.html", "rb") as file: with open("test_data/test.html", "rb") as file:
blob=file.read()
document_infos = [{"display_name": "test.html","blob": blob}]
docs=ds.upload_documents(document_infos)
blob = file.read()
document_infos = [{"display_name": "test.html", "blob": blob}]
docs = ds.upload_documents(document_infos)
doc = docs[0] doc = docs[0]
ds.async_parse_documents([doc.id])
ds.async_parse_documents([doc.id])

+ 34
- 15
sdk/python/test/test_sdk_api/t_session.py 查看文件

from ragflow_sdk import RAGFlow,Agent
#
# Copyright 2025 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from ragflow_sdk import RAGFlow, Agent
from common import HOST_ADDRESS from common import HOST_ADDRESS
import pytest import pytest


display_name = "ragflow.txt" display_name = "ragflow.txt"
with open("test_data/ragflow.txt", "rb") as file: with open("test_data/ragflow.txt", "rb") as file:
blob = file.read() blob = file.read()
document = {"display_name":display_name,"blob":blob}
document = {"display_name": display_name, "blob": blob}
documents = [] documents = []
documents.append(document) documents.append(document)
docs= kb.upload_documents(documents)
docs = kb.upload_documents(documents)
for doc in docs: for doc in docs:
doc.add_chunk("This is a test to add chunk") doc.add_chunk("This is a test to add chunk")
assistant=rag.create_chat("test_create_session", dataset_ids=[kb.id])
assistant = rag.create_chat("test_create_session", dataset_ids=[kb.id])
assistant.create_session() assistant.create_session()




question = "What is AI" question = "What is AI"
for ans in session.ask(question): for ans in session.ask(question):
pass pass
# assert not ans.content.startswith("**ERROR**"), "Please check this error." # assert not ans.content.startswith("**ERROR**"), "Please check this error."




display_name = "ragflow.txt" display_name = "ragflow.txt"
with open("test_data/ragflow.txt", "rb") as file: with open("test_data/ragflow.txt", "rb") as file:
blob = file.read() blob = file.read()
document = {"display_name":display_name,"blob":blob}
document = {"display_name": display_name, "blob": blob}
documents = [] documents = []
documents.append(document) documents.append(document)
docs= kb.upload_documents(documents)
docs = kb.upload_documents(documents)
for doc in docs: for doc in docs:
doc.add_chunk("This is a test to add chunk") doc.add_chunk("This is a test to add chunk")
assistant=rag.create_chat("test_delete_session", dataset_ids=[kb.id])
assistant = rag.create_chat("test_delete_session", dataset_ids=[kb.id])
session = assistant.create_session() session = assistant.create_session()
assistant.delete_sessions(ids=[session.id]) assistant.delete_sessions(ids=[session.id])


display_name = "ragflow.txt" display_name = "ragflow.txt"
with open("test_data/ragflow.txt", "rb") as file: with open("test_data/ragflow.txt", "rb") as file:
blob = file.read() blob = file.read()
document = {"display_name":display_name,"blob":blob}
document = {"display_name": display_name, "blob": blob}
documents = [] documents = []
documents.append(document) documents.append(document)
docs= kb.upload_documents(documents)
docs = kb.upload_documents(documents)
for doc in docs: for doc in docs:
doc.add_chunk("This is a test to add chunk") doc.add_chunk("This is a test to add chunk")
assistant=rag.create_chat("test_list_session", dataset_ids=[kb.id])
assistant = rag.create_chat("test_list_session", dataset_ids=[kb.id])
assistant.create_session("test_1") assistant.create_session("test_1")
assistant.create_session("test_2") assistant.create_session("test_2")
assistant.list_sessions() assistant.list_sessions()



@pytest.mark.skip(reason="") @pytest.mark.skip(reason="")
def test_create_agent_session_with_success(get_api_key_fixture): def test_create_agent_session_with_success(get_api_key_fixture):
API_KEY = "ragflow-BkOGNhYjIyN2JiODExZWY5MzVhMDI0Mm" API_KEY = "ragflow-BkOGNhYjIyN2JiODExZWY5MzVhMDI0Mm"
rag = RAGFlow(API_KEY,HOST_ADDRESS)
rag = RAGFlow(API_KEY, HOST_ADDRESS)
Agent.create_session("2e45b5209c1011efa3e90242ac120006", rag) Agent.create_session("2e45b5209c1011efa3e90242ac120006", rag)



@pytest.mark.skip(reason="") @pytest.mark.skip(reason="")
def test_create_agent_conversation_with_success(get_api_key_fixture): def test_create_agent_conversation_with_success(get_api_key_fixture):
API_KEY = "ragflow-BkOGNhYjIyN2JiODExZWY5MzVhMDI0Mm" API_KEY = "ragflow-BkOGNhYjIyN2JiODExZWY5MzVhMDI0Mm"
rag = RAGFlow(API_KEY,HOST_ADDRESS)
rag = RAGFlow(API_KEY, HOST_ADDRESS)
session = Agent.create_session("2e45b5209c1011efa3e90242ac120006", rag) session = Agent.create_session("2e45b5209c1011efa3e90242ac120006", rag)
session.ask("What is this job") session.ask("What is this job")



@pytest.mark.skip(reason="") @pytest.mark.skip(reason="")
def test_list_agent_sessions_with_success(get_api_key_fixture): def test_list_agent_sessions_with_success(get_api_key_fixture):
API_KEY = "ragflow-BkOGNhYjIyN2JiODExZWY5MzVhMDI0Mm" API_KEY = "ragflow-BkOGNhYjIyN2JiODExZWY5MzVhMDI0Mm"
agent_id = "2710f2269b4611ef8fdf0242ac120006" agent_id = "2710f2269b4611ef8fdf0242ac120006"
rag = RAGFlow(API_KEY,HOST_ADDRESS)
Agent.list_sessions(agent_id,rag)
rag = RAGFlow(API_KEY, HOST_ADDRESS)
Agent.list_sessions(agent_id, rag)

正在加载...
取消
保存