Você não pode selecionar mais de 25 tópicos Os tópicos devem começar com uma letra ou um número, podem incluir traços ('-') e podem ter até 35 caracteres.

api_app.py 12KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307
  1. #
  2. # Copyright 2024 The InfiniFlow Authors. All Rights Reserved.
  3. #
  4. # Licensed under the Apache License, Version 2.0 (the "License");
  5. # you may not use this file except in compliance with the License.
  6. # You may obtain a copy of the License at
  7. #
  8. # http://www.apache.org/licenses/LICENSE-2.0
  9. #
  10. # Unless required by applicable law or agreed to in writing, software
  11. # distributed under the License is distributed on an "AS IS" BASIS,
  12. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. # See the License for the specific language governing permissions and
  14. # limitations under the License.
  15. #
  16. import os
  17. import re
  18. from datetime import datetime, timedelta
  19. from flask import request
  20. from flask_login import login_required, current_user
  21. from api.db import FileType, ParserType
  22. from api.db.db_models import APIToken, API4Conversation
  23. from api.db.services import duplicate_name
  24. from api.db.services.api_service import APITokenService, API4ConversationService
  25. from api.db.services.dialog_service import DialogService, chat
  26. from api.db.services.document_service import DocumentService
  27. from api.db.services.knowledgebase_service import KnowledgebaseService
  28. from api.db.services.user_service import UserTenantService
  29. from api.settings import RetCode
  30. from api.utils import get_uuid, current_timestamp, datetime_format
  31. from api.utils.api_utils import server_error_response, get_data_error_result, get_json_result, validate_request
  32. from itsdangerous import URLSafeTimedSerializer
  33. from api.db.services.task_service import TaskService, queue_tasks
  34. from api.utils.file_utils import filename_type, thumbnail
  35. from rag.utils.minio_conn import MINIO
  36. from api.db.db_models import Task
  37. from api.db.services.file2document_service import File2DocumentService
  def generate_confirmation_token(tenent_id):
      """Build a new API token string for a tenant.

      A fresh UUID is signed with a ``URLSafeTimedSerializer`` that uses the
      tenant id both as its secret key and as the salt. Characters 2..33 of
      the signed payload are kept and prefixed with ``"ragflow-"``.

      :param tenent_id: tenant identifier (parameter spelling kept for callers).
      :return: the token string, starting with ``"ragflow-"``.
      """
      signer = URLSafeTimedSerializer(tenent_id)
      signed_uuid = signer.dumps(get_uuid(), salt=tenent_id)
      return "ragflow-" + signed_uuid[2:34]
  @manager.route('/new_token', methods=['POST'])
  @validate_request("dialog_id")
  @login_required
  def new_token():
      """Create and persist an API token bound to a dialog.

      Expects a JSON body containing ``dialog_id``. The token is issued for the
      first tenant returned for the logged-in user.

      :return: a JSON result carrying the stored token record; a data-error
          result when the user has no tenant or the record cannot be saved; a
          server-error response when an exception is raised.
      """
      req = request.json
      try:
          tenants = UserTenantService.query(user_id=current_user.id)
          if not tenants:
              return get_data_error_result(retmsg="Tenant not found!")

          tenant_id = tenants[0].tenant_id
          obj = {
              "tenant_id": tenant_id,
              "token": generate_confirmation_token(tenant_id),
              "dialog_id": req["dialog_id"],
              "create_time": current_timestamp(),
              "create_date": datetime_format(datetime.now()),
              "update_time": None,
              "update_date": None,
          }

          if not APITokenService.save(**obj):
              # This endpoint stores a token, not a dialog; the message used to
              # say "dialog", which pointed callers at the wrong resource.
              return get_data_error_result(retmsg="Fail to create a new token!")
          return get_json_result(data=obj)
      except Exception as e:
          return server_error_response(e)
  @manager.route('/token_list', methods=['GET'])
  @login_required
  def token_list():
      """List the API tokens of a dialog for the logged-in user's first tenant.

      Reads ``dialog_id`` from the query string.

      :return: a JSON result holding one dict per token; a data-error result
          when the user has no tenant; a server-error response when an
          exception is raised (including a missing ``dialog_id`` argument).
      """
      try:
          user_tenants = UserTenantService.query(user_id=current_user.id)
          if user_tenants:
              first_tenant_id = user_tenants[0].tenant_id
              dialog_id = request.args["dialog_id"]
              tokens = APITokenService.query(tenant_id=first_tenant_id, dialog_id=dialog_id)
              return get_json_result(data=[tok.to_dict() for tok in tokens])
          return get_data_error_result(retmsg="Tenant not found!")
      except Exception as e:
          return server_error_response(e)
  @manager.route('/rm', methods=['POST'])
  @validate_request("tokens", "tenant_id")
  @login_required
  def rm():
      """Delete the API tokens listed in the request body.

      Expects a JSON body with ``tokens`` (an iterable of token strings) and
      ``tenant_id``. One delete is issued per token, filtered on both the
      tenant id and the token value.

      NOTE(review): ``tenant_id`` is taken from the request body and is not
      compared with the logged-in user's tenants in this block -- confirm that
      this is intended.

      :return: a JSON result with ``data=True``, or a server-error response
          when an exception is raised.
      """
      payload = request.json
      try:
          for token_value in payload["tokens"]:
              conditions = [
                  APIToken.tenant_id == payload["tenant_id"],
                  APIToken.token == token_value,
              ]
              APITokenService.filter_delete(conditions)
          return get_json_result(data=True)
      except Exception as e:
          return server_error_response(e)
  @manager.route('/stats', methods=['GET'])
  @login_required
  def stats():
      """Return per-date usage series for the logged-in user's first tenant.

      Optional query arguments ``from_date`` and ``to_date`` bound the period.
      They are passed to ``API4ConversationService.stats`` as given; when
      absent, the period runs from midnight six days ago up to now.

      :return: a JSON result with the series ``pv``, ``uv``, ``speed``,
          ``tokens``, ``round`` and ``thumb_up``, each a list of
          ``(dt, value)`` pairs; a data-error result when the user has no
          tenant; a server-error response when an exception is raised.
      """
      try:
          tenants = UserTenantService.query(user_id=current_user.id)
          if not tenants:
              return get_data_error_result(retmsg="Tenant not found!")

          now = datetime.now()
          # The default used to be "<7 days ago> 24:00:00". Hour 24 is not a
          # valid time of day, so the same instant is now written in its valid
          # form: 00:00:00 of the following day, i.e. six days ago.
          default_from = (now - timedelta(days=6)).strftime("%Y-%m-%d 00:00:00")
          default_to = now.strftime("%Y-%m-%d %H:%M:%S")

          objs = API4ConversationService.stats(
              tenants[0].tenant_id,
              request.args.get("from_date", default_from),
              request.args.get("to_date", default_to))
          res = {
              "pv": [(o["dt"], o["pv"]) for o in objs],
              "uv": [(o["dt"], o["uv"]) for o in objs],
              # The 0.1 added to the duration avoids a division by zero.
              "speed": [(o["dt"], float(o["tokens"]) / (float(o["duration"] + 0.1))) for o in objs],
              "tokens": [(o["dt"], float(o["tokens"]) / 1000.) for o in objs],
              "round": [(o["dt"], o["round"]) for o in objs],
              "thumb_up": [(o["dt"], o["thumb_up"]) for o in objs]
          }
          return get_json_result(data=res)
      except Exception as e:
          return server_error_response(e)
  @manager.route('/new_conversation', methods=['GET'])
  def set_conversation():
      """Open a new conversation on the dialog bound to the caller's API token.

      The token is the second whitespace-separated field of the
      ``Authorization`` header. The optional ``user_id`` query argument is
      stored on the conversation. The first message is the dialog's
      ``prompt_config["prologue"]`` with the ``assistant`` role.

      :return: a JSON result with the stored conversation as a dict; an
          authentication-error result when the token is missing or unknown; a
          data-error result when the dialog or the saved conversation cannot
          be found; a server-error response when an exception is raised.
      """
      # A missing or malformed header is an authentication failure, not a
      # crash: guard against both before indexing.
      auth_parts = (request.headers.get('Authorization') or '').split()
      objs = APIToken.query(token=auth_parts[1]) if len(auth_parts) > 1 else None
      if not objs:
          return get_json_result(
              data=False, retmsg='Token is not valid!', retcode=RetCode.AUTHENTICATION_ERROR)

      # The JSON body is deliberately not read here: this GET endpoint never
      # used it, and accessing it can raise when no JSON body is sent.
      try:
          e, dia = DialogService.get_by_id(objs[0].dialog_id)
          if not e:
              return get_data_error_result(retmsg="Dialog not found")
          conv = {
              "id": get_uuid(),
              "dialog_id": dia.id,
              "user_id": request.args.get("user_id", ""),
              "message": [{"role": "assistant", "content": dia.prompt_config["prologue"]}]
          }
          API4ConversationService.save(**conv)
          # Read the record back so the response reflects what was stored.
          e, conv = API4ConversationService.get_by_id(conv["id"])
          if not e:
              return get_data_error_result(retmsg="Fail to new a conversation!")
          conv = conv.to_dict()
          return get_json_result(data=conv)
      except Exception as e:
          return server_error_response(e)
  @manager.route('/completion', methods=['POST'])
  @validate_request("conversation_id", "messages")
  def completion():
      """Answer the latest message of a conversation and store the exchange.

      The API token is the second whitespace-separated field of the
      ``Authorization`` header. The JSON body must contain ``conversation_id``
      and ``messages``; any other keys are forwarded to ``chat`` as keyword
      arguments.

      :return: a JSON result with the answer returned by ``chat``; an
          authentication-error result when the token is missing or unknown; an
          argument-error result when no usable message remains; a data-error
          result when the conversation or dialog cannot be found; a
          server-error response when an exception is raised.
      """
      # A missing or malformed header is an authentication failure, not a
      # crash: guard against both before indexing.
      auth_parts = (request.headers.get('Authorization') or '').split()
      if len(auth_parts) < 2 or not APIToken.query(token=auth_parts[1]):
          return get_json_result(
              data=False, retmsg='Token is not valid!', retcode=RetCode.AUTHENTICATION_ERROR)

      req = request.json
      e, conv = API4ConversationService.get_by_id(req["conversation_id"])
      if not e:
          return get_data_error_result(retmsg="Conversation not found!")

      # Keep role/content only; drop system messages and any assistant
      # messages that come before the first kept message.
      msg = []
      for m in req["messages"]:
          if m["role"] == "system":
              continue
          if m["role"] == "assistant" and not msg:
              continue
          msg.append({"role": m["role"], "content": m["content"]})
      if not msg:
          # Without this guard msg[-1] below raises IndexError, which reached
          # the caller as a generic server error.
          return get_json_result(
              data=False, retmsg='No usable message found!', retcode=RetCode.ARGUMENT_ERROR)

      try:
          conv.message.append(msg[-1])
          e, dia = DialogService.get_by_id(conv.dialog_id)
          if not e:
              return get_data_error_result(retmsg="Dialog not found!")
          # Everything left in the body is passed through to chat().
          del req["conversation_id"]
          del req["messages"]
          ans = chat(dia, msg, **req)
          if not conv.reference:
              conv.reference = []
          conv.reference.append(ans["reference"])
          conv.message.append({"role": "assistant", "content": ans["answer"]})
          API4ConversationService.append_message(conv.id, conv.to_dict())
          return get_json_result(data=ans)
      except Exception as e:
          return server_error_response(e)
  @manager.route('/conversation/<conversation_id>', methods=['GET'])
  # @login_required
  def get(conversation_id):
      """Fetch one API conversation by its id.

      :param conversation_id: id taken from the URL path.
      :return: a JSON result with the conversation as a dict; a data-error
          result when no such conversation exists; a server-error response
          when an exception is raised.
      """
      try:
          found, conversation = API4ConversationService.get_by_id(conversation_id)
          if found:
              return get_json_result(data=conversation.to_dict())
          return get_data_error_result(retmsg="Conversation not found!")
      except Exception as e:
          return server_error_response(e)
  @manager.route('/document/upload', methods=['POST'])
  @validate_request("kb_name")
  def upload():
      """Upload a file into a knowledge base and optionally queue its parsing.

      The API token is the second whitespace-separated field of the
      ``Authorization`` header. Form fields: ``kb_name`` (required),
      ``parser_id`` (optional) and ``run`` (optional; ``"1"`` queues parsing
      tasks right after the upload). The file is read from the ``file`` part.

      :return: a JSON result with the inserted document; an
          authentication-error result when the token is missing or unknown; an
          argument-error result when no file is sent; a data-error result for
          an unknown knowledge base, an exceeded file quota, an unsupported
          file type or a document/tenant that cannot be resolved; a
          server-error response when an exception is raised.
      """
      # A missing or malformed header is an authentication failure, not a
      # crash: guard against both before indexing.
      auth_parts = (request.headers.get('Authorization') or '').split()
      objs = APIToken.query(token=auth_parts[1]) if len(auth_parts) > 1 else None
      if not objs:
          return get_json_result(
              data=False, retmsg='Token is not valid!', retcode=RetCode.AUTHENTICATION_ERROR)

      # kb_name may be absent from the form; the empty name then simply fails
      # the lookup below instead of raising on None.strip().
      kb_name = (request.form.get("kb_name") or "").strip()
      tenant_id = objs[0].tenant_id

      try:
          e, kb = KnowledgebaseService.get_by_name(kb_name, tenant_id)
          if not e:
              return get_data_error_result(
                  retmsg="Can't find this knowledgebase!")
          kb_id = kb.id
      except Exception as e:
          return server_error_response(e)

      if 'file' not in request.files:
          return get_json_result(
              data=False, retmsg='No file part!', retcode=RetCode.ARGUMENT_ERROR)

      file = request.files['file']
      if file.filename == '':
          return get_json_result(
              data=False, retmsg='No file selected!', retcode=RetCode.ARGUMENT_ERROR)

      form_data = request.form
      try:
          if DocumentService.get_doc_count(kb.tenant_id) >= int(os.environ.get('MAX_FILE_NUM_PER_USER', 8192)):
              return get_data_error_result(
                  retmsg="Exceed the maximum file number of a free user!")

          filename = duplicate_name(
              DocumentService.query,
              name=file.filename,
              kb_id=kb_id)
          filetype = filename_type(filename)
          if not filetype:
              return get_data_error_result(
                  retmsg="This type of file has not been supported yet!")

          # Append underscores until the storage key is unused in this bucket.
          location = filename
          while MINIO.obj_exist(kb_id, location):
              location += "_"
          blob = file.read()
          MINIO.put(kb_id, location, blob)

          doc = {
              "id": get_uuid(),
              "kb_id": kb.id,
              "parser_id": kb.parser_id,
              "parser_config": kb.parser_config,
              "created_by": kb.tenant_id,
              "type": filetype,
              "name": filename,
              "location": location,
              "size": len(blob),
              "thumbnail": thumbnail(filename, blob)
          }

          if "parser_id" in form_data:
              requested_parser = form_data.get("parser_id").strip()
              # NOTE(review): the [1:-3] slice presumably selects the parser
              # ids a caller may request; it depends on the attribute order of
              # ParserType -- confirm against the enum definition.
              if requested_parser in list(vars(ParserType).values())[1:-3]:
                  doc["parser_id"] = requested_parser
          # The file type and the extension override any requested parser.
          if doc["type"] == FileType.VISUAL:
              doc["parser_id"] = ParserType.PICTURE.value
          if re.search(r"\.(ppt|pptx|pages)$", filename):
              doc["parser_id"] = ParserType.PRESENTATION.value

          doc_result = DocumentService.insert(doc)
      except Exception as e:
          return server_error_response(e)

      if "run" in form_data and form_data.get("run").strip() == "1":
          try:
              doc_id = doc["id"]
              # Reset progress counters before (re)queueing the parsing tasks.
              info = {
                  "run": 1,
                  "progress": 0,
                  "progress_msg": "",
                  "chunk_num": 0,
                  "token_num": 0,
              }
              DocumentService.update_by_id(doc_id, info)

              tenant_id = DocumentService.get_tenant_id(doc_id)
              if not tenant_id:
                  return get_data_error_result(retmsg="Tenant not found!")

              TaskService.filter_delete([Task.doc_id == doc_id])
              e, stored_doc = DocumentService.get_by_id(doc_id)
              if not e:
                  # This result used to be ignored, so a missing document
                  # failed on None.to_dict().
                  return get_data_error_result(retmsg="Document not found!")
              task_doc = stored_doc.to_dict()
              task_doc["tenant_id"] = tenant_id
              bucket, name = File2DocumentService.get_minio_address(doc_id=task_doc["id"])
              queue_tasks(task_doc, bucket, name)
          except Exception as e:
              return server_error_response(e)

      return get_json_result(data=doc_result.to_json())
  270. return get_json_result(data=doc_result.to_json())