Você não pode selecionar mais de 25 tópicos Os tópicos devem começar com uma letra ou um número, podem incluir traços ('-') e podem ter até 35 caracteres.

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308
  1. #
  2. # Copyright 2024 The InfiniFlow Authors. All Rights Reserved.
  3. #
  4. # Licensed under the Apache License, Version 2.0 (the "License");
  5. # you may not use this file except in compliance with the License.
  6. # You may obtain a copy of the License at
  7. #
  8. # http://www.apache.org/licenses/LICENSE-2.0
  9. #
  10. # Unless required by applicable law or agreed to in writing, software
  11. # distributed under the License is distributed on an "AS IS" BASIS,
  12. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. # See the License for the specific language governing permissions and
  14. # limitations under the License.
  15. #
  16. import json
  17. import os
  18. import re
  19. from datetime import datetime, timedelta
  20. from flask import request, Response
  21. from flask_login import login_required, current_user
  22. from api.db import FileType, ParserType
  23. from api.db.db_models import APIToken, API4Conversation
  24. from api.db.services import duplicate_name
  25. from api.db.services.api_service import APITokenService, API4ConversationService
  26. from api.db.services.dialog_service import DialogService, chat
  27. from api.db.services.document_service import DocumentService
  28. from api.db.services.knowledgebase_service import KnowledgebaseService
  29. from api.db.services.user_service import UserTenantService
  30. from api.settings import RetCode
  31. from api.utils import get_uuid, current_timestamp, datetime_format
  32. from api.utils.api_utils import server_error_response, get_data_error_result, get_json_result, validate_request
  33. from itsdangerous import URLSafeTimedSerializer
  34. from api.utils.file_utils import filename_type, thumbnail
  35. from rag.utils.minio_conn import MINIO
  36. def generate_confirmation_token(tenent_id):
  37. serializer = URLSafeTimedSerializer(tenent_id)
  38. return "ragflow-" + serializer.dumps(get_uuid(), salt=tenent_id)[2:34]
  39. @manager.route('/new_token', methods=['POST'])
  40. @validate_request("dialog_id")
  41. @login_required
  42. def new_token():
  43. req = request.json
  44. try:
  45. tenants = UserTenantService.query(user_id=current_user.id)
  46. if not tenants:
  47. return get_data_error_result(retmsg="Tenant not found!")
  48. tenant_id = tenants[0].tenant_id
  49. obj = {"tenant_id": tenant_id, "token": generate_confirmation_token(tenant_id),
  50. "dialog_id": req["dialog_id"],
  51. "create_time": current_timestamp(),
  52. "create_date": datetime_format(datetime.now()),
  53. "update_time": None,
  54. "update_date": None
  55. }
  56. if not APITokenService.save(**obj):
  57. return get_data_error_result(retmsg="Fail to new a dialog!")
  58. return get_json_result(data=obj)
  59. except Exception as e:
  60. return server_error_response(e)
  61. @manager.route('/token_list', methods=['GET'])
  62. @login_required
  63. def token_list():
  64. try:
  65. tenants = UserTenantService.query(user_id=current_user.id)
  66. if not tenants:
  67. return get_data_error_result(retmsg="Tenant not found!")
  68. objs = APITokenService.query(tenant_id=tenants[0].tenant_id, dialog_id=request.args["dialog_id"])
  69. return get_json_result(data=[o.to_dict() for o in objs])
  70. except Exception as e:
  71. return server_error_response(e)
  72. @manager.route('/rm', methods=['POST'])
  73. @validate_request("tokens", "tenant_id")
  74. @login_required
  75. def rm():
  76. req = request.json
  77. try:
  78. for token in req["tokens"]:
  79. APITokenService.filter_delete(
  80. [APIToken.tenant_id == req["tenant_id"], APIToken.token == token])
  81. return get_json_result(data=True)
  82. except Exception as e:
  83. return server_error_response(e)
  84. @manager.route('/stats', methods=['GET'])
  85. @login_required
  86. def stats():
  87. try:
  88. tenants = UserTenantService.query(user_id=current_user.id)
  89. if not tenants:
  90. return get_data_error_result(retmsg="Tenant not found!")
  91. objs = API4ConversationService.stats(
  92. tenants[0].tenant_id,
  93. request.args.get(
  94. "from_date",
  95. (datetime.now() -
  96. timedelta(
  97. days=7)).strftime("%Y-%m-%d 24:00:00")),
  98. request.args.get(
  99. "to_date",
  100. datetime.now().strftime("%Y-%m-%d %H:%M:%S")))
  101. res = {
  102. "pv": [(o["dt"], o["pv"]) for o in objs],
  103. "uv": [(o["dt"], o["uv"]) for o in objs],
  104. "speed": [(o["dt"], float(o["tokens"])/(float(o["duration"]+0.1))) for o in objs],
  105. "tokens": [(o["dt"], float(o["tokens"])/1000.) for o in objs],
  106. "round": [(o["dt"], o["round"]) for o in objs],
  107. "thumb_up": [(o["dt"], o["thumb_up"]) for o in objs]
  108. }
  109. return get_json_result(data=res)
  110. except Exception as e:
  111. return server_error_response(e)
  112. @manager.route('/new_conversation', methods=['GET'])
  113. def set_conversation():
  114. token = request.headers.get('Authorization').split()[1]
  115. objs = APIToken.query(token=token)
  116. if not objs:
  117. return get_json_result(
  118. data=False, retmsg='Token is not valid!"', retcode=RetCode.AUTHENTICATION_ERROR)
  119. req = request.json
  120. try:
  121. e, dia = DialogService.get_by_id(objs[0].dialog_id)
  122. if not e:
  123. return get_data_error_result(retmsg="Dialog not found")
  124. conv = {
  125. "id": get_uuid(),
  126. "dialog_id": dia.id,
  127. "user_id": request.args.get("user_id", ""),
  128. "message": [{"role": "assistant", "content": dia.prompt_config["prologue"]}]
  129. }
  130. API4ConversationService.save(**conv)
  131. e, conv = API4ConversationService.get_by_id(conv["id"])
  132. if not e:
  133. return get_data_error_result(retmsg="Fail to new a conversation!")
  134. conv = conv.to_dict()
  135. return get_json_result(data=conv)
  136. except Exception as e:
  137. return server_error_response(e)
  138. @manager.route('/completion', methods=['POST'])
  139. @validate_request("conversation_id", "messages")
  140. def completion():
  141. token = request.headers.get('Authorization').split()[1]
  142. if not APIToken.query(token=token):
  143. return get_json_result(
  144. data=False, retmsg='Token is not valid!"', retcode=RetCode.AUTHENTICATION_ERROR)
  145. req = request.json
  146. e, conv = API4ConversationService.get_by_id(req["conversation_id"])
  147. if not e:
  148. return get_data_error_result(retmsg="Conversation not found!")
  149. if "quote" not in req: req["quote"] = False
  150. msg = []
  151. for m in req["messages"]:
  152. if m["role"] == "system":
  153. continue
  154. if m["role"] == "assistant" and not msg:
  155. continue
  156. msg.append({"role": m["role"], "content": m["content"]})
  157. try:
  158. conv.message.append(msg[-1])
  159. e, dia = DialogService.get_by_id(conv.dialog_id)
  160. if not e:
  161. return get_data_error_result(retmsg="Dialog not found!")
  162. del req["conversation_id"]
  163. del req["messages"]
  164. if not conv.reference:
  165. conv.reference = []
  166. conv.message.append({"role": "assistant", "content": ""})
  167. conv.reference.append({"chunks": [], "doc_aggs": []})
  168. def fillin_conv(ans):
  169. nonlocal conv
  170. if not conv.reference:
  171. conv.reference.append(ans["reference"])
  172. else: conv.reference[-1] = ans["reference"]
  173. conv.message[-1] = {"role": "assistant", "content": ans["answer"]}
  174. def stream():
  175. nonlocal dia, msg, req, conv
  176. try:
  177. for ans in chat(dia, msg, True, **req):
  178. fillin_conv(ans)
  179. yield "data:"+json.dumps({"retcode": 0, "retmsg": "", "data": ans}, ensure_ascii=False) + "\n\n"
  180. API4ConversationService.append_message(conv.id, conv.to_dict())
  181. except Exception as e:
  182. yield "data:" + json.dumps({"retcode": 500, "retmsg": str(e),
  183. "data": {"answer": "**ERROR**: "+str(e), "reference": []}},
  184. ensure_ascii=False) + "\n\n"
  185. yield "data:"+json.dumps({"retcode": 0, "retmsg": "", "data": True}, ensure_ascii=False) + "\n\n"
  186. if req.get("stream", True):
  187. resp = Response(stream(), mimetype="text/event-stream")
  188. resp.headers.add_header("Cache-control", "no-cache")
  189. resp.headers.add_header("Connection", "keep-alive")
  190. resp.headers.add_header("X-Accel-Buffering", "no")
  191. resp.headers.add_header("Content-Type", "text/event-stream; charset=utf-8")
  192. return resp
  193. else:
  194. ans = chat(dia, msg, False, **req)
  195. fillin_conv(ans)
  196. API4ConversationService.append_message(conv.id, conv.to_dict())
  197. return get_json_result(data=ans)
  198. except Exception as e:
  199. return server_error_response(e)
  200. @manager.route('/conversation/<conversation_id>', methods=['GET'])
  201. # @login_required
  202. def get(conversation_id):
  203. try:
  204. e, conv = API4ConversationService.get_by_id(conversation_id)
  205. if not e:
  206. return get_data_error_result(retmsg="Conversation not found!")
  207. return get_json_result(data=conv.to_dict())
  208. except Exception as e:
  209. return server_error_response(e)
  210. @manager.route('/document/upload', methods=['POST'])
  211. @validate_request("kb_name")
  212. def upload():
  213. token = request.headers.get('Authorization').split()[1]
  214. objs = APIToken.query(token=token)
  215. if not objs:
  216. return get_json_result(
  217. data=False, retmsg='Token is not valid!"', retcode=RetCode.AUTHENTICATION_ERROR)
  218. kb_name = request.form.get("kb_name").strip()
  219. tenant_id = objs[0].tenant_id
  220. try:
  221. e, kb = KnowledgebaseService.get_by_name(kb_name, tenant_id)
  222. if not e:
  223. return get_data_error_result(
  224. retmsg="Can't find this knowledgebase!")
  225. kb_id = kb.id
  226. except Exception as e:
  227. return server_error_response(e)
  228. if 'file' not in request.files:
  229. return get_json_result(
  230. data=False, retmsg='No file part!', retcode=RetCode.ARGUMENT_ERROR)
  231. file = request.files['file']
  232. if file.filename == '':
  233. return get_json_result(
  234. data=False, retmsg='No file selected!', retcode=RetCode.ARGUMENT_ERROR)
  235. try:
  236. if DocumentService.get_doc_count(kb.tenant_id) >= int(os.environ.get('MAX_FILE_NUM_PER_USER', 8192)):
  237. return get_data_error_result(
  238. retmsg="Exceed the maximum file number of a free user!")
  239. filename = duplicate_name(
  240. DocumentService.query,
  241. name=file.filename,
  242. kb_id=kb_id)
  243. filetype = filename_type(filename)
  244. if not filetype:
  245. return get_data_error_result(
  246. retmsg="This type of file has not been supported yet!")
  247. location = filename
  248. while MINIO.obj_exist(kb_id, location):
  249. location += "_"
  250. blob = request.files['file'].read()
  251. MINIO.put(kb_id, location, blob)
  252. doc = {
  253. "id": get_uuid(),
  254. "kb_id": kb.id,
  255. "parser_id": kb.parser_id,
  256. "parser_config": kb.parser_config,
  257. "created_by": kb.tenant_id,
  258. "type": filetype,
  259. "name": filename,
  260. "location": location,
  261. "size": len(blob),
  262. "thumbnail": thumbnail(filename, blob)
  263. }
  264. if doc["type"] == FileType.VISUAL:
  265. doc["parser_id"] = ParserType.PICTURE.value
  266. if re.search(r"\.(ppt|pptx|pages)$", filename):
  267. doc["parser_id"] = ParserType.PRESENTATION.value
  268. doc = DocumentService.insert(doc)
  269. return get_json_result(data=doc.to_json())
  270. except Exception as e:
  271. return server_error_response(e)