選択できるのは25トピックまでです。 トピックは、先頭が英数字で、英数字とダッシュ('-')を使用した35文字以内のものにしてください。

conversation_app.py 9.3KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258
  1. #
  2. # Copyright 2024 The InfiniFlow Authors. All Rights Reserved.
  3. #
  4. # Licensed under the Apache License, Version 2.0 (the "License");
  5. # you may not use this file except in compliance with the License.
  6. # You may obtain a copy of the License at
  7. #
  8. # http://www.apache.org/licenses/LICENSE-2.0
  9. #
  10. # Unless required by applicable law or agreed to in writing, software
  11. # distributed under the License is distributed on an "AS IS" BASIS,
  12. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. # See the License for the specific language governing permissions and
  14. # limitations under the License.
  15. #
  16. from copy import deepcopy
  17. from flask import request, Response
  18. from flask_login import login_required,current_user
  19. from api.db.services.dialog_service import DialogService, ConversationService, chat
  20. from api.db.services.llm_service import LLMBundle, TenantService
  21. from api.db import LLMType
  22. from api.utils.api_utils import server_error_response, get_data_error_result, validate_request
  23. from api.utils import get_uuid
  24. from api.utils.api_utils import get_json_result
  25. import json
  26. @manager.route('/set', methods=['POST'])
  27. @login_required
  28. def set_conversation():
  29. req = request.json
  30. conv_id = req.get("conversation_id")
  31. if conv_id:
  32. del req["conversation_id"]
  33. try:
  34. if not ConversationService.update_by_id(conv_id, req):
  35. return get_data_error_result(retmsg="Conversation not found!")
  36. e, conv = ConversationService.get_by_id(conv_id)
  37. if not e:
  38. return get_data_error_result(
  39. retmsg="Fail to update a conversation!")
  40. conv = conv.to_dict()
  41. return get_json_result(data=conv)
  42. except Exception as e:
  43. return server_error_response(e)
  44. try:
  45. e, dia = DialogService.get_by_id(req["dialog_id"])
  46. if not e:
  47. return get_data_error_result(retmsg="Dialog not found")
  48. conv = {
  49. "id": get_uuid(),
  50. "dialog_id": req["dialog_id"],
  51. "name": req.get("name", "New conversation"),
  52. "message": [{"role": "assistant", "content": dia.prompt_config["prologue"]}]
  53. }
  54. ConversationService.save(**conv)
  55. e, conv = ConversationService.get_by_id(conv["id"])
  56. if not e:
  57. return get_data_error_result(retmsg="Fail to new a conversation!")
  58. conv = conv.to_dict()
  59. return get_json_result(data=conv)
  60. except Exception as e:
  61. return server_error_response(e)
  62. @manager.route('/get', methods=['GET'])
  63. @login_required
  64. def get():
  65. conv_id = request.args["conversation_id"]
  66. try:
  67. e, conv = ConversationService.get_by_id(conv_id)
  68. if not e:
  69. return get_data_error_result(retmsg="Conversation not found!")
  70. conv = conv.to_dict()
  71. return get_json_result(data=conv)
  72. except Exception as e:
  73. return server_error_response(e)
  74. @manager.route('/rm', methods=['POST'])
  75. @login_required
  76. def rm():
  77. conv_ids = request.json["conversation_ids"]
  78. try:
  79. for cid in conv_ids:
  80. ConversationService.delete_by_id(cid)
  81. return get_json_result(data=True)
  82. except Exception as e:
  83. return server_error_response(e)
  84. @manager.route('/list', methods=['GET'])
  85. @login_required
  86. def list_convsersation():
  87. dialog_id = request.args["dialog_id"]
  88. try:
  89. convs = ConversationService.query(
  90. dialog_id=dialog_id,
  91. order_by=ConversationService.model.create_time,
  92. reverse=True)
  93. convs = [d.to_dict() for d in convs]
  94. return get_json_result(data=convs)
  95. except Exception as e:
  96. return server_error_response(e)
  97. @manager.route('/completion', methods=['POST'])
  98. @login_required
  99. #@validate_request("conversation_id", "messages")
  100. def completion():
  101. req = request.json
  102. #req = {"conversation_id": "9aaaca4c11d311efa461fa163e197198", "messages": [
  103. # {"role": "user", "content": "上海有吗?"}
  104. #]}
  105. msg = []
  106. for m in req["messages"]:
  107. if m["role"] == "system":
  108. continue
  109. if m["role"] == "assistant" and not msg:
  110. continue
  111. msg.append(m)
  112. message_id = msg[-1].get("id")
  113. try:
  114. e, conv = ConversationService.get_by_id(req["conversation_id"])
  115. if not e:
  116. return get_data_error_result(retmsg="Conversation not found!")
  117. conv.message.append(deepcopy(msg[-1]))
  118. e, dia = DialogService.get_by_id(conv.dialog_id)
  119. if not e:
  120. return get_data_error_result(retmsg="Dialog not found!")
  121. del req["conversation_id"]
  122. del req["messages"]
  123. if not conv.reference:
  124. conv.reference = []
  125. conv.message.append({"role": "assistant", "content": "", "id": message_id})
  126. conv.reference.append({"chunks": [], "doc_aggs": []})
  127. def fillin_conv(ans):
  128. nonlocal conv, message_id
  129. if not conv.reference:
  130. conv.reference.append(ans["reference"])
  131. else: conv.reference[-1] = ans["reference"]
  132. conv.message[-1] = {"role": "assistant", "content": ans["answer"],
  133. "id": message_id, "prompt": ans.get("prompt", "")}
  134. def stream():
  135. nonlocal dia, msg, req, conv
  136. try:
  137. for ans in chat(dia, msg, True, **req):
  138. fillin_conv(ans)
  139. yield "data:"+json.dumps({"retcode": 0, "retmsg": "", "data": ans}, ensure_ascii=False) + "\n\n"
  140. ConversationService.update_by_id(conv.id, conv.to_dict())
  141. except Exception as e:
  142. yield "data:" + json.dumps({"retcode": 500, "retmsg": str(e),
  143. "data": {"answer": "**ERROR**: "+str(e), "reference": []}},
  144. ensure_ascii=False) + "\n\n"
  145. yield "data:"+json.dumps({"retcode": 0, "retmsg": "", "data": True}, ensure_ascii=False) + "\n\n"
  146. if req.get("stream", True):
  147. resp = Response(stream(), mimetype="text/event-stream")
  148. resp.headers.add_header("Cache-control", "no-cache")
  149. resp.headers.add_header("Connection", "keep-alive")
  150. resp.headers.add_header("X-Accel-Buffering", "no")
  151. resp.headers.add_header("Content-Type", "text/event-stream; charset=utf-8")
  152. return resp
  153. else:
  154. answer = None
  155. for ans in chat(dia, msg, **req):
  156. answer = ans
  157. fillin_conv(ans)
  158. ConversationService.update_by_id(conv.id, conv.to_dict())
  159. break
  160. return get_json_result(data=answer)
  161. except Exception as e:
  162. return server_error_response(e)
  163. @manager.route('/tts', methods=['POST'])
  164. @login_required
  165. def tts():
  166. req = request.json
  167. text = req["text"]
  168. tenants = TenantService.get_by_user_id(current_user.id)
  169. if not tenants:
  170. return get_data_error_result(retmsg="Tenant not found!")
  171. tts_id = tenants[0]["tts_id"]
  172. if not tts_id:
  173. return get_data_error_result(retmsg="No default TTS model is set")
  174. tts_mdl = LLMBundle(tenants[0]["tenant_id"], LLMType.TTS, tts_id)
  175. def stream_audio():
  176. try:
  177. for chunk in tts_mdl(text):
  178. yield chunk
  179. except Exception as e:
  180. yield "data:" + json.dumps({"retcode": 500, "retmsg": str(e),
  181. "data": {"answer": "**ERROR**: "+str(e)}},
  182. ensure_ascii=False).encode('utf-8')
  183. resp = Response(stream_audio(), mimetype="audio/mpeg")
  184. resp.headers.add_header("Cache-Control", "no-cache")
  185. resp.headers.add_header("Connection", "keep-alive")
  186. resp.headers.add_header("X-Accel-Buffering", "no")
  187. return resp
  188. @manager.route('/delete_msg', methods=['POST'])
  189. @login_required
  190. @validate_request("conversation_id", "message_id")
  191. def delete_msg():
  192. req = request.json
  193. e, conv = ConversationService.get_by_id(req["conversation_id"])
  194. if not e:
  195. return get_data_error_result(retmsg="Conversation not found!")
  196. conv = conv.to_dict()
  197. for i, msg in enumerate(conv["message"]):
  198. if req["message_id"] != msg.get("id", ""):
  199. continue
  200. assert conv["message"][i+1]["id"] == req["message_id"]
  201. conv["message"].pop(i)
  202. conv["message"].pop(i)
  203. conv["reference"].pop(i)
  204. break
  205. ConversationService.update_by_id(conv["id"], conv)
  206. return get_json_result(data=conv)
  207. @manager.route('/thumbup', methods=['POST'])
  208. @login_required
  209. @validate_request("conversation_id", "message_id")
  210. def thumbup():
  211. req = request.json
  212. e, conv = ConversationService.get_by_id(req["conversation_id"])
  213. if not e:
  214. return get_data_error_result(retmsg="Conversation not found!")
  215. up_down = req.get("set")
  216. feedback = req.get("feedback", "")
  217. conv = conv.to_dict()
  218. for i, msg in enumerate(conv["message"]):
  219. if req["message_id"] == msg.get("id", "") and msg.get("role", "") == "assistant":
  220. if up_down:
  221. msg["thumbup"] = True
  222. if "feedback" in msg: del msg["feedback"]
  223. else:
  224. msg["thumbup"] = False
  225. if feedback: msg["feedback"] = feedback
  226. break
  227. ConversationService.update_by_id(conv["id"], conv)
  228. return get_json_result(data=conv)