You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

conversation_app.py 15KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417
  1. #
  2. # Copyright 2024 The InfiniFlow Authors. All Rights Reserved.
  3. #
  4. # Licensed under the Apache License, Version 2.0 (the "License");
  5. # you may not use this file except in compliance with the License.
  6. # You may obtain a copy of the License at
  7. #
  8. # http://www.apache.org/licenses/LICENSE-2.0
  9. #
  10. # Unless required by applicable law or agreed to in writing, software
  11. # distributed under the License is distributed on an "AS IS" BASIS,
  12. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. # See the License for the specific language governing permissions and
  14. # limitations under the License.
  15. #
  16. import json
  17. import re
  18. import traceback
  19. from copy import deepcopy
  20. from flask import Response, request
  21. from flask_login import current_user, login_required
  22. from api import settings
  23. from api.db import LLMType
  24. from api.db.db_models import APIToken
  25. from api.db.services.conversation_service import ConversationService, structure_answer
  26. from api.db.services.dialog_service import DialogService, ask, chat, gen_mindmap
  27. from api.db.services.llm_service import LLMBundle
  28. from api.db.services.search_service import SearchService
  29. from api.db.services.tenant_llm_service import TenantLLMService
  30. from api.db.services.user_service import TenantService, UserTenantService
  31. from api.utils.api_utils import get_data_error_result, get_json_result, server_error_response, validate_request
  32. from rag.prompts.prompt_template import load_prompt
  33. from rag.prompts.prompts import chunks_format
  @manager.route("/set", methods=["POST"])  # noqa: F821
  @login_required
  def set_conversation():
      """Create a new conversation or update an existing one.

      Reads the JSON body of the request. When ``is_new`` is falsy (or absent)
      the remaining fields are applied to the conversation identified by
      ``conversation_id``; otherwise a new conversation is saved for the dialog
      given by ``dialog_id``, seeded with the dialog's prologue as the first
      assistant message.

      Returns:
          A JSON result holding the conversation as a dict, a data-error result
          when the conversation/dialog cannot be found, or a server-error
          response when an exception is raised while talking to the services.
      """
      req = request.json
      conv_id = req.get("conversation_id")
      # pop() rather than del: a payload that omits "is_new" must not raise
      # KeyError before any error handling is in place.
      is_new = req.pop("is_new", None)
      name = req.get("name", "New conversation")
      req["user_id"] = current_user.id

      if len(name) > 255:
          name = name[0:255]

      if not is_new:
          # The id addresses the row; it is not one of the fields to update.
          req.pop("conversation_id", None)
          if "name" in req:
              # Apply the same 255-character cap on update as on creation.
              req["name"] = name
          try:
              if not ConversationService.update_by_id(conv_id, req):
                  return get_data_error_result(message="Conversation not found!")
              e, conv = ConversationService.get_by_id(conv_id)
              if not e:
                  return get_data_error_result(message="Fail to update a conversation!")
              conv = conv.to_dict()
              return get_json_result(data=conv)
          except Exception as e:
              return server_error_response(e)

      try:
          e, dia = DialogService.get_by_id(req["dialog_id"])
          if not e:
              return get_data_error_result(message="Dialog not found")
          conv = {
              "id": conv_id,
              "dialog_id": req["dialog_id"],
              "name": name,
              "message": [{"role": "assistant", "content": dia.prompt_config["prologue"]}],
              "user_id": current_user.id,
              "reference": [],
          }
          ConversationService.save(**conv)
          return get_json_result(data=conv)
      except Exception as e:
          return server_error_response(e)
  @manager.route("/get", methods=["GET"])  # noqa: F821
  @login_required
  def get():
      """Return one conversation, enriched with the icon of its dialog.

      The conversation is looked up by the ``conversation_id`` query argument.
      Access is granted only when one of the current user's tenants has a
      dialog matching the conversation's ``dialog_id``; that dialog's ``icon``
      is returned under the ``avatar`` key.
      """
      conv_id = request.args["conversation_id"]
      try:
          found, conversation = ConversationService.get_by_id(conv_id)
          if not found:
              return get_data_error_result(message="Conversation not found!")

          memberships = UserTenantService.query(user_id=current_user.id)
          avatar = None
          authorized = False
          for membership in memberships:
              matches = DialogService.query(tenant_id=membership.tenant_id, id=conversation.dialog_id)
              if not matches or len(matches) == 0:
                  continue
              avatar = matches[0].icon
              authorized = True
              break
          if not authorized:
              return get_json_result(data=False, message="Only owner of conversation authorized for this operation.", code=settings.RetCode.OPERATING_ERROR)

          # List-typed reference entries are left untouched; every other entry
          # gets its "chunks" replaced by the formatted version.
          for ref in conversation.reference:
              if not isinstance(ref, list):
                  ref["chunks"] = chunks_format(ref)

          payload = conversation.to_dict()
          payload["avatar"] = avatar
          return get_json_result(data=payload)
      except Exception as exc:
          return server_error_response(exc)
  @manager.route("/getsse/<dialog_id>", methods=["GET"])  # type: ignore # noqa: F821
  def getsse(dialog_id):
      """Return a dialog as a dict for a caller authenticated by a beta API token.

      The ``Authorization`` header must consist of exactly two
      whitespace-separated parts; the second part is looked up as an
      ``APIToken`` ``beta`` value. On success the dialog's ``icon`` field is
      exposed as ``avatar``.

      Args:
          dialog_id: Identifier of the dialog, taken from the URL path.
      """
      # A missing header yields None; fall back to "" so the request is
      # rejected with a data error instead of raising AttributeError.
      auth_parts = (request.headers.get("Authorization") or "").split()
      if len(auth_parts) != 2:
          return get_data_error_result(message='Authorization is not valid!"')
      token = auth_parts[1]
      objs = APIToken.query(beta=token)
      if not objs:
          return get_data_error_result(message='Authentication error: API key is invalid!"')
      # NOTE(review): the token is only checked for existence here; whether it
      # should also be tied to this dialog_id cannot be told from this file.
      try:
          e, conv = DialogService.get_by_id(dialog_id)
          if not e:
              return get_data_error_result(message="Dialog not found!")
          conv = conv.to_dict()
          conv["avatar"] = conv["icon"]
          del conv["icon"]
          return get_json_result(data=conv)
      except Exception as e:
          return server_error_response(e)
  @manager.route("/rm", methods=["POST"])  # noqa: F821
  @login_required
  def rm():
      """Delete the conversations listed in ``conversation_ids`` of the JSON body.

      Each conversation is deleted only if one of the current user's tenants
      has a dialog matching the conversation's ``dialog_id``. Processing stops
      at the first id that is missing or not authorized; conversations handled
      before that point have already been deleted.
      """
      conv_ids = request.json["conversation_ids"]
      try:
          # The user's tenants do not depend on the conversation being
          # processed, so fetch them once instead of once per id.
          tenant_ids = [tenant.tenant_id for tenant in UserTenantService.query(user_id=current_user.id)]
          for cid in conv_ids:
              exist, conv = ConversationService.get_by_id(cid)
              if not exist:
                  return get_data_error_result(message="Conversation not found!")
              for tenant_id in tenant_ids:
                  if DialogService.query(tenant_id=tenant_id, id=conv.dialog_id):
                      break
              else:
                  return get_json_result(data=False, message="Only owner of conversation authorized for this operation.", code=settings.RetCode.OPERATING_ERROR)
              ConversationService.delete_by_id(cid)
          return get_json_result(data=True)
      except Exception as e:
          return server_error_response(e)
  @manager.route("/list", methods=["GET"])  # noqa: F821
  @login_required
  def list_conversation():
      """List the conversations of a dialog, ordered by creation time (reversed).

      The dialog is given by the ``dialog_id`` query argument and must be
      found under the tenant whose id equals the current user's id.
      """
      dialog_id = request.args["dialog_id"]
      try:
          owned = DialogService.query(tenant_id=current_user.id, id=dialog_id)
          if not owned:
              return get_json_result(data=False, message="Only owner of dialog authorized for this operation.", code=settings.RetCode.OPERATING_ERROR)
          records = ConversationService.query(dialog_id=dialog_id, order_by=ConversationService.model.create_time, reverse=True)
          return get_json_result(data=[record.to_dict() for record in records])
      except Exception as exc:
          return server_error_response(exc)
  @manager.route("/completion", methods=["POST"])  # noqa: F821
  @login_required
  @validate_request("conversation_id", "messages")
  def completion():
      """Run a chat completion for a conversation, streamed or as one answer.

      System messages and any assistant messages that precede the first kept
      message are dropped before the history is passed to ``chat``. When the
      request names an ``llm_id``, that model (and the sampling settings found
      in the request) temporarily overrides the dialog's model and the
      conversation is not persisted afterwards.

      Returns:
          A ``text/event-stream`` response when ``stream`` is truthy or absent,
          otherwise a JSON result with the first structured answer. Lookup
          failures produce a data-error result; exceptions raised while
          preparing the call produce a server-error response.
      """
      req = request.json
      msg = []
      for m in req["messages"]:
          if m["role"] == "system":
              continue
          if m["role"] == "assistant" and not msg:
              continue
          msg.append(m)
      if not msg:
          # Without this guard msg[-1] below raises IndexError outside the try
          # block when the history holds only system/leading assistant turns.
          return get_data_error_result(message="No user message found!")
      message_id = msg[-1].get("id")
      chat_model_id = req.pop("llm_id", "")

      chat_model_config = {}
      for model_config in [
          "temperature",
          "top_p",
          "frequency_penalty",
          "presence_penalty",
          "max_tokens",
      ]:
          config = req.get(model_config)
          # NOTE(review): a falsy value such as an explicit 0 is skipped here;
          # confirm whether that is intended before tightening to "is not None".
          if config:
              chat_model_config[model_config] = config

      try:
          e, conv = ConversationService.get_by_id(req["conversation_id"])
          if not e:
              return get_data_error_result(message="Conversation not found!")
          conv.message = deepcopy(req["messages"])
          e, dia = DialogService.get_by_id(conv.dialog_id)
          if not e:
              return get_data_error_result(message="Dialog not found!")
          # Everything left in req is forwarded to chat() as keyword arguments,
          # so the fields consumed here must be removed first.
          del req["conversation_id"]
          del req["messages"]

          if not conv.reference:
              conv.reference = []
          conv.reference = [r for r in conv.reference if r]
          # Placeholder entry for the answer that is about to be produced.
          conv.reference.append({"chunks": [], "doc_aggs": []})

          if chat_model_id:
              if not TenantLLMService.get_api_key(tenant_id=dia.tenant_id, model_name=chat_model_id):
                  return get_data_error_result(message=f"Cannot use specified model {chat_model_id}.")
              dia.llm_id = chat_model_id
              dia.llm_setting = chat_model_config

          # A caller-supplied model marks the request as "embedded": the
          # conversation is not written back in that case.
          is_embedded = bool(chat_model_id)

          def stream():
              try:
                  for ans in chat(dia, msg, True, **req):
                      ans = structure_answer(conv, ans, message_id, conv.id)
                      yield "data:" + json.dumps({"code": 0, "message": "", "data": ans}, ensure_ascii=False) + "\n\n"
                  if not is_embedded:
                      ConversationService.update_by_id(conv.id, conv.to_dict())
              except Exception as e:
                  traceback.print_exc()
                  yield "data:" + json.dumps({"code": 500, "message": str(e), "data": {"answer": "**ERROR**: " + str(e), "reference": []}}, ensure_ascii=False) + "\n\n"
              # Final event signalling the end of the stream.
              yield "data:" + json.dumps({"code": 0, "message": "", "data": True}, ensure_ascii=False) + "\n\n"

          if req.get("stream", True):
              resp = Response(stream(), mimetype="text/event-stream")
              resp.headers.add_header("Cache-control", "no-cache")
              resp.headers.add_header("Connection", "keep-alive")
              resp.headers.add_header("X-Accel-Buffering", "no")
              resp.headers.add_header("Content-Type", "text/event-stream; charset=utf-8")
              return resp
          else:
              answer = None
              # Only the first item produced by chat() is used.
              for ans in chat(dia, msg, **req):
                  answer = structure_answer(conv, ans, message_id, conv.id)
                  if not is_embedded:
                      ConversationService.update_by_id(conv.id, conv.to_dict())
                  break
              return get_json_result(data=answer)
      except Exception as e:
          return server_error_response(e)
  @manager.route("/tts", methods=["POST"])  # noqa: F821
  @login_required
  def tts():
      """Stream synthesized speech for the ``text`` field of the JSON body.

      The text is split on a set of punctuation and line-break characters and
      each non-blank segment is passed to the TTS model configured as
      ``tts_id`` on the first tenant record returned for the current user.
      The chunks produced by the model are streamed back as ``audio/mpeg``.
      """
      req = request.json
      text = req["text"]

      tenants = TenantService.get_info_by(current_user.id)
      if not tenants:
          return get_data_error_result(message="Tenant not found!")

      tts_id = tenants[0]["tts_id"]
      if not tts_id:
          return get_data_error_result(message="No default TTS model is set")

      tts_mdl = LLMBundle(tenants[0]["tenant_id"], LLMType.TTS, tts_id)

      def stream_audio():
          try:
              for txt in re.split(r"[,。/《》?;:!\n\r:;]+", text):
                  # re.split yields empty strings around leading/trailing
                  # separators; there is nothing to synthesize for those.
                  if not txt.strip():
                      continue
                  for chunk in tts_mdl.tts(txt):
                      yield chunk
          except Exception as e:
              # The error is appended to the byte stream as a JSON payload.
              yield ("data:" + json.dumps({"code": 500, "message": str(e), "data": {"answer": "**ERROR**: " + str(e)}}, ensure_ascii=False)).encode("utf-8")

      resp = Response(stream_audio(), mimetype="audio/mpeg")
      resp.headers.add_header("Cache-Control", "no-cache")
      resp.headers.add_header("Connection", "keep-alive")
      resp.headers.add_header("X-Accel-Buffering", "no")
      return resp
  @manager.route("/delete_msg", methods=["POST"])  # noqa: F821
  @login_required
  @validate_request("conversation_id", "message_id")
  def delete_msg():
      """Delete a message pair (two consecutive messages sharing one id).

      The first message whose ``id`` equals ``message_id`` and the message
      right after it are removed, together with the reference entry at index
      ``max(0, i // 2 - 1)`` where ``i`` is the position of the first message.
      If no message matches, the conversation is saved and returned unchanged.

      Returns:
          A JSON result with the updated conversation dict, a data-error result
          when the conversation is missing or the matched message has no
          partner with the same id, or a server-error response on exceptions.
      """
      req = request.json
      e, conv = ConversationService.get_by_id(req["conversation_id"])
      if not e:
          return get_data_error_result(message="Conversation not found!")

      conv = conv.to_dict()
      target_id = req["message_id"]
      try:
          messages = conv["message"]
          for i, msg in enumerate(messages):
              if target_id != msg.get("id", ""):
                  continue
              # Explicit check instead of assert: asserts are stripped under
              # "python -O" and the old lookup could raise IndexError/KeyError.
              if i + 1 >= len(messages) or messages[i + 1].get("id") != target_id:
                  return get_data_error_result(message="Message pair is incomplete; nothing was deleted.")
              del messages[i : i + 2]
              references = conv.get("reference") or []
              ref_idx = max(0, i // 2 - 1)
              # Skip the pop when there is no reference entry at that index.
              if ref_idx < len(references):
                  references.pop(ref_idx)
              break

          ConversationService.update_by_id(conv["id"], conv)
          return get_json_result(data=conv)
      except Exception as exc:
          return server_error_response(exc)
  @manager.route("/thumbup", methods=["POST"])  # noqa: F821
  @login_required
  @validate_request("conversation_id", "message_id")
  def thumbup():
      """Record a thumbs-up/down on the first matching assistant message.

      A truthy ``thumbup`` marks the message as liked and clears any stored
      ``feedback``; otherwise the message is marked as not liked and a
      non-empty ``feedback`` from the request is stored on it. The conversation
      is saved and returned whether or not a message matched.
      """
      req = request.json
      found, conversation = ConversationService.get_by_id(req["conversation_id"])
      if not found:
          return get_data_error_result(message="Conversation not found!")

      liked = req.get("thumbup")
      comment = req.get("feedback", "")
      conv = conversation.to_dict()

      for entry in conv["message"]:
          is_target = req["message_id"] == entry.get("id", "") and entry.get("role", "") == "assistant"
          if not is_target:
              continue
          if liked:
              entry["thumbup"] = True
              entry.pop("feedback", None)
          else:
              entry["thumbup"] = False
              if comment:
                  entry["feedback"] = comment
          break

      ConversationService.update_by_id(conv["id"], conv)
      return get_json_result(data=conv)
  @manager.route("/ask", methods=["POST"])  # noqa: F821
  @login_required
  @validate_request("question", "kb_ids")
  def ask_about():
      """Stream the answers produced by ``ask`` as server-sent events.

      ``question`` and ``kb_ids`` come from the JSON body. When ``search_id``
      is given and a matching search app is found, its ``search_config`` is
      forwarded to ``ask``. The stream always ends with a ``data: true`` event,
      preceded by an error event if ``ask`` raised.
      """
      req = request.json
      # Read the user id up front; the generator below uses this captured value.
      uid = current_user.id

      search_config = {}
      search_id = req.get("search_id", "")
      if search_id:
          detail = SearchService.get_detail(search_id)
          if detail:
              search_config = detail.get("search_config", {})

      def sse(payload):
          """Serialize one event in the ``data:<json>`` wire format."""
          return "data:" + json.dumps(payload, ensure_ascii=False) + "\n\n"

      def stream():
          try:
              for ans in ask(req["question"], req["kb_ids"], uid, search_config=search_config):
                  yield sse({"code": 0, "message": "", "data": ans})
          except Exception as exc:
              yield sse({"code": 500, "message": str(exc), "data": {"answer": "**ERROR**: " + str(exc), "reference": []}})
          yield sse({"code": 0, "message": "", "data": True})

      resp = Response(stream(), mimetype="text/event-stream")
      for header, value in (
          ("Cache-control", "no-cache"),
          ("Connection", "keep-alive"),
          ("X-Accel-Buffering", "no"),
          ("Content-Type", "text/event-stream; charset=utf-8"),
      ):
          resp.headers.add_header(header, value)
      return resp
  @manager.route("/mindmap", methods=["POST"])  # noqa: F821
  @login_required
  @validate_request("question", "kb_ids")
  def mindmap():
      """Generate a mind map for a question over a set of knowledge bases.

      The knowledge-base ids from the request are merged (deduplicated) with
      the ``kb_ids`` of the search app's ``search_config`` when ``search_id``
      resolves to a search app. The tenant passed to ``gen_mindmap`` is the
      search app's ``tenant_id`` if present, otherwise the current user's id.

      Returns:
          A JSON result with the mind map, or a server-error response when the
          result contains an ``"error"`` key.
      """
      req = request.json
      search_id = req.get("search_id", "")
      # Normalize "no search id" and "search app not found" to an empty dict so
      # the .get() calls below cannot fail on a falsy lookup result.
      search_app = (SearchService.get_detail(search_id) if search_id else None) or {}
      search_config = search_app.get("search_config", {})
      # extend() appends to the list held by search_config (when it has one),
      # so the search_config passed on below sees the merged ids as well.
      kb_ids = search_config.get("kb_ids", [])
      kb_ids.extend(req["kb_ids"])
      kb_ids = list(set(kb_ids))

      mind_map = gen_mindmap(req["question"], kb_ids, search_app.get("tenant_id", current_user.id), search_config)
      if "error" in mind_map:
          return server_error_response(Exception(mind_map["error"]))
      return get_json_result(data=mind_map)
  @manager.route("/related_questions", methods=["POST"])  # noqa: F821
  @login_required
  @validate_request("question")
  def related_questions():
      """Ask the chat model for search terms related to ``question``.

      The model and generation settings come from the search app's
      ``search_config`` (``chat_id`` / ``llm_setting``) when ``search_id``
      resolves to one; otherwise an empty chat id and ``{"temperature": 0.9}``
      are used. Only answer lines of the form ``"<number>. <text>"`` are kept,
      and the numbering prefix is stripped.

      Returns:
          A JSON result whose data is the list of related search terms.
      """
      req = request.json

      search_id = req.get("search_id", "")
      search_config = {}
      if search_id:
          if search_app := SearchService.get_detail(search_id):
              search_config = search_app.get("search_config", {})

      question = req["question"]

      chat_id = search_config.get("chat_id", "")
      chat_mdl = LLMBundle(current_user.id, LLMType.CHAT, chat_id)

      gen_conf = search_config.get("llm_setting", {"temperature": 0.9})
      prompt = load_prompt("related_question")
      # Built with explicit newlines so the text does not depend on how this
      # source file is indented.
      user_content = f"\nKeywords: {question}\nRelated search terms:\n"
      ans = chat_mdl.chat(
          prompt,
          [{"role": "user", "content": user_content}],
          gen_conf,
      )

      # "[0-9]+" rather than "[0-9]": items numbered 10 and above were
      # previously discarded because only a single digit was accepted.
      numbered_prefix = re.compile(r"^[0-9]+\. ")
      return get_json_result(data=[numbered_prefix.sub("", a) for a in ans.split("\n") if numbered_prefix.match(a)])