Вы не можете выбрать более 25 тем. Темы должны начинаться с буквы или цифры, могут содержать дефисы (-) и должны содержать не более 35 символов.

dialog_app.py 7.5KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192
  1. #
  2. # Copyright 2024 The InfiniFlow Authors. All Rights Reserved.
  3. #
  4. # Licensed under the Apache License, Version 2.0 (the "License");
  5. # you may not use this file except in compliance with the License.
  6. # You may obtain a copy of the License at
  7. #
  8. # http://www.apache.org/licenses/LICENSE-2.0
  9. #
  10. # Unless required by applicable law or agreed to in writing, software
  11. # distributed under the License is distributed on an "AS IS" BASIS,
  12. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. # See the License for the specific language governing permissions and
  14. # limitations under the License.
  15. #
  16. from flask import request
  17. from flask_login import login_required, current_user
  18. from api.db.services.dialog_service import DialogService
  19. from api.db import StatusEnum
  20. from api.db.services.llm_service import TenantLLMService
  21. from api.db.services.knowledgebase_service import KnowledgebaseService
  22. from api.db.services.user_service import TenantService, UserTenantService
  23. from api import settings
  24. from api.utils.api_utils import server_error_response, get_data_error_result, validate_request
  25. from api.utils import get_uuid
  26. from api.utils.api_utils import get_json_result
  27. @manager.route('/set', methods=['POST']) # noqa: F821
  28. @login_required
  29. def set_dialog():
  30. req = request.json
  31. dialog_id = req.get("dialog_id")
  32. name = req.get("name", "New Dialog")
  33. description = req.get("description", "A helpful dialog")
  34. icon = req.get("icon", "")
  35. top_n = req.get("top_n", 6)
  36. top_k = req.get("top_k", 1024)
  37. rerank_id = req.get("rerank_id", "")
  38. if not rerank_id:
  39. req["rerank_id"] = ""
  40. similarity_threshold = req.get("similarity_threshold", 0.1)
  41. vector_similarity_weight = req.get("vector_similarity_weight", 0.3)
  42. llm_setting = req.get("llm_setting", {})
  43. default_prompt_with_dataset = {
  44. "system": """你是一个智能助手,请总结知识库的内容来回答问题,请列举知识库中的数据详细回答。当所有知识库内容都与问题无关时,你的回答必须包括“知识库中未找到您要的答案!”这句话。回答需要考虑聊天历史。
  45. 以下是知识库:
  46. {knowledge}
  47. 以上是知识库。""",
  48. "prologue": "您好,我是您的助手小樱,长得可爱又善良,can I help you?",
  49. "parameters": [
  50. {"key": "knowledge", "optional": False}
  51. ],
  52. "empty_response": "Sorry! 知识库中未找到相关内容!"
  53. }
  54. default_prompt_no_dataset = {
  55. "system": """You are a helpful assistant.""",
  56. "prologue": "您好,我是您的助手小樱,长得可爱又善良,can I help you?",
  57. "parameters": [
  58. ],
  59. "empty_response": ""
  60. }
  61. prompt_config = req.get("prompt_config", default_prompt_with_dataset)
  62. if not prompt_config["system"]:
  63. prompt_config["system"] = default_prompt_with_dataset["system"]
  64. if not req.get("kb_ids", []):
  65. if prompt_config['system'] == default_prompt_with_dataset['system'] or "{knowledge}" in prompt_config['system']:
  66. prompt_config = default_prompt_no_dataset
  67. for p in prompt_config["parameters"]:
  68. if p["optional"]:
  69. continue
  70. if prompt_config["system"].find("{%s}" % p["key"]) < 0:
  71. return get_data_error_result(
  72. message="Parameter '{}' is not used".format(p["key"]))
  73. try:
  74. e, tenant = TenantService.get_by_id(current_user.id)
  75. if not e:
  76. return get_data_error_result(message="Tenant not found!")
  77. kbs = KnowledgebaseService.get_by_ids(req.get("kb_ids", []))
  78. embd_ids = [TenantLLMService.split_model_name_and_factory(kb.embd_id)[0] for kb in kbs] # remove vendor suffix for comparison
  79. embd_count = len(set(embd_ids))
  80. if embd_count > 1:
  81. return get_data_error_result(message=f'Datasets use different embedding models: {[kb.embd_id for kb in kbs]}"')
  82. llm_id = req.get("llm_id", tenant.llm_id)
  83. if not dialog_id:
  84. dia = {
  85. "id": get_uuid(),
  86. "tenant_id": current_user.id,
  87. "name": name,
  88. "kb_ids": req.get("kb_ids", []),
  89. "description": description,
  90. "llm_id": llm_id,
  91. "llm_setting": llm_setting,
  92. "prompt_config": prompt_config,
  93. "top_n": top_n,
  94. "top_k": top_k,
  95. "rerank_id": rerank_id,
  96. "similarity_threshold": similarity_threshold,
  97. "vector_similarity_weight": vector_similarity_weight,
  98. "icon": icon
  99. }
  100. if not DialogService.save(**dia):
  101. return get_data_error_result(message="Fail to new a dialog!")
  102. return get_json_result(data=dia)
  103. else:
  104. del req["dialog_id"]
  105. if "kb_names" in req:
  106. del req["kb_names"]
  107. if not DialogService.update_by_id(dialog_id, req):
  108. return get_data_error_result(message="Dialog not found!")
  109. e, dia = DialogService.get_by_id(dialog_id)
  110. if not e:
  111. return get_data_error_result(message="Fail to update a dialog!")
  112. dia = dia.to_dict()
  113. dia.update(req)
  114. dia["kb_ids"], dia["kb_names"] = get_kb_names(dia["kb_ids"])
  115. return get_json_result(data=dia)
  116. except Exception as e:
  117. return server_error_response(e)
  118. @manager.route('/get', methods=['GET']) # noqa: F821
  119. @login_required
  120. def get():
  121. dialog_id = request.args["dialog_id"]
  122. try:
  123. e, dia = DialogService.get_by_id(dialog_id)
  124. if not e:
  125. return get_data_error_result(message="Dialog not found!")
  126. dia = dia.to_dict()
  127. dia["kb_ids"], dia["kb_names"] = get_kb_names(dia["kb_ids"])
  128. return get_json_result(data=dia)
  129. except Exception as e:
  130. return server_error_response(e)
  131. def get_kb_names(kb_ids):
  132. ids, nms = [], []
  133. for kid in kb_ids:
  134. e, kb = KnowledgebaseService.get_by_id(kid)
  135. if not e or kb.status != StatusEnum.VALID.value:
  136. continue
  137. ids.append(kid)
  138. nms.append(kb.name)
  139. return ids, nms
  140. @manager.route('/list', methods=['GET']) # noqa: F821
  141. @login_required
  142. def list_dialogs():
  143. try:
  144. diags = DialogService.query(
  145. tenant_id=current_user.id,
  146. status=StatusEnum.VALID.value,
  147. reverse=True,
  148. order_by=DialogService.model.create_time)
  149. diags = [d.to_dict() for d in diags]
  150. for d in diags:
  151. d["kb_ids"], d["kb_names"] = get_kb_names(d["kb_ids"])
  152. return get_json_result(data=diags)
  153. except Exception as e:
  154. return server_error_response(e)
  155. @manager.route('/rm', methods=['POST']) # noqa: F821
  156. @login_required
  157. @validate_request("dialog_ids")
  158. def rm():
  159. req = request.json
  160. dialog_list=[]
  161. tenants = UserTenantService.query(user_id=current_user.id)
  162. try:
  163. for id in req["dialog_ids"]:
  164. for tenant in tenants:
  165. if DialogService.query(tenant_id=tenant.tenant_id, id=id):
  166. break
  167. else:
  168. return get_json_result(
  169. data=False, message='Only owner of dialog authorized for this operation.',
  170. code=settings.RetCode.OPERATING_ERROR)
  171. dialog_list.append({"id": id,"status":StatusEnum.INVALID.value})
  172. DialogService.update_many_by_id(dialog_list)
  173. return get_json_result(data=True)
  174. except Exception as e:
  175. return server_error_response(e)