| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523 | 
							- #
 - #  Copyright 2024 The InfiniFlow Authors. All Rights Reserved.
 - #
 - #  Licensed under the Apache License, Version 2.0 (the "License");
 - #  you may not use this file except in compliance with the License.
 - #  You may obtain a copy of the License at
 - #
 - #      http://www.apache.org/licenses/LICENSE-2.0
 - #
 - #  Unless required by applicable law or agreed to in writing, software
 - #  distributed under the License is distributed on an "AS IS" BASIS,
 - #  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 - #  See the License for the specific language governing permissions and
 - #  limitations under the License.
 - #
 - import re
 - import json
 - from functools import partial
 - from uuid import uuid4
 - from api.db import LLMType
 - from flask import request, Response
 - from api.db.services.dialog_service import ask
 - from agent.canvas import Canvas
 - from api.db import StatusEnum
 - from api.db.db_models import API4Conversation
 - from api.db.services.api_service import API4ConversationService
 - from api.db.services.canvas_service import UserCanvasService
 - from api.db.services.dialog_service import DialogService, ConversationService, chat
 - from api.db.services.knowledgebase_service import KnowledgebaseService
 - from api.utils import get_uuid
 - from api.utils.api_utils import get_error_data_result
 - from api.utils.api_utils import get_result, token_required
 - from api.db.services.llm_service import LLMBundle
 - 
 - 
 - @manager.route('/chats/<chat_id>/sessions', methods=['POST'])
 - @token_required
 - def create(tenant_id,chat_id):
 -     req = request.json
 -     req["dialog_id"] = chat_id
 -     dia = DialogService.query(tenant_id=tenant_id, id=req["dialog_id"], status=StatusEnum.VALID.value)
 -     if not dia:
 -         return get_error_data_result(message="You do not own the assistant.")
 -     conv = {
 -         "id": get_uuid(),
 -         "dialog_id": req["dialog_id"],
 -         "name": req.get("name", "New session"),
 -         "message": [{"role": "assistant", "content": "Hi! I am your assistant,can I help you?"}]
 -     }
 -     if not conv.get("name"):
 -         return get_error_data_result(message="`name` can not be empty.")
 -     ConversationService.save(**conv)
 -     e, conv = ConversationService.get_by_id(conv["id"])
 -     if not e:
 -         return get_error_data_result(message="Fail to create a session!")
 -     conv = conv.to_dict()
 -     conv['messages'] = conv.pop("message")
 -     conv["chat_id"] = conv.pop("dialog_id")
 -     del conv["reference"]
 -     return get_result(data=conv)
 - 
 - 
 - @manager.route('/agents/<agent_id>/sessions', methods=['POST'])
 - @token_required
 - def create_agent_session(tenant_id, agent_id):
 -     req = request.json
 -     e, cvs = UserCanvasService.get_by_id(agent_id)
 -     if not e:
 -         return get_error_data_result("Agent not found.")
 -     if cvs.user_id != tenant_id:
 -         return get_error_data_result(message="You do not own the agent.")
 - 
 -     if not isinstance(cvs.dsl, str):
 -         cvs.dsl = json.dumps(cvs.dsl, ensure_ascii=False)
 - 
 -     canvas = Canvas(cvs.dsl, tenant_id)
 -     conv = {
 -         "id": get_uuid(),
 -         "dialog_id": cvs.id,
 -         "user_id": req.get("usr_id",""),
 -         "message": [{"role": "assistant", "content": canvas.get_prologue()}],
 -         "source": "agent"
 -     }
 -     API4ConversationService.save(**conv)
 -     conv["agent_id"] = conv.pop("dialog_id")
 -     return get_result(data=conv)
 - 
 - 
 - @manager.route('/chats/<chat_id>/sessions/<session_id>', methods=['PUT'])
 - @token_required
 - def update(tenant_id,chat_id,session_id):
 -     req = request.json
 -     req["dialog_id"] = chat_id
 -     conv_id = session_id
 -     conv = ConversationService.query(id=conv_id,dialog_id=chat_id)
 -     if not conv:
 -         return get_error_data_result(message="Session does not exist")
 -     if not DialogService.query(id=chat_id, tenant_id=tenant_id, status=StatusEnum.VALID.value):
 -         return get_error_data_result(message="You do not own the session")
 -     if "message" in req or "messages" in req:
 -         return get_error_data_result(message="`message` can not be change")
 -     if "reference" in req:
 -         return get_error_data_result(message="`reference` can not be change")
 -     if "name" in req and not req.get("name"):
 -         return get_error_data_result(message="`name` can not be empty.")
 -     if not ConversationService.update_by_id(conv_id, req):
 -         return get_error_data_result(message="Session updates error")
 -     return get_result()
 - 
 - 
 - @manager.route('/chats/<chat_id>/completions', methods=['POST'])
 - @token_required
 - def completion(tenant_id, chat_id):
 -     req = request.json
 -     if not req.get("session_id"):
 -         conv = {
 -             "id": get_uuid(),
 -             "dialog_id": chat_id,
 -             "name": req.get("name", "New session"),
 -             "message": [{"role": "assistant", "content": "Hi! I am your assistant,can I help you?"}]
 -         }
 -         if not conv.get("name"):
 -             return get_error_data_result(message="`name` can not be empty.")
 -         ConversationService.save(**conv)
 -         e, conv = ConversationService.get_by_id(conv["id"])
 -         session_id=conv.id
 -     else:
 -         session_id = req.get("session_id")
 -     if not req.get("question"):
 -         return get_error_data_result(message="Please input your question.")
 -     conv = ConversationService.query(id=session_id,dialog_id=chat_id)
 -     if not conv:
 -         return get_error_data_result(message="Session does not exist")
 -     conv = conv[0]
 -     if not DialogService.query(id=chat_id, tenant_id=tenant_id, status=StatusEnum.VALID.value):
 -         return get_error_data_result(message="You do not own the chat")
 -     msg = []
 -     question = {
 -         "content": req.get("question"),
 -         "role": "user",
 -         "id": str(uuid4())
 -     }
 -     conv.message.append(question)
 -     for m in conv.message:
 -         if m["role"] == "system": continue
 -         if m["role"] == "assistant" and not msg: continue
 -         msg.append(m)
 -     message_id = msg[-1].get("id")
 -     e, dia = DialogService.get_by_id(conv.dialog_id)
 - 
 -     if not conv.reference:
 -         conv.reference = []
 -     conv.message.append({"role": "assistant", "content": "", "id": message_id})
 -     conv.reference.append({"chunks": [], "doc_aggs": []})
 - 
 -     def fillin_conv(ans):
 -         reference = ans["reference"]
 -         if "chunks" in reference:
 -             chunks = reference.get("chunks")
 -             chunk_list = []
 -             for chunk in chunks:
 -                 new_chunk = {
 -                     "id": chunk["chunk_id"],
 -                     "content": chunk["content_with_weight"],
 -                     "document_id": chunk["doc_id"],
 -                     "document_name": chunk["docnm_kwd"],
 -                     "dataset_id": chunk["kb_id"],
 -                     "image_id": chunk.get("img_id", ""),
 -                     "similarity": chunk["similarity"],
 -                     "vector_similarity": chunk["vector_similarity"],
 -                     "term_similarity": chunk["term_similarity"],
 -                     "positions": chunk.get("positions", []),
 -                 }
 -                 chunk_list.append(new_chunk)
 -             reference["chunks"] = chunk_list
 -         nonlocal conv, message_id
 -         if not conv.reference:
 -             conv.reference.append(ans["reference"])
 -         else:
 -             conv.reference[-1] = ans["reference"]
 -         conv.message[-1] = {"role": "assistant", "content": ans["answer"],
 -                             "id": message_id, "prompt": ans.get("prompt", "")}
 -         ans["id"] = message_id
 -         ans["session_id"]=session_id
 - 
 -     def stream():
 -         nonlocal dia, msg, req, conv
 -         try:
 -             for ans in chat(dia, msg, **req):
 -                 fillin_conv(ans)
 -                 yield "data:" + json.dumps({"code": 0,  "data": ans}, ensure_ascii=False) + "\n\n"
 -             ConversationService.update_by_id(conv.id, conv.to_dict())
 -         except Exception as e:
 -             yield "data:" + json.dumps({"code": 500, "message": str(e),
 -                                         "data": {"answer": "**ERROR**: " + str(e),"reference": []}},
 -                                        ensure_ascii=False) + "\n\n"
 -         yield "data:" + json.dumps({"code": 0, "data": True}, ensure_ascii=False) + "\n\n"
 - 
 -     if req.get("stream", True):
 -         resp = Response(stream(), mimetype="text/event-stream")
 -         resp.headers.add_header("Cache-control", "no-cache")
 -         resp.headers.add_header("Connection", "keep-alive")
 -         resp.headers.add_header("X-Accel-Buffering", "no")
 -         resp.headers.add_header("Content-Type", "text/event-stream; charset=utf-8")
 - 
 -         return resp
 - 
 -     else:
 -         answer = None
 -         for ans in chat(dia, msg, **req):
 -             answer = ans
 -             fillin_conv(ans)
 -             ConversationService.update_by_id(conv.id, conv.to_dict())
 -             break
 -         return get_result(data=answer)
 - 
 - 
 - @manager.route('/agents/<agent_id>/completions', methods=['POST'])
 - @token_required
 - def agent_completion(tenant_id, agent_id):
 -     req = request.json
 - 
 -     e, cvs = UserCanvasService.get_by_id(agent_id)
 -     if not e:
 -         return get_error_data_result("Agent not found.")
 -     if cvs.user_id != tenant_id:
 -         return get_error_data_result(message="You do not own the agent.")
 -     if not isinstance(cvs.dsl, str):
 -         cvs.dsl = json.dumps(cvs.dsl, ensure_ascii=False)
 -     canvas = Canvas(cvs.dsl, tenant_id)
 - 
 -     if not req.get("session_id"):
 -         session_id = get_uuid()
 -         conv = {
 -             "id": session_id,
 -             "dialog_id": cvs.id,
 -             "user_id": req.get("user_id",""),
 -             "message": [{"role": "assistant", "content": canvas.get_prologue()}],
 -             "source": "agent"
 -         }
 -         API4ConversationService.save(**conv)
 -         conv = API4Conversation(**conv)
 -     else:
 -         session_id = req.get("session_id")
 -         e, conv = API4ConversationService.get_by_id(req["session_id"])
 -         if not e:
 -             return get_error_data_result(message="Session not found!")
 - 
 -     messages = conv.message
 -     question = req.get("question")
 -     if not question:
 -         return get_error_data_result("`question` is required.")
 -     question={
 -         "role":"user",
 -         "content":question,
 -         "id": str(uuid4())
 -     }
 -     messages.append(question)
 -     msg = []
 -     for m in messages:
 -         if m["role"] == "system":
 -             continue
 -         if m["role"] == "assistant" and not msg:
 -             continue
 -         msg.append(m)
 -     if not msg[-1].get("id"): msg[-1]["id"] = get_uuid()
 -     message_id = msg[-1]["id"]
 - 
 -     if "quote" not in req: req["quote"] = False
 -     stream = req.get("stream", True)
 - 
 -     def fillin_conv(ans):
 -         reference = ans["reference"]
 -         if "chunks" in reference:
 -             chunks = reference.get("chunks")
 -             chunk_list = []
 -             for chunk in chunks:
 -                 new_chunk = {
 -                     "id": chunk["chunk_id"],
 -                     "content": chunk["content_with_weight"],
 -                     "document_id": chunk["doc_id"],
 -                     "document_name": chunk["docnm_kwd"],
 -                     "dataset_id": chunk["kb_id"],
 -                     "image_id": chunk["img_id"],
 -                     "similarity": chunk["similarity"],
 -                     "vector_similarity": chunk["vector_similarity"],
 -                     "term_similarity": chunk["term_similarity"],
 -                     "positions": chunk["positions"],
 -                 }
 -                 chunk_list.append(new_chunk)
 -             reference["chunks"] = chunk_list
 -         nonlocal conv, message_id
 -         if not conv.reference:
 -             conv.reference.append(ans["reference"])
 -         else:
 -             conv.reference[-1] = ans["reference"]
 -         conv.message[-1] = {"role": "assistant", "content": ans["answer"], "id": message_id}
 -         ans["id"] = message_id
 -         ans["session_id"] = session_id
 - 
 -     def rename_field(ans):
 -         reference = ans['reference']
 -         if not isinstance(reference, dict):
 -             return
 -         for chunk_i in reference.get('chunks', []):
 -             if 'docnm_kwd' in chunk_i:
 -                 chunk_i['doc_name'] = chunk_i['docnm_kwd']
 -                 chunk_i.pop('docnm_kwd')
 -     conv.message.append(msg[-1])
 - 
 -     if not conv.reference:
 -         conv.reference = []
 -     conv.message.append({"role": "assistant", "content": "", "id": message_id})
 -     conv.reference.append({"chunks": [], "doc_aggs": []})
 - 
 -     final_ans = {"reference": [], "content": ""}
 - 
 -     canvas.messages.append(msg[-1])
 -     canvas.add_user_input(msg[-1]["content"])
 -     answer = canvas.run(stream=stream)
 - 
 -     assert answer is not None, "Nothing. Is it over?"
 - 
 -     if stream:
 -         assert isinstance(answer, partial), "Nothing. Is it over?"
 - 
 -         def sse():
 -             nonlocal answer, cvs, conv
 -             try:
 -                 for ans in answer():
 -                     for k in ans.keys():
 -                         final_ans[k] = ans[k]
 -                     ans = {"answer": ans["content"], "reference": ans.get("reference", [])}
 -                     fillin_conv(ans)
 -                     rename_field(ans)
 -                     yield "data:" + json.dumps({"code": 0, "message": "", "data": ans},
 -                                                ensure_ascii=False) + "\n\n"
 - 
 -                 canvas.messages.append({"role": "assistant", "content": final_ans["content"], "id": message_id})
 -                 if final_ans.get("reference"):
 -                     canvas.reference.append(final_ans["reference"])
 -                 cvs.dsl = json.loads(str(canvas))
 -                 API4ConversationService.append_message(conv.id, conv.to_dict())
 -             except Exception as e:
 -                 yield "data:" + json.dumps({"code": 500, "message": str(e),
 -                                             "data": {"answer": "**ERROR**: " + str(e), "reference": []}},
 -                                            ensure_ascii=False) + "\n\n"
 -             yield "data:" + json.dumps({"code": 0, "data": True}, ensure_ascii=False) + "\n\n"
 - 
 -         resp = Response(sse(), mimetype="text/event-stream")
 -         resp.headers.add_header("Cache-control", "no-cache")
 -         resp.headers.add_header("Connection", "keep-alive")
 -         resp.headers.add_header("X-Accel-Buffering", "no")
 -         resp.headers.add_header("Content-Type", "text/event-stream; charset=utf-8")
 -         return resp
 - 
 -     final_ans["content"] = "\n".join(answer["content"]) if "content" in answer else ""
 -     canvas.messages.append({"role": "assistant", "content": final_ans["content"], "id": message_id})
 -     if final_ans.get("reference"):
 -         canvas.reference.append(final_ans["reference"])
 -     cvs.dsl = json.loads(str(canvas))
 - 
 -     result = {"answer": final_ans["content"], "reference": final_ans.get("reference", [])}
 -     fillin_conv(result)
 -     API4ConversationService.append_message(conv.id, conv.to_dict())
 -     rename_field(result)
 -     return get_result(data=result)
 - 
 - 
 - @manager.route('/chats/<chat_id>/sessions', methods=['GET'])
 - @token_required
 - def list_session(chat_id,tenant_id):
 -     if not DialogService.query(tenant_id=tenant_id, id=chat_id, status=StatusEnum.VALID.value):
 -         return get_error_data_result(message=f"You don't own the assistant {chat_id}.")
 -     id = request.args.get("id")
 -     name = request.args.get("name")
 -     page_number = int(request.args.get("page", 1))
 -     items_per_page = int(request.args.get("page_size", 30))
 -     orderby = request.args.get("orderby", "create_time")
 -     if request.args.get("desc") == "False" or request.args.get("desc") == "false":
 -         desc = False
 -     else:
 -         desc = True
 -     convs = ConversationService.get_list(chat_id,page_number,items_per_page,orderby,desc,id,name)
 -     if not convs:
 -         return get_result(data=[])
 -     for conv in convs:
 -         conv['messages'] = conv.pop("message")
 -         infos = conv["messages"]
 -         for info in infos:
 -             if "prompt" in info:
 -                 info.pop("prompt")
 -         conv["chat_id"] = conv.pop("dialog_id")
 -         if conv["reference"]:
 -             messages = conv["messages"]
 -             message_num = 0
 -             chunk_num = 0
 -             while message_num < len(messages):
 -                 if message_num != 0 and messages[message_num]["role"] != "user":
 -                     chunk_list = []
 -                     if "chunks" in conv["reference"][chunk_num]:
 -                         chunks = conv["reference"][chunk_num]["chunks"]
 -                         for chunk in chunks:
 -                             new_chunk = {
 -                                 "id": chunk["chunk_id"],
 -                                 "content": chunk["content_with_weight"],
 -                                 "document_id": chunk["doc_id"],
 -                                 "document_name": chunk["docnm_kwd"],
 -                                 "dataset_id": chunk["kb_id"],
 -                                 "image_id": chunk["img_id"],
 -                                 "similarity": chunk["similarity"],
 -                                 "vector_similarity": chunk["vector_similarity"],
 -                                 "term_similarity": chunk["term_similarity"],
 -                                 "positions": chunk["positions"],
 -                             }
 -                             chunk_list.append(new_chunk)
 -                     chunk_num += 1
 -                     messages[message_num]["reference"] = chunk_list
 -                 message_num += 1
 -         del conv["reference"]
 -     return get_result(data=convs)
 - 
 - 
 - @manager.route('/chats/<chat_id>/sessions', methods=["DELETE"])
 - @token_required
 - def delete(tenant_id,chat_id):
 -     if not DialogService.query(id=chat_id, tenant_id=tenant_id, status=StatusEnum.VALID.value):
 -         return get_error_data_result(message="You don't own the chat")
 -     req = request.json
 -     convs = ConversationService.query(dialog_id=chat_id)
 -     if not req:
 -         ids = None
 -     else:
 -         ids=req.get("ids")
 - 
 -     if not ids:
 -         conv_list = []
 -         for conv in convs:
 -             conv_list.append(conv.id)
 -     else:
 -         conv_list=ids
 -     for id in conv_list:
 -         conv = ConversationService.query(id=id,dialog_id=chat_id)
 -         if not conv:
 -             return get_error_data_result(message="The chat doesn't own the session")
 -         ConversationService.delete_by_id(id)
 -     return get_result()
 - 
 - @manager.route('/sessions/ask', methods=['POST'])
 - @token_required
 - def ask_about(tenant_id):
 -     req = request.json
 -     if not req.get("question"):
 -         return get_error_data_result("`question` is required.")
 -     if not req.get("dataset_ids"):
 -         return get_error_data_result("`dataset_ids` is required.")
 -     if not isinstance(req.get("dataset_ids"),list):
 -         return get_error_data_result("`dataset_ids` should be a list.")
 -     req["kb_ids"]=req.pop("dataset_ids")
 -     for kb_id in req["kb_ids"]:
 -         if not KnowledgebaseService.accessible(kb_id,tenant_id):
 -             return get_error_data_result(f"You don't own the dataset {kb_id}.")
 -         kbs = KnowledgebaseService.query(id=kb_id)
 -         kb = kbs[0]
 -         if kb.chunk_num == 0:
 -             return get_error_data_result(f"The dataset {kb_id} doesn't own parsed file")
 -     uid = tenant_id
 -     def stream():
 -         nonlocal req, uid
 -         try:
 -             for ans in ask(req["question"], req["kb_ids"], uid):
 -                 yield "data:" + json.dumps({"code": 0, "message": "", "data": ans}, ensure_ascii=False) + "\n\n"
 -         except Exception as e:
 -             yield "data:" + json.dumps({"code": 500, "message": str(e),
 -                                         "data": {"answer": "**ERROR**: " + str(e), "reference": []}},
 -                                        ensure_ascii=False) + "\n\n"
 -         yield "data:" + json.dumps({"code": 0, "message": "", "data": True}, ensure_ascii=False) + "\n\n"
 - 
 -     resp = Response(stream(), mimetype="text/event-stream")
 -     resp.headers.add_header("Cache-control", "no-cache")
 -     resp.headers.add_header("Connection", "keep-alive")
 -     resp.headers.add_header("X-Accel-Buffering", "no")
 -     resp.headers.add_header("Content-Type", "text/event-stream; charset=utf-8")
 -     return resp
 - 
 - 
 - @manager.route('/sessions/related_questions', methods=['POST'])
 - @token_required
 - def related_questions(tenant_id):
 -     req = request.json
 -     if not req.get("question"):
 -         return get_error_data_result("`question` is required.")
 -     question = req["question"]
 -     chat_mdl = LLMBundle(tenant_id, LLMType.CHAT)
 -     prompt = """
 - Objective: To generate search terms related to the user's search keywords, helping users find more valuable information.
 - Instructions:
 -  - Based on the keywords provided by the user, generate 5-10 related search terms.
 -  - Each search term should be directly or indirectly related to the keyword, guiding the user to find more valuable information.
 -  - Use common, general terms as much as possible, avoiding obscure words or technical jargon.
 -  - Keep the term length between 2-4 words, concise and clear.
 -  - DO NOT translate, use the language of the original keywords.
 - 
 - ### Example:
 - Keywords: Chinese football
 - Related search terms:
 - 1. Current status of Chinese football
 - 2. Reform of Chinese football
 - 3. Youth training of Chinese football
 - 4. Chinese football in the Asian Cup
 - 5. Chinese football in the World Cup
 - 
 - Reason:
 -  - When searching, users often only use one or two keywords, making it difficult to fully express their information needs.
 -  - Generating related search terms can help users dig deeper into relevant information and improve search efficiency. 
 -  - At the same time, related terms can also help search engines better understand user needs and return more accurate search results.
 - 
 - """
 -     ans = chat_mdl.chat(prompt, [{"role": "user", "content": f"""
 - Keywords: {question}
 - Related search terms:
 -     """}], {"temperature": 0.9})
 -     return get_result(data=[re.sub(r"^[0-9]\. ", "", a) for a in ans.split("\n") if re.match(r"^[0-9]\. ", a)])
 
 
  |