| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453 |
- #
- # Copyright 2024 The InfiniFlow Authors. All Rights Reserved.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- #
- import re
- import json
- from api.db import LLMType
- from flask import request, Response
-
- from api.db.services.conversation_service import ConversationService, iframe_completion
- from api.db.services.conversation_service import completion as rag_completion
- from api.db.services.canvas_service import completion as agent_completion
- from api.db.services.dialog_service import ask
- from agent.canvas import Canvas
- from api.db import StatusEnum
- from api.db.db_models import APIToken
- from api.db.services.api_service import API4ConversationService
- from api.db.services.canvas_service import UserCanvasService
- from api.db.services.dialog_service import DialogService
- from api.db.services.knowledgebase_service import KnowledgebaseService
- from api.utils import get_uuid
- from api.utils.api_utils import get_error_data_result
- from api.utils.api_utils import get_result, token_required
- from api.db.services.llm_service import LLMBundle
-
-
@manager.route('/chats/<chat_id>/sessions', methods=['POST'])  # noqa: F821
@token_required
def create(tenant_id, chat_id):
    """Create a session under the chat assistant ``chat_id``.

    The JSON body may carry ``name`` (defaults to ``"New session"``) and
    ``user_id`` (defaults to ``""``). The new session starts with a single
    assistant message holding the assistant's configured ``prologue``.

    Returns an error result when the tenant has no valid assistant with this
    id, when ``name`` is empty, or when the saved session cannot be read
    back. Otherwise returns the stored session with ``message`` exposed as
    ``messages``, ``dialog_id`` exposed as ``chat_id`` and ``reference``
    removed.
    """
    payload = request.json
    payload["dialog_id"] = chat_id

    dialogs = DialogService.query(
        tenant_id=tenant_id,
        id=payload["dialog_id"],
        status=StatusEnum.VALID.value,
    )
    if not dialogs:
        return get_error_data_result(message="You do not own the assistant.")

    record = dict(
        id=get_uuid(),
        dialog_id=payload["dialog_id"],
        name=payload.get("name", "New session"),
        message=[{"role": "assistant", "content": dialogs[0].prompt_config.get("prologue")}],
        user_id=payload.get("user_id", ""),
    )
    # An explicitly supplied empty name is rejected rather than defaulted.
    if not record["name"]:
        return get_error_data_result(message="`name` can not be empty.")

    ConversationService.save(**record)

    # Read the row back so the response reflects what was actually stored.
    found, stored = ConversationService.get_by_id(record["id"])
    if not found:
        return get_error_data_result(message="Fail to create a session!")

    session = stored.to_dict()
    session['messages'] = session.pop("message")
    session["chat_id"] = session.pop("dialog_id")
    del session["reference"]
    return get_result(data=session)
-
-
@manager.route('/agents/<agent_id>/sessions', methods=['POST'])  # noqa: F821
@token_required
def create_agent_session(tenant_id, agent_id):
    """Create a session for the agent ``agent_id``.

    The agent's DSL is loaded into a ``Canvas`` and reset. For every preset
    parameter the canvas reports, the value is taken from the JSON body under
    the parameter's ``key``: a missing required parameter is an error, and a
    missing optional one has any existing ``value`` cleared.

    The optional caller id is read from ``user_id``. The legacy misspelt key
    ``usr_id`` is still accepted as a fallback.

    Returns an error result when the agent does not exist, is not accessible
    to the tenant, or a required preset parameter is missing. Otherwise
    returns the saved session with ``dialog_id`` exposed as ``agent_id``.
    """
    req = request.json
    # The body is optional; normalise anything that is not a JSON object so
    # the preset-parameter lookups below cannot fail on ``None``.
    if not isinstance(req, dict):
        req = {}

    e, cvs = UserCanvasService.get_by_id(agent_id)
    if not e:
        return get_error_data_result("Agent not found.")

    if not UserCanvasService.query(user_id=tenant_id, id=agent_id):
        return get_error_data_result("You cannot access the agent.")

    # Canvas is given the DSL as a JSON string here.
    if not isinstance(cvs.dsl, str):
        cvs.dsl = json.dumps(cvs.dsl, ensure_ascii=False)

    canvas = Canvas(cvs.dsl, tenant_id)
    canvas.reset()

    for ele in canvas.get_preset_param() or ():
        supplied = req.get(ele["key"])
        if supplied:
            ele["value"] = supplied
        elif not ele["optional"]:
            return get_error_data_result(f"`{ele['key']}` is required")
        else:
            # Optional and not supplied: drop any value left in the DSL.
            ele.pop("value", None)

    # Serialise the canvas again so the stored DSL includes the values set
    # on the preset parameters above.
    cvs.dsl = json.loads(str(canvas))
    conv = {
        "id": get_uuid(),
        "dialog_id": cvs.id,
        "user_id": req.get("user_id") or req.get("usr_id", ""),
        "message": [{"role": "assistant", "content": canvas.get_prologue()}],
        "source": "agent",
        "dsl": cvs.dsl
    }
    API4ConversationService.save(**conv)
    conv["agent_id"] = conv.pop("dialog_id")
    return get_result(data=conv)
-
-
@manager.route('/chats/<chat_id>/sessions/<session_id>', methods=['PUT'])  # noqa: F821
@token_required
def update(tenant_id, chat_id, session_id):
    """Update the session ``session_id`` of chat ``chat_id`` from the JSON body.

    The body is passed to ``ConversationService.update_by_id`` with
    ``dialog_id`` set to ``chat_id``. Requests that try to change
    ``message``/``messages`` or ``reference``, or that supply an empty
    ``name``, are rejected.

    Returns an error result when the session does not belong to the chat,
    the tenant has no valid chat with this id, a protected field is present,
    or the update fails. Otherwise returns an empty success result.
    """
    changes = request.json
    changes["dialog_id"] = chat_id

    if not ConversationService.query(id=session_id, dialog_id=chat_id):
        return get_error_data_result(message="Session does not exist")

    owned = DialogService.query(id=chat_id, tenant_id=tenant_id, status=StatusEnum.VALID.value)
    if not owned:
        return get_error_data_result(message="You do not own the session")

    # The conversation history and its references are read-only here.
    if any(field in changes for field in ("message", "messages")):
        return get_error_data_result(message="`message` can not be change")
    if "reference" in changes:
        return get_error_data_result(message="`reference` can not be change")

    # A name may be omitted, but not supplied empty.
    if "name" in changes and not changes["name"]:
        return get_error_data_result(message="`name` can not be empty.")

    updated = ConversationService.update_by_id(session_id, changes)
    if not updated:
        return get_error_data_result(message="Session updates error")
    return get_result()
-
-
@manager.route('/chats/<chat_id>/completions', methods=['POST'])  # noqa: F821
@token_required
def chat_completion(tenant_id, chat_id):
    """Run a completion against the chat assistant ``chat_id``.

    The JSON body is forwarded as keyword arguments to ``rag_completion``.
    Without a ``session_id`` the question is blanked, but every other option
    the caller sent (notably ``stream``) is kept. This matches how
    ``agent_completions`` treats a missing session.

    With ``stream`` true (the default) the answers are returned as a
    ``text/event-stream`` response. Otherwise only the first answer is
    returned, or no data if the completion yields nothing.

    Returns an error result when the tenant has no valid chat with this id
    or the given session does not belong to the chat.
    """
    req = request.json or {}
    session_id = req.get("session_id")
    if not session_id:
        # Previously the whole body was replaced here, which silently
        # discarded ``stream`` and any other option.
        req["question"] = ""

    if not DialogService.query(tenant_id=tenant_id, id=chat_id, status=StatusEnum.VALID.value):
        return get_error_data_result(f"You don't own the chat {chat_id}")
    if session_id:
        if not ConversationService.query(id=session_id, dialog_id=chat_id):
            return get_error_data_result(f"You don't own the session {session_id}")

    if req.get("stream", True):
        resp = Response(rag_completion(tenant_id, chat_id, **req), mimetype="text/event-stream")
        resp.headers.add_header("Cache-control", "no-cache")
        resp.headers.add_header("Connection", "keep-alive")
        resp.headers.add_header("X-Accel-Buffering", "no")
        resp.headers.add_header("Content-Type", "text/event-stream; charset=utf-8")
        return resp

    # Non-streaming callers get only the first item produced.
    answer = next(iter(rag_completion(tenant_id, chat_id, **req)), None)
    return get_result(data=answer)
-
-
@manager.route('/agents/<agent_id>/completions', methods=['POST'])  # noqa: F821
@token_required
def agent_completions(tenant_id, agent_id):
    """Run a completion against the agent ``agent_id``.

    The JSON body is forwarded as keyword arguments to ``agent_completion``.
    The question is blanked when no ``session_id`` is given, and also when a
    session is given but the agent's canvas reports preset parameters.

    With ``stream`` true (the default) the answers are returned as a
    ``text/event-stream`` response. Otherwise only the first answer is
    returned, or no data if the completion yields nothing.

    Returns an error result when the tenant does not own the agent, the
    session does not belong to the agent, or the non-streaming completion
    raises.
    """
    # A missing body is treated like an empty one instead of failing on
    # ``None.get``.
    req = request.json or {}

    cvs = UserCanvasService.query(user_id=tenant_id, id=agent_id)
    if not cvs:
        return get_error_data_result(f"You don't own the agent {agent_id}")

    session_id = req.get("session_id")
    if session_id:
        dsl = cvs[0].dsl
        if not isinstance(dsl, str):
            dsl = json.dumps(dsl)
        canvas = Canvas(dsl, tenant_id)
        # NOTE(review): the question is discarded whenever the canvas has
        # preset parameters; confirm this is the intended contract.
        if canvas.get_preset_param():
            req["question"] = ""
        if not API4ConversationService.query(id=session_id, dialog_id=agent_id):
            return get_error_data_result(f"You don't own the session {session_id}")
    else:
        req["question"] = ""

    if req.get("stream", True):
        resp = Response(agent_completion(tenant_id, agent_id, **req), mimetype="text/event-stream")
        resp.headers.add_header("Cache-control", "no-cache")
        resp.headers.add_header("Connection", "keep-alive")
        resp.headers.add_header("X-Accel-Buffering", "no")
        resp.headers.add_header("Content-Type", "text/event-stream; charset=utf-8")
        return resp

    try:
        # Only the first item is returned. ``None`` covers a completion that
        # yields nothing, which previously made the view return ``None``.
        answer = next(iter(agent_completion(tenant_id, agent_id, **req)), None)
    except Exception as e:
        return get_error_data_result(str(e))
    return get_result(data=answer)
-
-
def _to_sdk_chunk(chunk):
    """Map one stored chunk onto the field names used in the API response.

    Each field prefers the first key and falls back to the second one.
    """
    return {
        "id": chunk.get("chunk_id", chunk.get("id")),
        "content": chunk.get("content_with_weight", chunk.get("content")),
        "document_id": chunk.get("doc_id", chunk.get("document_id")),
        "document_name": chunk.get("docnm_kwd", chunk.get("document_name")),
        "dataset_id": chunk.get("kb_id", chunk.get("dataset_id")),
        "image_id": chunk.get("image_id", chunk.get("img_id")),
        "positions": chunk.get("positions", chunk.get("position_int")),
    }


def _present_session(conv, owner_key):
    """Reshape one stored session dict in place for the API response.

    ``message`` becomes ``messages`` with any ``prompt`` entry stripped from
    each message, ``dialog_id`` is renamed to ``owner_key``, and the
    session-level ``reference`` list is removed. When that list is non-empty,
    its entries are distributed in order onto every message that is neither
    the first message nor a ``user`` message.
    """
    conv['messages'] = conv.pop("message")
    for message in conv["messages"]:
        message.pop("prompt", None)
    conv[owner_key] = conv.pop("dialog_id")

    references = conv.pop("reference")
    if not references:
        return

    ref_idx = 0
    for position, message in enumerate(conv["messages"]):
        if position == 0 or message["role"] == "user":
            continue
        # Guard against fewer reference entries than replies; such replies
        # get an empty reference list instead of raising IndexError.
        entry = references[ref_idx] if ref_idx < len(references) else {}
        chunks = entry["chunks"] if "chunks" in entry else []
        message["reference"] = [_to_sdk_chunk(chunk) for chunk in chunks]
        ref_idx += 1


@manager.route('/chats/<chat_id>/sessions', methods=['GET'])  # noqa: F821
@token_required
def list_session(tenant_id, chat_id):
    """List the sessions of the chat assistant ``chat_id``.

    Query arguments: ``id``, ``name`` and ``user_id`` filters, ``page``
    (default 1), ``page_size`` (default 30), ``orderby`` (default
    ``create_time``) and ``desc`` (descending unless it is ``"False"`` or
    ``"false"``).

    Returns an error result when the tenant has no valid chat with this id.
    Otherwise returns the sessions with ``message`` exposed as ``messages``,
    ``dialog_id`` as ``chat_id``, and references attached per message.
    """
    if not DialogService.query(tenant_id=tenant_id, id=chat_id, status=StatusEnum.VALID.value):
        return get_error_data_result(message=f"You don't own the assistant {chat_id}.")

    session_id = request.args.get("id")
    name = request.args.get("name")
    page_number = int(request.args.get("page", 1))
    items_per_page = int(request.args.get("page_size", 30))
    orderby = request.args.get("orderby", "create_time")
    user_id = request.args.get("user_id")
    desc = request.args.get("desc") not in ("False", "false")

    convs = ConversationService.get_list(chat_id, page_number, items_per_page, orderby, desc, session_id, name, user_id)
    if not convs:
        return get_result(data=[])
    for conv in convs:
        _present_session(conv, "chat_id")
    return get_result(data=convs)


@manager.route('/agents/<agent_id>/sessions', methods=['GET'])  # noqa: F821
@token_required
def list_agent_session(tenant_id, agent_id):
    """List the sessions of the agent ``agent_id``.

    Query arguments: ``id`` filter, ``page`` (default 1), ``page_size``
    (default 30), ``orderby`` (default ``update_time``) and ``desc``
    (descending unless it is ``"False"`` or ``"false"``).

    Returns an error result when the tenant does not own the agent or the
    requested session id. Otherwise returns the sessions with ``message``
    exposed as ``messages``, ``dialog_id`` as ``agent_id``, and references
    attached per message.
    """
    if not UserCanvasService.query(user_id=tenant_id, id=agent_id):
        return get_error_data_result(message=f"You don't own the agent {agent_id}.")

    session_id = request.args.get("id")
    # Only verify ownership of a session when one was actually requested;
    # without this guard an unfiltered listing could fail with
    # "You don't own the session None".
    # NOTE(review): the check matches on user_id == tenant_id; confirm that
    # is how agent sessions are keyed.
    if session_id and not API4ConversationService.query(id=session_id, user_id=tenant_id):
        return get_error_data_result(f"You don't own the session {session_id}")

    page_number = int(request.args.get("page", 1))
    items_per_page = int(request.args.get("page_size", 30))
    orderby = request.args.get("orderby", "update_time")
    desc = request.args.get("desc") not in ("False", "false")

    convs = API4ConversationService.get_list(agent_id, tenant_id, page_number, items_per_page, orderby, desc, session_id)
    if not convs:
        return get_result(data=[])
    for conv in convs:
        _present_session(conv, "agent_id")
    return get_result(data=convs)
-
-
@manager.route('/chats/<chat_id>/sessions', methods=["DELETE"])  # noqa: F821
@token_required
def delete(tenant_id, chat_id):
    """Delete sessions of the chat assistant ``chat_id``.

    When the JSON body carries a non-empty ``ids`` list, exactly those
    sessions are deleted. Otherwise every session of the chat is deleted.

    Returns an error result when the tenant has no valid chat with this id
    or any requested id does not belong to the chat. In the latter case
    nothing is deleted. Otherwise returns an empty success result.
    """
    if not DialogService.query(id=chat_id, tenant_id=tenant_id, status=StatusEnum.VALID.value):
        return get_error_data_result(message="You don't own the chat")

    req = request.json
    requested_ids = req.get("ids") if req else None

    if requested_ids:
        # Validate everything before deleting anything, so one bad id cannot
        # leave the request half-applied.
        for session_id in requested_ids:
            if not ConversationService.query(id=session_id, dialog_id=chat_id):
                return get_error_data_result(message="The chat doesn't own the session")
        targets = requested_ids
    else:
        # The chat's sessions are only looked up when no ids were given.
        targets = [conv.id for conv in ConversationService.query(dialog_id=chat_id)]

    for session_id in targets:
        ConversationService.delete_by_id(session_id)
    return get_result()
-
-
@manager.route('/sessions/ask', methods=['POST'])  # noqa: F821
@token_required
def ask_about(tenant_id):
    """Answer a question against one or more datasets as an event stream.

    The JSON body must carry a non-empty ``question`` and a non-empty list
    ``dataset_ids``. Each dataset must be accessible to the tenant and have
    a non-zero ``chunk_num``.

    Returns an error result when validation fails. Otherwise returns a
    ``text/event-stream`` response with one frame per answer from ``ask``,
    an error frame if ``ask`` raises, and a final frame whose ``data`` is
    ``True``.
    """
    payload = request.json
    if not payload.get("question"):
        return get_error_data_result("`question` is required.")

    dataset_ids = payload.get("dataset_ids")
    if not dataset_ids:
        return get_error_data_result("`dataset_ids` is required.")
    if not isinstance(dataset_ids, list):
        return get_error_data_result("`dataset_ids` should be a list.")

    payload["kb_ids"] = payload.pop("dataset_ids")
    for kb_id in payload["kb_ids"]:
        if not KnowledgebaseService.accessible(kb_id, tenant_id):
            return get_error_data_result(f"You don't own the dataset {kb_id}.")
        kb = KnowledgebaseService.query(id=kb_id)[0]
        if kb.chunk_num == 0:
            return get_error_data_result(f"The dataset {kb_id} doesn't own parsed file")

    question = payload["question"]
    kb_ids = payload["kb_ids"]
    uid = tenant_id

    def sse(body):
        # One server-sent-event frame carrying a JSON body.
        return "data:" + json.dumps(body, ensure_ascii=False) + "\n\n"

    def stream():
        try:
            for ans in ask(question, kb_ids, uid):
                yield sse({"code": 0, "message": "", "data": ans})
        except Exception as e:
            # Errors are reported inside the stream, which then still ends
            # with the closing frame below.
            yield sse({"code": 500, "message": str(e),
                       "data": {"answer": "**ERROR**: " + str(e), "reference": []}})
        yield sse({"code": 0, "message": "", "data": True})

    resp = Response(stream(), mimetype="text/event-stream")
    for header, value in (
        ("Cache-control", "no-cache"),
        ("Connection", "keep-alive"),
        ("X-Accel-Buffering", "no"),
        ("Content-Type", "text/event-stream; charset=utf-8"),
    ):
        resp.headers.add_header(header, value)
    return resp
-
-
@manager.route('/sessions/related_questions', methods=['POST'])  # noqa: F821
@token_required
def related_questions(tenant_id):
    """Suggest search terms related to the ``question`` in the JSON body.

    The tenant's chat model is prompted for a numbered list of related
    search terms. Every reply line that starts with ``<number>. `` is
    returned with that prefix removed; all other lines are ignored.

    Returns an error result when ``question`` is missing or empty.
    """
    req = request.json
    if not req.get("question"):
        return get_error_data_result("`question` is required.")
    question = req["question"]
    chat_mdl = LLMBundle(tenant_id, LLMType.CHAT)
    prompt = """
Objective: To generate search terms related to the user's search keywords, helping users find more valuable information.
Instructions:
- Based on the keywords provided by the user, generate 5-10 related search terms.
- Each search term should be directly or indirectly related to the keyword, guiding the user to find more valuable information.
- Use common, general terms as much as possible, avoiding obscure words or technical jargon.
- Keep the term length between 2-4 words, concise and clear.
- DO NOT translate, use the language of the original keywords.

### Example:
Keywords: Chinese football
Related search terms:
1. Current status of Chinese football
2. Reform of Chinese football
3. Youth training of Chinese football
4. Chinese football in the Asian Cup
5. Chinese football in the World Cup

Reason:
- When searching, users often only use one or two keywords, making it difficult to fully express their information needs.
- Generating related search terms can help users dig deeper into relevant information and improve search efficiency.
- At the same time, related terms can also help search engines better understand user needs and return more accurate search results.

"""
    ans = chat_mdl.chat(prompt, [{"role": "user", "content": f"""
Keywords: {question}
Related search terms:
"""}], {"temperature": 0.9})

    # The prompt asks for up to 10 terms, so the numbering can have more
    # than one digit; a single-digit pattern would drop item "10.".
    numbered = re.compile(r"^[0-9]+\. ")
    return get_result(data=[numbered.sub("", line) for line in ans.split("\n") if numbered.match(line)])
-
-
@manager.route('/chatbots/<dialog_id>/completions', methods=['POST'])  # noqa: F821
def chatbot_completions(dialog_id):
    """Run a completion for an embedded chatbot, authenticated by beta token.

    The ``Authorization`` header must consist of exactly two
    whitespace-separated parts; the second is looked up as an ``APIToken``
    ``beta`` value. The JSON body is forwarded as keyword arguments to
    ``iframe_completion``, with ``quote`` defaulting to ``False``.

    With ``stream`` true (the default) the answers are returned as a
    ``text/event-stream`` response. Otherwise only the first answer is
    returned, or no data if the completion yields nothing.

    Returns an error result when the header is missing or malformed, or the
    token is unknown.
    """
    req = request.json

    # A missing header is handled like a malformed one instead of failing
    # on ``None.split()``.
    token = (request.headers.get('Authorization') or '').split()
    if len(token) != 2:
        return get_error_data_result(message='Authorization is not valid!"')
    token = token[1]
    # NOTE(review): the token is only checked for existence here; whether it
    # is tied to ``dialog_id`` is presumably enforced downstream. Confirm.
    objs = APIToken.query(beta=token)
    if not objs:
        return get_error_data_result(message='Token is not valid!"')

    if "quote" not in req:
        req["quote"] = False

    if req.get("stream", True):
        resp = Response(iframe_completion(dialog_id, **req), mimetype="text/event-stream")
        resp.headers.add_header("Cache-control", "no-cache")
        resp.headers.add_header("Connection", "keep-alive")
        resp.headers.add_header("X-Accel-Buffering", "no")
        resp.headers.add_header("Content-Type", "text/event-stream; charset=utf-8")
        return resp

    # Only the first item is returned. ``None`` covers a completion that
    # yields nothing, which previously made the view return ``None``.
    answer = next(iter(iframe_completion(dialog_id, **req)), None)
    return get_result(data=answer)
-
-
@manager.route('/agentbots/<agent_id>/completions', methods=['POST'])  # noqa: F821
def agent_bot_completions(agent_id):
    """Run a completion for an embedded agent bot, authenticated by beta token.

    The ``Authorization`` header must consist of exactly two
    whitespace-separated parts; the second is looked up as an ``APIToken``
    ``beta`` value. The tenant of the first matching token is used for the
    call. The JSON body is forwarded as keyword arguments to
    ``agent_completion``, with ``quote`` defaulting to ``False``.

    With ``stream`` true (the default) the answers are returned as a
    ``text/event-stream`` response. Otherwise only the first answer is
    returned, or no data if the completion yields nothing.

    Returns an error result when the header is missing or malformed, or the
    token is unknown.
    """
    req = request.json

    # A missing header is handled like a malformed one instead of failing
    # on ``None.split()``.
    token = (request.headers.get('Authorization') or '').split()
    if len(token) != 2:
        return get_error_data_result(message='Authorization is not valid!"')
    token = token[1]
    objs = APIToken.query(beta=token)
    if not objs:
        return get_error_data_result(message='Token is not valid!"')
    bot_tenant_id = objs[0].tenant_id

    if "quote" not in req:
        req["quote"] = False

    if req.get("stream", True):
        resp = Response(agent_completion(bot_tenant_id, agent_id, **req), mimetype="text/event-stream")
        resp.headers.add_header("Cache-control", "no-cache")
        resp.headers.add_header("Connection", "keep-alive")
        resp.headers.add_header("X-Accel-Buffering", "no")
        resp.headers.add_header("Content-Type", "text/event-stream; charset=utf-8")
        return resp

    # Only the first item is returned. ``None`` covers a completion that
    # yields nothing, which previously made the view return ``None``.
    answer = next(iter(agent_completion(bot_tenant_id, agent_id, **req)), None)
    return get_result(data=answer)
-
|