### What problem does this PR solve?

Enhance the prompt of the `related_questions` API.

### Type of change

- [x] Enhancement
- [x] Documentation Update

7 月之前 · ee6a0bd9db
--- a/api/apps/conversation_app.py
+++ b/api/apps/conversation_app.py
@@ -17,26 +17,25 @@ import json
 import re
 import traceback
 from copy import deepcopy
 import trio
 from api.db.db_models import APIToken

 from api.db.services.conversation_service import ConversationService, structure_answer
 from api.db.services.user_service import UserTenantService
 from flask import request, Response
 from flask_login import login_required, current_user
 import trio
 from flask import Response, request
 from flask_login import current_user, login_required

 from api import settings
 from api.db import LLMType
 from api.db.services.dialog_service import DialogService, chat, ask
 from api.db.db_models import APIToken
 from api.db.services.conversation_service import ConversationService, structure_answer
 from api.db.services.dialog_service import DialogService, ask, chat
 from api.db.services.knowledgebase_service import KnowledgebaseService
 from api.db.services.llm_service import LLMBundle, TenantService
 from api import settings
 from api.utils.api_utils import get_json_result
 from api.utils.api_utils import server_error_response, get_data_error_result, validate_request
 from api.db.services.user_service import UserTenantService
 from api.utils.api_utils import get_data_error_result, get_json_result, server_error_response, validate_request
 from graphrag.general.mind_map_extractor import MindMapExtractor
 from rag.app.tag import label_question


@manager.route('/set', methods=['POST'])  # noqa: F821
@manager.route("/set", methods=["POST"])  # noqa: F821
@login_required
 def set_conversation():
    req = request.json
@@ -50,8 +49,7 @@ def set_conversation():
                return get_data_error_result(message="Conversation not found!")
            e, conv = ConversationService.get_by_id(conv_id)
            if not e:
                return get_data_error_result(
                    message="Fail to update a conversation!")
                return get_data_error_result(message="Fail to update a conversation!")
            conv = conv.to_dict()
            return get_json_result(data=conv)
        except Exception as e:
@@ -61,38 +59,30 @@ def set_conversation():
        e, dia = DialogService.get_by_id(req["dialog_id"])
        if not e:
            return get_data_error_result(message="Dialog not found")
        conv = {
            "id": conv_id,
            "dialog_id": req["dialog_id"],
            "name": req.get("name", "New conversation"),
            "message": [{"role": "assistant", "content": dia.prompt_config["prologue"]}]
        }
        conv = {"id": conv_id, "dialog_id": req["dialog_id"], "name": req.get("name", "New conversation"), "message": [{"role": "assistant", "content": dia.prompt_config["prologue"]}]}
        ConversationService.save(**conv)
        return get_json_result(data=conv)
    except Exception as e:
        return server_error_response(e)


@manager.route('/get', methods=['GET'])  # noqa: F821
@manager.route("/get", methods=["GET"])  # noqa: F821
@login_required
 def get():
    conv_id = request.args["conversation_id"]
    try:

        e, conv = ConversationService.get_by_id(conv_id)
        if not e:
            return get_data_error_result(message="Conversation not found!")
        tenants = UserTenantService.query(user_id=current_user.id)
        avatar =None
        avatar = None
        for tenant in tenants:
            dialog = DialogService.query(tenant_id=tenant.tenant_id, id=conv.dialog_id)
            if dialog and len(dialog)>0:
            if dialog and len(dialog) > 0:
                avatar = dialog[0].icon
                break
        else:
            return get_json_result(
                data=False, message='Only owner of conversation authorized for this operation.',
                code=settings.RetCode.OPERATING_ERROR)
            return get_json_result(data=False, message="Only owner of conversation authorized for this operation.", code=settings.RetCode.OPERATING_ERROR)

        def get_value(d, k1, k2):
            return d.get(k1, d.get(k2))
@@ -100,26 +90,29 @@ def get():
        for ref in conv.reference:
            if isinstance(ref, list):
                continue
            ref["chunks"] = [{
                "id": get_value(ck, "chunk_id", "id"),
                "content": get_value(ck, "content", "content_with_weight"),
                "document_id": get_value(ck, "doc_id", "document_id"),
                "document_name": get_value(ck, "docnm_kwd", "document_name"),
                "dataset_id": get_value(ck, "kb_id", "dataset_id"),
                "image_id": get_value(ck, "image_id", "img_id"),
                "positions": get_value(ck, "positions", "position_int"),
            } for ck in ref.get("chunks", [])]
            ref["chunks"] = [
                {
                    "id": get_value(ck, "chunk_id", "id"),
                    "content": get_value(ck, "content", "content_with_weight"),
                    "document_id": get_value(ck, "doc_id", "document_id"),
                    "document_name": get_value(ck, "docnm_kwd", "document_name"),
                    "dataset_id": get_value(ck, "kb_id", "dataset_id"),
                    "image_id": get_value(ck, "image_id", "img_id"),
                    "positions": get_value(ck, "positions", "position_int"),
                }
                for ck in ref.get("chunks", [])
            ]

        conv = conv.to_dict()
        conv["avatar"]=avatar
        conv["avatar"] = avatar
        return get_json_result(data=conv)
    except Exception as e:
        return server_error_response(e)

@manager.route('/getsse/<dialog_id>', methods=['GET'])  # type: ignore # noqa: F821
 def getsse(dialog_id):

    token = request.headers.get('Authorization').split()
@manager.route("/getsse/<dialog_id>", methods=["GET"])  # type: ignore # noqa: F821
 def getsse(dialog_id):
    token = request.headers.get("Authorization").split()
    if len(token) != 2:
        return get_data_error_result(message='Authorization is not valid!"')
    token = token[1]
@@ -131,13 +124,14 @@ def getsse(dialog_id):
        if not e:
            return get_data_error_result(message="Dialog not found!")
        conv = conv.to_dict()
        conv["avatar"]= conv["icon"]
        conv["avatar"] = conv["icon"]
        del conv["icon"]
        return get_json_result(data=conv)
    except Exception as e:
        return server_error_response(e)

@manager.route('/rm', methods=['POST'])  # noqa: F821

@manager.route("/rm", methods=["POST"])  # noqa: F821
@login_required
 def rm():
    conv_ids = request.json["conversation_ids"]
@@ -151,28 +145,21 @@ def rm():
                if DialogService.query(tenant_id=tenant.tenant_id, id=conv.dialog_id):
                    break
            else:
                return get_json_result(
                    data=False, message='Only owner of conversation authorized for this operation.',
                    code=settings.RetCode.OPERATING_ERROR)
                return get_json_result(data=False, message="Only owner of conversation authorized for this operation.", code=settings.RetCode.OPERATING_ERROR)
            ConversationService.delete_by_id(cid)
        return get_json_result(data=True)
    except Exception as e:
        return server_error_response(e)


@manager.route('/list', methods=['GET'])  # noqa: F821
@manager.route("/list", methods=["GET"])  # noqa: F821
@login_required
 def list_convsersation():
    dialog_id = request.args["dialog_id"]
    try:
        if not DialogService.query(tenant_id=current_user.id, id=dialog_id):
            return get_json_result(
                data=False, message='Only owner of dialog authorized for this operation.',
                code=settings.RetCode.OPERATING_ERROR)
        convs = ConversationService.query(
            dialog_id=dialog_id,
            order_by=ConversationService.model.create_time,
            reverse=True)
            return get_json_result(data=False, message="Only owner of dialog authorized for this operation.", code=settings.RetCode.OPERATING_ERROR)
        convs = ConversationService.query(dialog_id=dialog_id, order_by=ConversationService.model.create_time, reverse=True)

        convs = [d.to_dict() for d in convs]
        return get_json_result(data=convs)
@@ -180,7 +167,7 @@ def list_convsersation():
        return server_error_response(e)


@manager.route('/completion', methods=['POST'])  # noqa: F821
@manager.route("/completion", methods=["POST"])  # noqa: F821
@login_required
@validate_request("conversation_id", "messages")
 def completion():
@@ -207,25 +194,30 @@ def completion():
        if not conv.reference:
            conv.reference = []
        else:

            def get_value(d, k1, k2):
                return d.get(k1, d.get(k2))

            for ref in conv.reference:
                if isinstance(ref, list):
                    continue
                ref["chunks"] = [{
                    "id": get_value(ck, "chunk_id", "id"),
                    "content": get_value(ck, "content", "content_with_weight"),
                    "document_id": get_value(ck, "doc_id", "document_id"),
                    "document_name": get_value(ck, "docnm_kwd", "document_name"),
                    "dataset_id": get_value(ck, "kb_id", "dataset_id"),
                    "image_id": get_value(ck, "image_id", "img_id"),
                    "positions": get_value(ck, "positions", "position_int"),
                } for ck in ref.get("chunks", [])]
                ref["chunks"] = [
                    {
                        "id": get_value(ck, "chunk_id", "id"),
                        "content": get_value(ck, "content", "content_with_weight"),
                        "document_id": get_value(ck, "doc_id", "document_id"),
                        "document_name": get_value(ck, "docnm_kwd", "document_name"),
                        "dataset_id": get_value(ck, "kb_id", "dataset_id"),
                        "image_id": get_value(ck, "image_id", "img_id"),
                        "positions": get_value(ck, "positions", "position_int"),
                    }
                    for ck in ref.get("chunks", [])
                ]

        if not conv.reference:
            conv.reference = []
        conv.reference.append({"chunks": [], "doc_aggs": []})

        def stream():
            nonlocal dia, msg, req, conv
            try:
@@ -235,9 +227,7 @@ def completion():
                ConversationService.update_by_id(conv.id, conv.to_dict())
            except Exception as e:
                traceback.print_exc()
                yield "data:" + json.dumps({"code": 500, "message": str(e),
                                            "data": {"answer": "**ERROR**: " + str(e), "reference": []}},
                                           ensure_ascii=False) + "\n\n"
                yield "data:" + json.dumps({"code": 500, "message": str(e), "data": {"answer": "**ERROR**: " + str(e), "reference": []}}, ensure_ascii=False) + "\n\n"
            yield "data:" + json.dumps({"code": 0, "message": "", "data": True}, ensure_ascii=False) + "\n\n"

        if req.get("stream", True):
@@ -259,7 +249,7 @@ def completion():
        return server_error_response(e)


@manager.route('/tts', methods=['POST'])  # noqa: F821
@manager.route("/tts", methods=["POST"])  # noqa: F821
@login_required
 def tts():
    req = request.json
@@ -281,9 +271,7 @@ def tts():
                for chunk in tts_mdl.tts(txt):
                    yield chunk
        except Exception as e:
            yield ("data:" + json.dumps({"code": 500, "message": str(e),
                                         "data": {"answer": "**ERROR**: " + str(e)}},
                                        ensure_ascii=False)).encode('utf-8')
            yield ("data:" + json.dumps({"code": 500, "message": str(e), "data": {"answer": "**ERROR**: " + str(e)}}, ensure_ascii=False)).encode("utf-8")

    resp = Response(stream_audio(), mimetype="audio/mpeg")
    resp.headers.add_header("Cache-Control", "no-cache")
@@ -293,7 +281,7 @@ def tts():
    return resp


@manager.route('/delete_msg', methods=['POST'])  # noqa: F821
@manager.route("/delete_msg", methods=["POST"])  # noqa: F821
@login_required
@validate_request("conversation_id", "message_id")
 def delete_msg():
@@ -316,7 +304,7 @@ def delete_msg():
    return get_json_result(data=conv)


@manager.route('/thumbup', methods=['POST'])  # noqa: F821
@manager.route("/thumbup", methods=["POST"])  # noqa: F821
@login_required
@validate_request("conversation_id", "message_id")
 def thumbup():
@@ -343,7 +331,7 @@ def thumbup():
    return get_json_result(data=conv)


@manager.route('/ask', methods=['POST'])  # noqa: F821
@manager.route("/ask", methods=["POST"])  # noqa: F821
@login_required
@validate_request("question", "kb_ids")
 def ask_about():
@@ -356,9 +344,7 @@ def ask_about():
            for ans in ask(req["question"], req["kb_ids"], uid):
                yield "data:" + json.dumps({"code": 0, "message": "", "data": ans}, ensure_ascii=False) + "\n\n"
        except Exception as e:
            yield "data:" + json.dumps({"code": 500, "message": str(e),
                                        "data": {"answer": "**ERROR**: " + str(e), "reference": []}},
                                       ensure_ascii=False) + "\n\n"
            yield "data:" + json.dumps({"code": 500, "message": str(e), "data": {"answer": "**ERROR**: " + str(e), "reference": []}}, ensure_ascii=False) + "\n\n"
        yield "data:" + json.dumps({"code": 0, "message": "", "data": True}, ensure_ascii=False) + "\n\n"

    resp = Response(stream(), mimetype="text/event-stream")
@@ -369,7 +355,7 @@ def ask_about():
    return resp


@manager.route('/mindmap', methods=['POST'])  # noqa: F821
@manager.route("/mindmap", methods=["POST"])  # noqa: F821
@login_required
@validate_request("question", "kb_ids")
 def mindmap():
@@ -382,10 +368,7 @@ def mindmap():
    embd_mdl = LLMBundle(kb.tenant_id, LLMType.EMBEDDING, llm_name=kb.embd_id)
    chat_mdl = LLMBundle(current_user.id, LLMType.CHAT)
    question = req["question"]
    ranks = settings.retrievaler.retrieval(question, embd_mdl, kb.tenant_id, kb_ids, 1, 12,
                                           0.3, 0.3, aggs=False,
                                           rank_feature=label_question(question, [kb])
                                           )
    ranks = settings.retrievaler.retrieval(question, embd_mdl, kb.tenant_id, kb_ids, 1, 12, 0.3, 0.3, aggs=False, rank_feature=label_question(question, [kb]))
    mindmap = MindMapExtractor(chat_mdl)
    mind_map = trio.run(mindmap, [c["content_with_weight"] for c in ranks["chunks"]])
    mind_map = mind_map.output
@@ -394,7 +377,7 @@ def mindmap():
    return get_json_result(data=mind_map)


@manager.route('/related_questions', methods=['POST'])  # noqa: F821
@manager.route("/related_questions", methods=["POST"])  # noqa: F821
@login_required
@validate_request("question")
 def related_questions():
@@ -402,31 +385,49 @@ def related_questions():
    question = req["question"]
    chat_mdl = LLMBundle(current_user.id, LLMType.CHAT)
    prompt = """
 Objective: To generate search terms related to the user's search keywords, helping users find more valuable information.
 Role: You are an AI language model assistant tasked with generating 5-10 related questions based on a user’s original query. These questions should help expand the search query scope and improve search relevance.

 Instructions:
 - Based on the keywords provided by the user, generate 5-10 related search terms.
 - Each search term should be directly or indirectly related to the keyword, guiding the user to find more valuable information.
 - Use common, general terms as much as possible, avoiding obscure words or technical jargon.
 - Keep the term length between 2-4 words, concise and clear.
 - DO NOT translate, use the language of the original keywords.

 ### Example:
 Keywords: Chinese football
 Related search terms:
 1. Current status of Chinese football
 2. Reform of Chinese football
 3. Youth training of Chinese football
 4. Chinese football in the Asian Cup
 5. Chinese football in the World Cup
 	Input: You are provided with a user’s question.
 	Output: Generate 5-10 alternative questions that are related to the original user question. These alternatives should help retrieve a broader range of relevant documents from a vector database.
 	Context: Focus on rephrasing the original question in different ways, making sure the alternative questions are diverse but still connected to the topic of the original query. Do not create overly obscure, irrelevant, or unrelated questions.
 	Fallback: If you cannot generate any relevant alternatives, do not return any questions.
 	Guidance:
 	1. Each alternative should be unique but still relevant to the original query.
 	2. Keep the phrasing clear, concise, and easy to understand.
 	3. Avoid overly technical jargon or specialized terms unless directly relevant.
 	4. Ensure that each question contributes towards improving search results by broadening the search angle, not narrowing it.

 Example:
 Original Question: What are the benefits of electric vehicles?

 Alternative Questions:
 	1. How do electric vehicles impact the environment?
 	2. What are the advantages of owning an electric car?
 	3. What is the cost-effectiveness of electric vehicles?
 	4. How do electric vehicles compare to traditional cars in terms of fuel efficiency?
 	5. What are the environmental benefits of switching to electric cars?
 	6. How do electric vehicles help reduce carbon emissions?
 	7. Why are electric vehicles becoming more popular?
 	8. What are the long-term savings of using electric vehicles?
 	9. How do electric vehicles contribute to sustainability?
 	10. What are the key benefits of electric vehicles for consumers?

 Reason:
 - When searching, users often only use one or two keywords, making it difficult to fully express their information needs.
 - Generating related search terms can help users dig deeper into relevant information and improve search efficiency. 
 - At the same time, related terms can also help search engines better understand user needs and return more accurate search results.
 
 	Rephrasing the original query into multiple alternative questions helps the user explore different aspects of their search topic, improving the quality of search results.
 	These questions guide the search engine to provide a more comprehensive set of relevant documents.
 """
    ans = chat_mdl.chat(prompt, [{"role": "user", "content": f"""
    ans = chat_mdl.chat(
        prompt,
        [
            {
                "role": "user",
                "content": f"""
 Keywords: {question}
 Related search terms:
    """}], {"temperature": 0.9})
    """,
            }
        ],
        {"temperature": 0.9},
    )
    return get_json_result(data=[re.sub(r"^[0-9]\. ", "", a) for a in ans.split("\n") if re.match(r"^[0-9]\. ", a)])
--- a/docs/references/http_api_reference.md
+++ b/docs/references/http_api_reference.md
@@ -535,17 +535,15 @@ Failure:

 ---

 | Code | Message | Description |
 |------|---------|-------------|
 | 400  | Bad Request | Invalid request parameters |
 | 401  | Unauthorized | Unauthorized access |
 | 403  | Forbidden | Access denied |
 | 404  | Not Found | Resource not found |
 | 500  | Internal Server Error | Server internal error |
 | 1001 | Invalid Chunk ID | Invalid Chunk ID |
 | 1002 | Chunk Update Failed | Chunk update failed |


 | Code | Message               | Description                |
 | ---- | --------------------- | -------------------------- |
 | 400  | Bad Request           | Invalid request parameters |
 | 401  | Unauthorized          | Unauthorized access        |
 | 403  | Forbidden             | Access denied              |
 | 404  | Not Found             | Resource not found         |
 | 500  | Internal Server Error | Server internal error      |
 | 1001 | Invalid Chunk ID      | Invalid Chunk ID           |
 | 1002 | Chunk Update Failed   | Chunk update failed        |

 ---

@@ -1091,6 +1089,7 @@ curl --request POST \
  The key terms or phrases to tag with the chunk.
 - `"questions"`(*Body parameter*), `list[string]`
  If questions are given, the chunk embeddings will be based on them.

 #### Response

 Success:
@@ -1549,7 +1548,7 @@ curl --request POST \
    - All the variables in 'System' should be curly bracketed.
    - The default value is `[{"key": "knowledge", "optional": true}]`.
  - `"rerank_model"`: `string` If it is not specified, vector cosine similarity will be used; otherwise, reranking score will be used.
  -  `top_k`: `int` Refers to the process of reordering or selecting the top-k items from a list or set based on a specific ranking criterion. Default to 1024.
  - `"top_k"`: `int` Refers to the process of reordering or selecting the top-k items from a list or set based on a specific ranking criterion. Defaults to 1024.
  - `"empty_response"`: `string` If nothing is retrieved in the dataset for the user's question, this will be used as the response. To allow the LLM to improvise when nothing is found, leave this blank.
  - `"opener"`: `string` The opening greeting for the user. Defaults to `"Hi! I am your assistant, can I help you?"`.
  - `"show_quote"`: `boolean` Indicates whether the source of text should be displayed. Defaults to `true`.
@@ -2148,8 +2147,10 @@ Failure:
 Asks a specified chat assistant a question to start an AI-powered conversation.

 :::tip NOTE

 - In streaming mode, not all responses include a reference, as this depends on the system's judgement.
 - In streaming mode, the last message is an empty message:

  ```json
  data:
  {
@@ -2157,6 +2158,7 @@ Asks a specified chat assistant a question to start an AI-powered conversation.
    "data": true
  }
  ```

 :::

 #### Request
@@ -2183,6 +2185,7 @@ curl --request POST \
     {
     }'
 ```

 ```bash
 curl --request POST \
     --url http://{address}/api/v1/chats/{chat_id}/completions \
@@ -2214,6 +2217,7 @@ curl --request POST \
 #### Response

 Success without `session_id`:

 ```json
 data:{
    "code": 0,
@@ -2504,8 +2508,10 @@ Failure:
 Asks a specified agent a question to start an AI-powered conversation.

 :::tip NOTE

 - In streaming mode, not all responses include a reference, as this depends on the system's judgement.
 - In streaming mode, the last message is an empty message:

  ```json
  data:
  {
@@ -2513,6 +2519,7 @@ Asks a specified agent a question to start an AI-powered conversation.
    "data": true
  }
  ```

 :::

 #### Request
@@ -2529,9 +2536,12 @@ Asks a specified agent a question to start an AI-powered conversation.
  - `"user_id"`: `string`(optional)
  - `"sync_dsl"`: `boolean` (optional)
  - other parameters: `string`

 ##### Request example

 If the **Begin** component does not take parameters, the following code will create a session.
 ```bash 

 ```bash
 curl --request POST \
     --url http://{address}/api/v1/agents/{agent_id}/completions \
     --header 'Content-Type: application/json' \
@@ -2540,7 +2550,9 @@ curl --request POST \
     {
     }'
 ```

 If the **Begin** component takes parameters, the following code will create a session.

 ```bash
 curl --request POST \
     --url http://{address}/api/v1/agents/{agent_id}/completions \
@@ -2552,7 +2564,9 @@ curl --request POST \
          "file":"How is the weather tomorrow?"
     }'
 ```

 The following code will execute the completion process.

 ```bash
 curl --request POST \
     --url http://{address}/api/v1/agents/{agent_id}/completions \
@@ -2586,7 +2600,9 @@ curl --request POST \
  Parameters specified in the **Begin** component.

 #### Response

 Success without `session_id` provided and with no parameters specified in the **Begin** component:

 ```json
 data:{
    "code": 0,
@@ -2641,7 +2657,9 @@ data:{
 }
 data:
 ```

 Success with parameters specified in the **Begin** component:

 ```json
 data:{
    "code": 0,
@@ -2979,6 +2997,79 @@ Failure:
    "message": "The agent doesn't own the session cbd31e52f73911ef93b232903b842af6"
 }
 ```

 ---

 ### Related Questions

 **POST** `/api/v1/conversation/related_questions`

 Generates five to ten alternative question strings from the user's original query to retrieve more relevant search results.

 :::tip NOTE
 The chat model dynamically determines the number of questions to generate based on the instruction, typically between five and ten.
 :::

 #### Request

 - Method: POST
 - URL: `/api/v1/conversation/related_questions`
 - Headers:
  - `'Content-Type: application/json'`
  - `'Authorization: Bearer <YOUR_API_KEY>'`
 - Body:
  - `"question"`: `string`

 ##### Request example

 ```bash
 curl --request POST \
     --url http://{address}/api/v1/conversation/related_questions \
     --header 'Content-Type: application/json' \
     --header 'Authorization: Bearer <YOUR_API_KEY>' \
     --data '
     {
          "question": "What are the key advantages of Neovim over Vim?"
     }'
 ```

 ##### Request Parameters

 - `"question"`: (*Body Parameter*), `string`
  The original user question.

 #### Response

 Success:

 ```json
 {
    "code": 0,
    "data": [
        "What makes Neovim superior to Vim in terms of features?",
        "How do the benefits of Neovim compare to those of Vim?",
        "What advantages does Neovim offer that are not present in Vim?",
        "In what ways does Neovim outperform Vim in functionality?",
        "What are the most significant improvements in Neovim compared to Vim?",
        "What unique advantages does Neovim bring to the table over Vim?",
        "How does the user experience in Neovim differ from Vim in terms of benefits?",
        "What are the top reasons to switch from Vim to Neovim?",
        "What features of Neovim are considered more advanced than those in Vim?"
    ],
    "message": "success"
 }
 ```

 Failure:

 ```json
 {
    "code": 401,
    "data": null,
    "message": "<Unauthorized '401: Unauthorized'>"
 }
 ```

 ---

 ## AGENT MANAGEMENT
@@ -3094,4 +3185,4 @@ Failure:
 }
 ```

 ---
 ---