您最多选择25个主题 主题必须以字母或数字开头,可以包含连字符 (-),并且长度不得超过35个字符

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643
  1. #
  2. # Copyright 2024 The InfiniFlow Authors. All Rights Reserved.
  3. #
  4. # Licensed under the Apache License, Version 2.0 (the "License");
  5. # you may not use this file except in compliance with the License.
  6. # You may obtain a copy of the License at
  7. #
  8. # http://www.apache.org/licenses/LICENSE-2.0
  9. #
  10. # Unless required by applicable law or agreed to in writing, software
  11. # distributed under the License is distributed on an "AS IS" BASIS,
  12. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. # See the License for the specific language governing permissions and
  14. # limitations under the License.
  15. #
  16. import json
  17. import os
  18. import re
  19. from datetime import datetime, timedelta
  20. from flask import request, Response
  21. from flask_login import login_required, current_user
  22. from api.db import FileType, ParserType, FileSource, LLMType
  23. from api.db.db_models import APIToken, API4Conversation, Task, File
  24. from api.db.services import duplicate_name
  25. from api.db.services.api_service import APITokenService, API4ConversationService
  26. from api.db.services.dialog_service import DialogService, chat
  27. from api.db.services.document_service import DocumentService
  28. from api.db.services.file2document_service import File2DocumentService
  29. from api.db.services.file_service import FileService
  30. from api.db.services.knowledgebase_service import KnowledgebaseService
  31. from api.db.services.llm_service import TenantLLMService
  32. from api.db.services.task_service import queue_tasks, TaskService
  33. from api.db.services.user_service import UserTenantService
  34. from api.settings import RetCode, retrievaler
  35. from api.utils import get_uuid, current_timestamp, datetime_format
  36. from api.utils.api_utils import server_error_response, get_data_error_result, get_json_result, validate_request
  37. from itsdangerous import URLSafeTimedSerializer
  38. from api.utils.file_utils import filename_type, thumbnail
  39. from rag.nlp import keyword_extraction
  40. from rag.utils.minio_conn import MINIO
  def generate_confirmation_token(tenent_id):
      """Build a new API token string for a tenant.

      A fresh UUID is signed by a ``URLSafeTimedSerializer`` that uses
      ``tenent_id`` both as its secret key and as the salt. Characters 2..33
      of the signed payload are kept and prefixed with ``"ragflow-"``.
      """
      signed_uuid = URLSafeTimedSerializer(tenent_id).dumps(get_uuid(), salt=tenent_id)
      return "ragflow-" + signed_uuid[2:34]
  @manager.route('/new_token', methods=['POST'])
  @validate_request("dialog_id")
  @login_required
  def new_token():
      """Create and persist an API token bound to a dialog.

      Reads ``dialog_id`` from the JSON body and uses the tenant of the first
      ``UserTenantService`` row found for the logged-in user. On success the
      saved token record is returned as JSON; any exception is converted with
      ``server_error_response``.
      """
      req = request.json
      try:
          tenants = UserTenantService.query(user_id=current_user.id)
          if not tenants:
              return get_data_error_result(retmsg="Tenant not found!")

          tenant_id = tenants[0].tenant_id
          obj = {
              "tenant_id": tenant_id,
              "token": generate_confirmation_token(tenant_id),
              "dialog_id": req["dialog_id"],
              "create_time": current_timestamp(),
              "create_date": datetime_format(datetime.now()),
              "update_time": None,
              "update_date": None,
          }
          if not APITokenService.save(**obj):
              # This endpoint stores a token, so the failure message must say so.
              return get_data_error_result(retmsg="Fail to new a token!")
          return get_json_result(data=obj)
      except Exception as e:
          return server_error_response(e)
  @manager.route('/token_list', methods=['GET'])
  @login_required
  def token_list():
      """List the API tokens of the current user's tenant for one dialog.

      The dialog is selected by the ``dialog_id`` query argument; each token
      record is returned via its ``to_dict()`` form.
      """
      try:
          tenants = UserTenantService.query(user_id=current_user.id)
          if tenants:
              tokens = APITokenService.query(
                  tenant_id=tenants[0].tenant_id,
                  dialog_id=request.args["dialog_id"])
              return get_json_result(data=[tok.to_dict() for tok in tokens])
          return get_data_error_result(retmsg="Tenant not found!")
      except Exception as e:
          return server_error_response(e)
  @manager.route('/rm', methods=['POST'])
  @validate_request("tokens", "tenant_id")
  @login_required
  def rm():
      """Delete the listed API tokens of a tenant.

      The JSON body carries ``tokens`` (an iterable of token strings) and
      ``tenant_id``; one delete is issued per token, matching on both fields.
      """
      payload = request.json
      try:
          for tok in payload["tokens"]:
              conditions = [
                  APIToken.tenant_id == payload["tenant_id"],
                  APIToken.token == tok,
              ]
              APITokenService.filter_delete(conditions)
          return get_json_result(data=True)
      except Exception as e:
          return server_error_response(e)
  @manager.route('/stats', methods=['GET'])
  @login_required
  def stats():
      """Return API conversation statistics for the current user's tenant.

      The ``from_date`` / ``to_date`` query arguments bound the window; they
      default to midnight seven days ago and to the current time. The response
      maps each metric name to a list of ``(dt, value)`` pairs built from the
      rows returned by ``API4ConversationService.stats``.
      """
      try:
          tenants = UserTenantService.query(user_id=current_user.id)
          if not tenants:
              return get_data_error_result(retmsg="Tenant not found!")

          now = datetime.now()
          # "24:00:00" is not a valid time of day, so the default window
          # starts at midnight instead.
          default_from = (now - timedelta(days=7)).strftime("%Y-%m-%d 00:00:00")
          default_to = now.strftime("%Y-%m-%d %H:%M:%S")
          objs = API4ConversationService.stats(
              tenants[0].tenant_id,
              request.args.get("from_date", default_from),
              request.args.get("to_date", default_to))

          res = {
              "pv": [(o["dt"], o["pv"]) for o in objs],
              "uv": [(o["dt"], o["uv"]) for o in objs],
              # Tokens per unit of duration; the 0.1 added to the duration
              # presumably guards against a zero divisor.
              "speed": [(o["dt"], float(o["tokens"]) / (float(o["duration"] + 0.1))) for o in objs],
              # Token counts are reported in thousands.
              "tokens": [(o["dt"], float(o["tokens"]) / 1000.) for o in objs],
              "round": [(o["dt"], o["round"]) for o in objs],
              "thumb_up": [(o["dt"], o["thumb_up"]) for o in objs],
          }
          return get_json_result(data=res)
      except Exception as e:
          return server_error_response(e)
  @manager.route('/new_conversation', methods=['GET'])
  def set_conversation():
      """Start a new API conversation for the dialog bound to the caller's token.

      The API token is the second whitespace-separated field of the
      ``Authorization`` header. The conversation is seeded with the dialog's
      prologue as the first assistant message, saved, read back and returned.
      The optional ``user_id`` query argument is stored on the conversation.
      """
      # A missing or malformed header must produce an authentication error
      # rather than an unhandled AttributeError/IndexError.
      auth = (request.headers.get('Authorization') or "").split()
      objs = APIToken.query(token=auth[1]) if len(auth) > 1 else None
      if not objs:
          return get_json_result(
              data=False, retmsg='Token is not valid!', retcode=RetCode.AUTHENTICATION_ERROR)

      # The request body is deliberately not read: this is a GET endpoint and
      # nothing below uses a JSON payload.
      try:
          e, dia = DialogService.get_by_id(objs[0].dialog_id)
          if not e:
              return get_data_error_result(retmsg="Dialog not found")

          conv = {
              "id": get_uuid(),
              "dialog_id": dia.id,
              "user_id": request.args.get("user_id", ""),
              "message": [{"role": "assistant", "content": dia.prompt_config["prologue"]}],
          }
          API4ConversationService.save(**conv)

          # Read the record back so the response reflects what was stored.
          e, conv = API4ConversationService.get_by_id(conv["id"])
          if not e:
              return get_data_error_result(retmsg="Fail to new a conversation!")
          return get_json_result(data=conv.to_dict())
      except Exception as e:
          return server_error_response(e)
  @manager.route('/completion', methods=['POST'])
  @validate_request("conversation_id", "messages")
  def completion():
      """Answer the latest message of an API conversation.

      The caller authenticates with an API token in the ``Authorization``
      header. ``messages`` is filtered (system messages and leading assistant
      messages are dropped) and handed to ``chat`` together with the remaining
      request fields. With ``stream`` truthy (the default) the answer is sent
      as server-sent events; otherwise the first answer produced by ``chat`` is
      returned as one JSON result. The conversation record is updated with the
      answer and its references in both modes.
      """
      # A missing or malformed header must produce an authentication error
      # rather than an unhandled AttributeError/IndexError.
      auth = (request.headers.get('Authorization') or "").split()
      if len(auth) < 2 or not APIToken.query(token=auth[1]):
          return get_json_result(
              data=False, retmsg='Token is not valid!', retcode=RetCode.AUTHENTICATION_ERROR)

      req = request.json
      e, conv = API4ConversationService.get_by_id(req["conversation_id"])
      if not e:
          return get_data_error_result(retmsg="Conversation not found!")
      if "quote" not in req:
          req["quote"] = False

      msg = []
      for m in req["messages"]:
          if m["role"] == "system":
              continue
          if m["role"] == "assistant" and not msg:
              continue
          msg.append({"role": m["role"], "content": m["content"]})
      if not msg:
          # Nothing usable was sent; report it instead of failing on msg[-1].
          return get_data_error_result(retmsg="No valid message found!")

      try:
          conv.message.append(msg[-1])
          e, dia = DialogService.get_by_id(conv.dialog_id)
          if not e:
              return get_data_error_result(retmsg="Dialog not found!")

          # Everything left in req is forwarded to chat() as keyword arguments.
          del req["conversation_id"]
          del req["messages"]
          # The stream flag is passed to chat() explicitly below; leaving it in
          # req as well would supply it twice (assuming chat's third positional
          # parameter is the stream flag -- TODO confirm against chat()).
          use_stream = req.pop("stream", True)

          if not conv.reference:
              conv.reference = []
          # Placeholders that fillin_conv() overwrites as answers arrive.
          conv.message.append({"role": "assistant", "content": ""})
          conv.reference.append({"chunks": [], "doc_aggs": []})

          def fillin_conv(ans):
              """Store the latest answer and its reference on the conversation."""
              if not conv.reference:
                  conv.reference.append(ans["reference"])
              else:
                  conv.reference[-1] = ans["reference"]
              conv.message[-1] = {"role": "assistant", "content": ans["answer"]}

          def rename_field(ans):
              """Expose each chunk's ``docnm_kwd`` as ``doc_name`` in the answer."""
              reference = ans['reference']
              if not isinstance(reference, dict):
                  return
              for chunk_i in reference.get('chunks', []):
                  if 'docnm_kwd' in chunk_i:
                      chunk_i['doc_name'] = chunk_i.pop('docnm_kwd')

          def stream():
              """Yield server-sent events for each partial answer, then a final marker."""
              try:
                  for ans in chat(dia, msg, True, **req):
                      fillin_conv(ans)
                      rename_field(ans)
                      yield "data:" + json.dumps({"retcode": 0, "retmsg": "", "data": ans}, ensure_ascii=False) + "\n\n"
                  API4ConversationService.append_message(conv.id, conv.to_dict())
              except Exception as e:
                  yield "data:" + json.dumps({"retcode": 500, "retmsg": str(e),
                                              "data": {"answer": "**ERROR**: " + str(e), "reference": []}},
                                             ensure_ascii=False) + "\n\n"
              yield "data:" + json.dumps({"retcode": 0, "retmsg": "", "data": True}, ensure_ascii=False) + "\n\n"

          if use_stream:
              resp = Response(stream(), mimetype="text/event-stream")
              resp.headers.add_header("Cache-control", "no-cache")
              resp.headers.add_header("Connection", "keep-alive")
              resp.headers.add_header("X-Accel-Buffering", "no")
              resp.headers.add_header("Content-Type", "text/event-stream; charset=utf-8")
              return resp

          answer = None
          # Only the first answer produced by chat() is used in one-shot mode.
          for ans in chat(dia, msg, stream=False, **req):
              answer = ans
              fillin_conv(ans)
              API4ConversationService.append_message(conv.id, conv.to_dict())
              break
          rename_field(answer)
          return get_json_result(data=answer)
      except Exception as e:
          return server_error_response(e)
  @manager.route('/conversation/<conversation_id>', methods=['GET'])
  # @login_required
  def get(conversation_id):
      """Return one API conversation as a dict.

      In every reference chunk the ``docnm_kwd`` key is exposed as
      ``doc_name``. A conversation without references (``None`` or empty) and
      references without a ``chunks`` entry are returned unchanged instead of
      ending in a server error.
      """
      try:
          e, conv = API4ConversationService.get_by_id(conversation_id)
          if not e:
              return get_data_error_result(retmsg="Conversation not found!")

          conv = conv.to_dict()
          for reference in conv.get('reference') or []:
              if not reference:
                  continue
              for chunk in reference.get('chunks', []):
                  if 'docnm_kwd' in chunk:
                      chunk['doc_name'] = chunk.pop('docnm_kwd')
          return get_json_result(data=conv)
      except Exception as e:
          return server_error_response(e)
  @manager.route('/document/upload', methods=['POST'])
  @validate_request("kb_name")
  def upload():
      """Upload one file into a knowledge base of the token's tenant.

      Form fields: ``kb_name`` (required), ``parser_id`` (optional parser
      override) and ``run`` (``"1"`` queues parsing right after the upload).
      The file is read from the ``file`` part, stored through ``MINIO``,
      recorded as a document plus a file entry, and the inserted document is
      returned as JSON.
      """
      # A missing or malformed header must produce an authentication error
      # rather than an unhandled AttributeError/IndexError.
      auth = (request.headers.get('Authorization') or "").split()
      objs = APIToken.query(token=auth[1]) if len(auth) > 1 else None
      if not objs:
          return get_json_result(
              data=False, retmsg='Token is not valid!', retcode=RetCode.AUTHENTICATION_ERROR)

      # A missing form field falls through to the "can't find" answer below
      # instead of failing on None.strip().
      kb_name = (request.form.get("kb_name") or "").strip()
      tenant_id = objs[0].tenant_id

      try:
          e, kb = KnowledgebaseService.get_by_name(kb_name, tenant_id)
          if not e:
              return get_data_error_result(
                  retmsg="Can't find this knowledgebase!")
          kb_id = kb.id
      except Exception as e:
          return server_error_response(e)

      if 'file' not in request.files:
          return get_json_result(
              data=False, retmsg='No file part!', retcode=RetCode.ARGUMENT_ERROR)

      upload_file = request.files['file']
      if upload_file.filename == '':
          return get_json_result(
              data=False, retmsg='No file selected!', retcode=RetCode.ARGUMENT_ERROR)

      # Make sure the tenant's folder structure for knowledge-base files exists.
      root_folder = FileService.get_root_folder(tenant_id)
      pf_id = root_folder["id"]
      FileService.init_knowledgebase_docs(pf_id, tenant_id)
      kb_root_folder = FileService.get_kb_folder(tenant_id)
      kb_folder = FileService.new_a_file_from_kb(kb.tenant_id, kb.name, kb_root_folder["id"])

      try:
          if DocumentService.get_doc_count(kb.tenant_id) >= int(os.environ.get('MAX_FILE_NUM_PER_USER', 8192)):
              return get_data_error_result(
                  retmsg="Exceed the maximum file number of a free user!")

          filename = duplicate_name(
              DocumentService.query,
              name=upload_file.filename,
              kb_id=kb_id)
          filetype = filename_type(filename)
          if not filetype:
              return get_data_error_result(
                  retmsg="This type of file has not been supported yet!")

          # Append underscores until the storage location is unused.
          location = filename
          while MINIO.obj_exist(kb_id, location):
              location += "_"
          blob = upload_file.read()
          MINIO.put(kb_id, location, blob)

          doc = {
              "id": get_uuid(),
              "kb_id": kb.id,
              "parser_id": kb.parser_id,
              "parser_config": kb.parser_config,
              "created_by": kb.tenant_id,
              "type": filetype,
              "name": filename,
              "location": location,
              "size": len(blob),
              "thumbnail": thumbnail(filename, blob)
          }

          form_data = request.form
          requested_parser = form_data.get("parser_id")
          if requested_parser is not None:
              requested_parser = requested_parser.strip()
              # NOTE(review): the [1:-3] slice presumably skips non-member
              # entries of vars(ParserType); verify whenever the enum changes.
              if requested_parser in list(vars(ParserType).values())[1:-3]:
                  doc["parser_id"] = requested_parser

          # File-type specific parsers take precedence over the choice above.
          if doc["type"] == FileType.VISUAL:
              doc["parser_id"] = ParserType.PICTURE.value
          if doc["type"] == FileType.AURAL:
              doc["parser_id"] = ParserType.AUDIO.value
          if re.search(r"\.(ppt|pptx|pages)$", filename):
              doc["parser_id"] = ParserType.PRESENTATION.value

          doc_result = DocumentService.insert(doc)
          FileService.add_file_from_kb(doc, kb_folder["id"], kb.tenant_id)
      except Exception as e:
          return server_error_response(e)

      if form_data.get("run", "").strip() == "1":
          try:
              # Reset progress counters, drop old tasks and queue a new parse.
              info = {
                  "run": 1,
                  "progress": 0,
                  "progress_msg": "",
                  "chunk_num": 0,
                  "token_num": 0,
              }
              DocumentService.update_by_id(doc["id"], info)
              tenant_id = DocumentService.get_tenant_id(doc["id"])
              if not tenant_id:
                  return get_data_error_result(retmsg="Tenant not found!")
              TaskService.filter_delete([Task.doc_id == doc["id"]])
              e, doc = DocumentService.get_by_id(doc["id"])
              doc = doc.to_dict()
              doc["tenant_id"] = tenant_id
              bucket, name = File2DocumentService.get_minio_address(doc_id=doc["id"])
              queue_tasks(doc, bucket, name)
          except Exception as e:
              return server_error_response(e)

      return get_json_result(data=doc_result.to_json())
  @manager.route('/list_chunks', methods=['POST'])
  # @login_required
  def list_chunks():
      """List the chunks of one document.

      The caller authenticates with an API token in the ``Authorization``
      header and selects the document with ``doc_name`` or ``doc_id`` in the
      JSON body (``doc_name`` wins when both are present). Each chunk is
      returned with its ``content``, ``doc_name`` and ``img_id``.
      """
      # A missing or malformed header must produce an authentication error
      # rather than an unhandled AttributeError/IndexError.
      auth = (request.headers.get('Authorization') or "").split()
      objs = APIToken.query(token=auth[1]) if len(auth) > 1 else None
      if not objs:
          return get_json_result(
              data=False, retmsg='Token is not valid!', retcode=RetCode.AUTHENTICATION_ERROR)

      req = request.json
      try:
          if "doc_name" in req:
              tenant_id = DocumentService.get_tenant_id_by_name(req['doc_name'])
              doc_id = DocumentService.get_doc_id_by_doc_name(req['doc_name'])
          elif "doc_id" in req:
              tenant_id = DocumentService.get_tenant_id(req['doc_id'])
              doc_id = req['doc_id']
          else:
              return get_json_result(
                  data=False, retmsg="Can't find doc_name or doc_id"
              )

          chunks = retrievaler.chunk_list(doc_id=doc_id, tenant_id=tenant_id)
          res = [
              {
                  "content": chunk["content_with_weight"],
                  "doc_name": chunk["docnm_kwd"],
                  "img_id": chunk["img_id"]
              } for chunk in chunks
          ]
      except Exception as e:
          return server_error_response(e)

      return get_json_result(data=res)
  @manager.route('/list_kb_docs', methods=['POST'])
  # @login_required
  def list_kb_docs():
      """List the documents of a knowledge base owned by the token's tenant.

      JSON body: ``kb_name`` plus the optional ``page`` (default 1),
      ``page_size`` (15), ``orderby`` (``"create_time"``), ``desc`` (True) and
      ``keywords`` (""). Returns the total count and, for the requested page,
      the ``doc_id`` and ``doc_name`` of each document.
      """
      # A missing or malformed header must produce an authentication error
      # rather than an unhandled AttributeError/IndexError.
      auth = (request.headers.get('Authorization') or "").split()
      objs = APIToken.query(token=auth[1]) if len(auth) > 1 else None
      if not objs:
          return get_json_result(
              data=False, retmsg='Token is not valid!', retcode=RetCode.AUTHENTICATION_ERROR)

      req = request.json
      tenant_id = objs[0].tenant_id
      kb_name = req.get("kb_name", "").strip()

      try:
          e, kb = KnowledgebaseService.get_by_name(kb_name, tenant_id)
          if not e:
              return get_data_error_result(
                  retmsg="Can't find this knowledgebase!")
          kb_id = kb.id
      except Exception as e:
          return server_error_response(e)

      try:
          # Converted inside the try so a non-numeric page or page_size is
          # reported through server_error_response instead of escaping.
          page_number = int(req.get("page", 1))
          items_per_page = int(req.get("page_size", 15))
          orderby = req.get("orderby", "create_time")
          desc = req.get("desc", True)
          keywords = req.get("keywords", "")

          docs, tol = DocumentService.get_by_kb_id(
              kb_id, page_number, items_per_page, orderby, desc, keywords)
          docs = [{"doc_id": doc['id'], "doc_name": doc['name']} for doc in docs]
          return get_json_result(data={"total": tol, "docs": docs})
      except Exception as e:
          return server_error_response(e)
  @manager.route('/document', methods=['DELETE'])
  # @login_required
  def document_rm():
      """Delete documents selected by name and/or id.

      JSON body: ``doc_names`` and/or ``doc_ids``. Names are resolved to ids
      first, then ids not already present are appended. For each document the
      database record, the linked knowledge-base file entry, the
      file-to-document link and the stored object are removed. Exceptions
      raised for individual documents are collected and reported together at
      the end.
      """
      # A missing or malformed header must produce an authentication error
      # rather than an unhandled AttributeError/IndexError.
      auth = (request.headers.get('Authorization') or "").split()
      objs = APIToken.query(token=auth[1]) if len(auth) > 1 else None
      if not objs:
          return get_json_result(
              data=False, retmsg='Token is not valid!', retcode=RetCode.AUTHENTICATION_ERROR)

      tenant_id = objs[0].tenant_id
      req = request.json
      try:
          doc_ids = [DocumentService.get_doc_id_by_doc_name(doc_name) for doc_name in req.get("doc_names", [])]
          for doc_id in req.get("doc_ids", []):
              if doc_id not in doc_ids:
                  doc_ids.append(doc_id)

          if not doc_ids:
              return get_json_result(
                  data=False, retmsg="Can't find doc_names or doc_ids"
              )
      except Exception as e:
          return server_error_response(e)

      root_folder = FileService.get_root_folder(tenant_id)
      pf_id = root_folder["id"]
      FileService.init_knowledgebase_docs(pf_id, tenant_id)

      # Collected as a list so that an exception whose message is empty still
      # counts as a failure.
      errors = []
      for doc_id in doc_ids:
          try:
              e, doc = DocumentService.get_by_id(doc_id)
              if not e:
                  return get_data_error_result(retmsg="Document not found!")
              tenant_id = DocumentService.get_tenant_id(doc_id)
              if not tenant_id:
                  return get_data_error_result(retmsg="Tenant not found!")

              # Resolve the storage address before the records are removed.
              b, n = File2DocumentService.get_minio_address(doc_id=doc_id)

              if not DocumentService.remove_document(doc, tenant_id):
                  return get_data_error_result(
                      retmsg="Database error (Document removal)!")

              f2d = File2DocumentService.get_by_document_id(doc_id)
              FileService.filter_delete([File.source_type == FileSource.KNOWLEDGEBASE, File.id == f2d[0].file_id])
              File2DocumentService.delete_by_document_id(doc_id)

              MINIO.rm(b, n)
          except Exception as e:
              errors.append(str(e))

      if errors:
          return get_json_result(data=False, retmsg="".join(errors), retcode=RetCode.SERVER_ERROR)

      return get_json_result(data=True)
  @manager.route('/completion_aibotk', methods=['POST'])
  @validate_request("Authorization", "conversation_id", "word")
  def completion_faq():
      """Answer a single question and return it in a ``code``/``msg``/``data`` envelope.

      The API token is read from the ``Authorization`` field of the JSON body
      and the question from ``word``. The first answer produced by ``chat`` is
      returned as a text item (``type`` 1) with the ``##<digit>$$`` citation
      markers removed. If the first cited chunk has an image, the image is
      appended base64-encoded as a ``type`` 3 item.
      """
      import base64
      req = request.json

      token = req["Authorization"]
      objs = APIToken.query(token=token)
      if not objs:
          return get_json_result(
              data=False, retmsg='Token is not valid!', retcode=RetCode.AUTHENTICATION_ERROR)

      e, conv = API4ConversationService.get_by_id(req["conversation_id"])
      if not e:
          return get_data_error_result(retmsg="Conversation not found!")
      if "quote" not in req:
          req["quote"] = True

      msg = [{"role": "user", "content": req["word"]}]

      try:
          conv.message.append(msg[-1])
          e, dia = DialogService.get_by_id(conv.dialog_id)
          if not e:
              return get_data_error_result(retmsg="Dialog not found!")
          del req["conversation_id"]
          # chat() is called with an explicit stream=False below; a "stream"
          # key left in req would supply the same keyword twice (TypeError).
          req.pop("stream", None)

          if not conv.reference:
              conv.reference = []
          # Placeholders that fillin_conv() overwrites with the answer.
          conv.message.append({"role": "assistant", "content": ""})
          conv.reference.append({"chunks": [], "doc_aggs": []})

          def fillin_conv(ans):
              """Store the answer and its reference on the conversation."""
              if not conv.reference:
                  conv.reference.append(ans["reference"])
              else:
                  conv.reference[-1] = ans["reference"]
              conv.message[-1] = {"role": "assistant", "content": ans["answer"]}

          data_type_picture = {
              "type": 3,
              "url": "base64 content"
          }
          data = [
              {
                  "type": 1,
                  "content": ""
              }
          ]

          ans = ""
          # Only the first answer produced by chat() is used.
          for a in chat(dia, msg, stream=False, **req):
              ans = a
              break

          data[0]["content"] += re.sub(r'##\d\$\$', '', ans["answer"])
          fillin_conv(ans)
          API4ConversationService.append_message(conv.id, conv.to_dict())

          # Each marker looks like "##3$$"; character 2 is the chunk index.
          chunk_idxs = [int(match[2]) for match in re.findall(r'##\d\$\$', ans["answer"])]
          for chunk_idx in chunk_idxs[:1]:
              if ans["reference"]["chunks"][chunk_idx]["img_id"]:
                  try:
                      bkt, nm = ans["reference"]["chunks"][chunk_idx]["img_id"].split("-")
                      response = MINIO.get(bkt, nm)
                      data_type_picture["url"] = base64.b64encode(response).decode('utf-8')
                      data.append(data_type_picture)
                      break
                  except Exception as e:
                      return server_error_response(e)

          response = {"code": 200, "msg": "success", "data": data}
          return response

      except Exception as e:
          return server_error_response(e)
  @manager.route('/retrieval', methods=['POST'])
  @validate_request("kb_id", "question")
  def retrieval():
      """Retrieve the chunks of one knowledge base that match a question.

      JSON body: ``kb_id`` and ``question`` (required); optional ``doc_ids``,
      ``page`` (default 1), ``size`` (30), ``similarity_threshold`` (0.2),
      ``vector_similarity_weight`` (0.3), ``top_k`` (1024), ``rerank_id`` and
      ``keyword``. When ``keyword`` is truthy the output of
      ``keyword_extraction`` is appended to the question before searching.
      The ``vector`` field is removed from every returned chunk.
      """
      # A missing or malformed header must produce an authentication error
      # rather than an unhandled AttributeError/IndexError.
      auth = (request.headers.get('Authorization') or "").split()
      objs = APIToken.query(token=auth[1]) if len(auth) > 1 else None
      if not objs:
          return get_json_result(
              data=False, retmsg='Token is not valid!', retcode=RetCode.AUTHENTICATION_ERROR)

      req = request.json
      kb_id = req.get("kb_id")
      doc_ids = req.get("doc_ids", [])
      question = req.get("question")

      try:
          # Converted inside the try so non-numeric values are reported
          # through server_error_response instead of escaping the handler.
          page = int(req.get("page", 1))
          size = int(req.get("size", 30))
          similarity_threshold = float(req.get("similarity_threshold", 0.2))
          vector_similarity_weight = float(req.get("vector_similarity_weight", 0.3))
          top = int(req.get("top_k", 1024))

          e, kb = KnowledgebaseService.get_by_id(kb_id)
          if not e:
              return get_data_error_result(retmsg="Knowledgebase not found!")

          embd_mdl = TenantLLMService.model_instance(
              kb.tenant_id, LLMType.EMBEDDING.value, llm_name=kb.embd_id)

          rerank_mdl = None
          if req.get("rerank_id"):
              rerank_mdl = TenantLLMService.model_instance(
                  kb.tenant_id, LLMType.RERANK.value, llm_name=req["rerank_id"])

          if req.get("keyword", False):
              chat_mdl = TenantLLMService.model_instance(kb.tenant_id, LLMType.CHAT)
              question += keyword_extraction(chat_mdl, question)

          ranks = retrievaler.retrieval(question, embd_mdl, kb.tenant_id, [kb_id], page, size,
                                        similarity_threshold, vector_similarity_weight, top,
                                        doc_ids, rerank_mdl=rerank_mdl)
          for c in ranks["chunks"]:
              c.pop("vector", None)
          return get_json_result(data=ranks)
      except Exception as e:
          # Membership test: find(...) > 0 would miss a message that starts
          # with "not_found".
          if "not_found" in str(e):
              return get_json_result(data=False, retmsg='No chunk found! Check the chunk status please!',
                                     retcode=RetCode.DATA_ERROR)
          return server_error_response(e)