您最多选择25个主题 主题必须以字母或数字开头,可以包含连字符 (-),并且长度不得超过35个字符

ops_trace_manager.py 32KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847
  1. import json
  2. import logging
  3. import os
  4. import queue
  5. import threading
  6. import time
  7. from datetime import timedelta
  8. from typing import Any, Optional, Union
  9. from uuid import UUID, uuid4
  10. from cachetools import LRUCache
  11. from flask import current_app
  12. from sqlalchemy import select
  13. from sqlalchemy.orm import Session
  14. from core.helper.encrypter import decrypt_token, encrypt_token, obfuscated_token
  15. from core.ops.entities.config_entity import (
  16. OPS_FILE_PATH,
  17. TracingProviderEnum,
  18. )
  19. from core.ops.entities.trace_entity import (
  20. DatasetRetrievalTraceInfo,
  21. GenerateNameTraceInfo,
  22. MessageTraceInfo,
  23. ModerationTraceInfo,
  24. SuggestedQuestionTraceInfo,
  25. TaskData,
  26. ToolTraceInfo,
  27. TraceTaskName,
  28. WorkflowTraceInfo,
  29. )
  30. from core.ops.utils import get_message_data
  31. from extensions.ext_database import db
  32. from extensions.ext_storage import storage
  33. from models.model import App, AppModelConfig, Conversation, Message, MessageFile, TraceAppConfig
  34. from models.workflow import WorkflowAppLog, WorkflowRun
  35. from tasks.ops_trace_task import process_trace_tasks
  36. class OpsTraceProviderConfigMap(dict[str, dict[str, Any]]):
  37. def __getitem__(self, provider: str) -> dict[str, Any]:
  38. match provider:
  39. case TracingProviderEnum.LANGFUSE:
  40. from core.ops.entities.config_entity import LangfuseConfig
  41. from core.ops.langfuse_trace.langfuse_trace import LangFuseDataTrace
  42. return {
  43. "config_class": LangfuseConfig,
  44. "secret_keys": ["public_key", "secret_key"],
  45. "other_keys": ["host", "project_key"],
  46. "trace_instance": LangFuseDataTrace,
  47. }
  48. case TracingProviderEnum.LANGSMITH:
  49. from core.ops.entities.config_entity import LangSmithConfig
  50. from core.ops.langsmith_trace.langsmith_trace import LangSmithDataTrace
  51. return {
  52. "config_class": LangSmithConfig,
  53. "secret_keys": ["api_key"],
  54. "other_keys": ["project", "endpoint"],
  55. "trace_instance": LangSmithDataTrace,
  56. }
  57. case TracingProviderEnum.OPIK:
  58. from core.ops.entities.config_entity import OpikConfig
  59. from core.ops.opik_trace.opik_trace import OpikDataTrace
  60. return {
  61. "config_class": OpikConfig,
  62. "secret_keys": ["api_key"],
  63. "other_keys": ["project", "url", "workspace"],
  64. "trace_instance": OpikDataTrace,
  65. }
  66. case TracingProviderEnum.WEAVE:
  67. from core.ops.entities.config_entity import WeaveConfig
  68. from core.ops.weave_trace.weave_trace import WeaveDataTrace
  69. return {
  70. "config_class": WeaveConfig,
  71. "secret_keys": ["api_key"],
  72. "other_keys": ["project", "entity", "endpoint"],
  73. "trace_instance": WeaveDataTrace,
  74. }
  75. case _:
  76. raise KeyError(f"Unsupported tracing provider: {provider}")
  77. provider_config_map: dict[str, dict[str, Any]] = OpsTraceProviderConfigMap()
  class OpsTraceManager:
      """Helpers for storing, loading and using per-app tracing configuration.

      Every method is a class or static method; the only state is the
      class-level cache of trace client instances.
      """

      # Trace client instances keyed by the string form of their decrypted config.
      ops_trace_instances_cache: LRUCache = LRUCache(maxsize=128)

      @classmethod
      def encrypt_tracing_config(
          cls, tenant_id: str, tracing_provider: str, tracing_config: dict, current_trace_config=None
      ):
          """
          Encrypt tracing config.

          :param tenant_id: tenant id
          :param tracing_provider: tracing provider
          :param tracing_config: tracing config dictionary to be encrypted
          :param current_trace_config: current tracing configuration whose values are kept for
              secret fields submitted with a ``*`` in them; may be None
          :return: encrypted tracing configuration (``model_dump()`` of the provider config class)
          :raises KeyError: if the tracing provider is not supported
          """
          provider_entry = provider_config_map[tracing_provider]
          # The parameter defaults to None; treat that as "nothing to retain"
          # instead of failing with AttributeError on ``None.get``.
          existing_config = current_trace_config or {}

          new_config = {}
          for key in provider_entry["secret_keys"]:
              if key not in tracing_config:
                  continue
              submitted = tracing_config[key]
              if "*" in submitted:
                  # A value containing '*' is not re-encrypted: keep the stored
                  # value, falling back to the submitted one if none exists.
                  new_config[key] = existing_config.get(key, submitted)
              else:
                  new_config[key] = encrypt_token(tenant_id, submitted)
          for key in provider_entry["other_keys"]:
              new_config[key] = tracing_config.get(key, "")

          # Round-trip through the config class so the result is validated by it.
          return provider_entry["config_class"](**new_config).model_dump()

      @classmethod
      def decrypt_tracing_config(cls, tenant_id: str, tracing_provider: str, tracing_config: dict):
          """
          Decrypt tracing config.

          :param tenant_id: tenant id
          :param tracing_provider: tracing provider
          :param tracing_config: stored tracing config
          :return: config dict with the provider's secret fields decrypted
          :raises KeyError: if the tracing provider is not supported
          """
          provider_entry = provider_config_map[tracing_provider]
          new_config = {
              key: decrypt_token(tenant_id, tracing_config[key])
              for key in provider_entry["secret_keys"]
              if key in tracing_config
          }
          for key in provider_entry["other_keys"]:
              new_config[key] = tracing_config.get(key, "")
          return provider_entry["config_class"](**new_config).model_dump()

      @classmethod
      def obfuscated_decrypt_token(cls, tracing_provider: str, decrypt_tracing_config: dict):
          """
          Obfuscate the secret fields of a decrypted tracing config.

          :param tracing_provider: tracing provider
          :param decrypt_tracing_config: decrypted tracing config
          :return: config dict with the provider's secret fields passed through ``obfuscated_token``
          :raises KeyError: if the tracing provider is not supported
          """
          provider_entry = provider_config_map[tracing_provider]
          new_config = {
              key: obfuscated_token(decrypt_tracing_config[key])
              for key in provider_entry["secret_keys"]
              if key in decrypt_tracing_config
          }
          for key in provider_entry["other_keys"]:
              new_config[key] = decrypt_tracing_config.get(key, "")
          return provider_entry["config_class"](**new_config).model_dump()

      @classmethod
      def get_decrypted_tracing_config(cls, app_id: str, tracing_provider: str):
          """
          Get decrypted tracing config.

          :param app_id: app id
          :param tracing_provider: tracing provider
          :return: decrypted config dict, or None when the app has no config for this provider
          :raises ValueError: if a config exists but the app itself is not found
          """
          trace_config_data: Optional[TraceAppConfig] = (
              db.session.query(TraceAppConfig)
              .filter(TraceAppConfig.app_id == app_id, TraceAppConfig.tracing_provider == tracing_provider)
              .first()
          )
          if not trace_config_data:
              return None

          # The tenant id needed for decryption is taken from the owning app.
          app = db.session.query(App).filter(App.id == app_id).first()
          if not app:
              raise ValueError("App not found")

          return cls.decrypt_tracing_config(app.tenant_id, tracing_provider, trace_config_data.tracing_config)

      @classmethod
      def get_ops_trace_instance(
          cls,
          app_id: Optional[Union[UUID, str]] = None,
      ):
          """
          Get the trace client for an app, based on the app's tracing settings.

          :param app_id: app id
          :return: trace client instance, or None when there is no app, tracing is not
              enabled, the provider is missing/unsupported, or no config is stored
          """
          if isinstance(app_id, UUID):
              app_id = str(app_id)
          if app_id is None:
              return None

          app: Optional[App] = db.session.query(App).filter(App.id == app_id).first()
          if app is None:
              return None

          app_ops_trace_config = json.loads(app.tracing) if app.tracing else None
          if app_ops_trace_config is None:
              return None
          if not app_ops_trace_config.get("enabled"):
              return None

          tracing_provider = app_ops_trace_config.get("tracing_provider")
          if tracing_provider is None:
              return None
          # Look the provider up instead of testing ``in``: the provider map
          # builds entries on access, so a plain membership test on it cannot be
          # relied on to recognise supported providers.
          try:
              provider_entry = provider_config_map[tracing_provider]
          except KeyError:
              return None

          decrypt_trace_config = cls.get_decrypted_tracing_config(app_id, tracing_provider)
          if not decrypt_trace_config:
              return None

          trace_instance = provider_entry["trace_instance"]
          config_class = provider_entry["config_class"]

          decrypt_trace_config_key = str(decrypt_trace_config)
          tracing_instance = cls.ops_trace_instances_cache.get(decrypt_trace_config_key)
          if tracing_instance is None:
              # Not cached yet: build the client and remember it for this config.
              tracing_instance = trace_instance(config_class(**decrypt_trace_config))
              cls.ops_trace_instances_cache[decrypt_trace_config_key] = tracing_instance
              logging.info("new tracing_instance for app_id: %s", app_id)
          return tracing_instance

      @classmethod
      def get_app_config_through_message_id(cls, message_id: str):
          """
          Find the model config that applies to a message's conversation.

          :param message_id: message id
          :return: the ``AppModelConfig`` referenced by the conversation, else the conversation's
              ``override_model_configs`` when set, else None (also None when the message or
              conversation does not exist)
          """
          message_data = db.session.query(Message).filter(Message.id == message_id).first()
          if not message_data:
              return None

          conversation_data = (
              db.session.query(Conversation).filter(Conversation.id == message_data.conversation_id).first()
          )
          if not conversation_data:
              return None

          app_model_config = None
          if conversation_data.app_model_config_id:
              app_model_config = (
                  db.session.query(AppModelConfig)
                  .filter(AppModelConfig.id == conversation_data.app_model_config_id)
                  .first()
              )
          elif conversation_data.app_model_config_id is None and conversation_data.override_model_configs:
              app_model_config = conversation_data.override_model_configs
          return app_model_config

      @classmethod
      def update_app_tracing_config(cls, app_id: str, enabled: bool, tracing_provider: str):
          """
          Update app tracing config.

          :param app_id: app id
          :param enabled: enabled
          :param tracing_provider: tracing provider; None is accepted and stored as-is
          :return: None
          :raises ValueError: if the provider is not supported or the app is not found
          """
          if tracing_provider is not None:
              # Validate by lookup rather than ``in``: the provider map builds
              # entries on access, so a membership test would reject every
              # provider, including the supported ones.
              try:
                  provider_config_map[tracing_provider]
              except KeyError as err:
                  raise ValueError(f"Invalid tracing provider: {tracing_provider}") from err

          app_config: Optional[App] = db.session.query(App).filter(App.id == app_id).first()
          if not app_config:
              raise ValueError("App not found")

          app_config.tracing = json.dumps(
              {
                  "enabled": enabled,
                  "tracing_provider": tracing_provider,
              }
          )
          db.session.commit()

      @classmethod
      def get_app_tracing_config(cls, app_id: str):
          """
          Get app tracing config.

          :param app_id: app id
          :return: the parsed ``tracing`` JSON of the app, or a disabled default when unset
          :raises ValueError: if the app is not found
          """
          app: Optional[App] = db.session.query(App).filter(App.id == app_id).first()
          if not app:
              raise ValueError("App not found")
          if not app.tracing:
              return {"enabled": False, "tracing_provider": None}
          return json.loads(app.tracing)

      @staticmethod
      def _build_trace_instance(tracing_config: dict, tracing_provider: str):
          """Instantiate the provider's trace client from a plain config dict."""
          provider_entry = provider_config_map[tracing_provider]
          config = provider_entry["config_class"](**tracing_config)
          return provider_entry["trace_instance"](config)

      @staticmethod
      def check_trace_config_is_effective(tracing_config: dict, tracing_provider: str):
          """
          Check trace config is effective.

          :param tracing_config: tracing config
          :param tracing_provider: tracing provider
          :return: result of the trace client's ``api_check()``
          :raises KeyError: if the tracing provider is not supported
          """
          return OpsTraceManager._build_trace_instance(tracing_config, tracing_provider).api_check()

      @staticmethod
      def get_trace_config_project_key(tracing_config: dict, tracing_provider: str):
          """
          Get the project key for a trace config.

          :param tracing_config: tracing config
          :param tracing_provider: tracing provider
          :return: result of the trace client's ``get_project_key()``
          :raises KeyError: if the tracing provider is not supported
          """
          return OpsTraceManager._build_trace_instance(tracing_config, tracing_provider).get_project_key()

      @staticmethod
      def get_trace_config_project_url(tracing_config: dict, tracing_provider: str):
          """
          Get the project url for a trace config.

          :param tracing_config: tracing config
          :param tracing_provider: tracing provider
          :return: result of the trace client's ``get_project_url()``
          :raises KeyError: if the tracing provider is not supported
          """
          return OpsTraceManager._build_trace_instance(tracing_config, tracing_provider).get_project_url()
  316. class TraceTask:
  317. def __init__(
  318. self,
  319. trace_type: Any,
  320. message_id: Optional[str] = None,
  321. workflow_run: Optional[WorkflowRun] = None,
  322. conversation_id: Optional[str] = None,
  323. user_id: Optional[str] = None,
  324. timer: Optional[Any] = None,
  325. **kwargs,
  326. ):
  327. self.trace_type = trace_type
  328. self.message_id = message_id
  329. self.workflow_run_id = workflow_run.id if workflow_run else None
  330. self.conversation_id = conversation_id
  331. self.user_id = user_id
  332. self.timer = timer
  333. self.file_base_url = os.getenv("FILES_URL", "http://127.0.0.1:5001")
  334. self.app_id = None
  335. self.kwargs = kwargs
  336. def execute(self):
  337. return self.preprocess()
  338. def preprocess(self):
  339. preprocess_map = {
  340. TraceTaskName.CONVERSATION_TRACE: lambda: self.conversation_trace(**self.kwargs),
  341. TraceTaskName.WORKFLOW_TRACE: lambda: self.workflow_trace(
  342. workflow_run_id=self.workflow_run_id, conversation_id=self.conversation_id, user_id=self.user_id
  343. ),
  344. TraceTaskName.MESSAGE_TRACE: lambda: self.message_trace(message_id=self.message_id),
  345. TraceTaskName.MODERATION_TRACE: lambda: self.moderation_trace(
  346. message_id=self.message_id, timer=self.timer, **self.kwargs
  347. ),
  348. TraceTaskName.SUGGESTED_QUESTION_TRACE: lambda: self.suggested_question_trace(
  349. message_id=self.message_id, timer=self.timer, **self.kwargs
  350. ),
  351. TraceTaskName.DATASET_RETRIEVAL_TRACE: lambda: self.dataset_retrieval_trace(
  352. message_id=self.message_id, timer=self.timer, **self.kwargs
  353. ),
  354. TraceTaskName.TOOL_TRACE: lambda: self.tool_trace(
  355. message_id=self.message_id, timer=self.timer, **self.kwargs
  356. ),
  357. TraceTaskName.GENERATE_NAME_TRACE: lambda: self.generate_name_trace(
  358. conversation_id=self.conversation_id, timer=self.timer, **self.kwargs
  359. ),
  360. }
  361. return preprocess_map.get(self.trace_type, lambda: None)()
  362. # process methods for different trace types
  363. def conversation_trace(self, **kwargs):
  364. return kwargs
  365. def workflow_trace(
  366. self,
  367. *,
  368. workflow_run_id: str | None,
  369. conversation_id: str | None,
  370. user_id: str | None,
  371. ):
  372. if not workflow_run_id:
  373. return {}
  374. with Session(db.engine) as session:
  375. workflow_run_stmt = select(WorkflowRun).where(WorkflowRun.id == workflow_run_id)
  376. workflow_run = session.scalars(workflow_run_stmt).first()
  377. if not workflow_run:
  378. raise ValueError("Workflow run not found")
  379. workflow_id = workflow_run.workflow_id
  380. tenant_id = workflow_run.tenant_id
  381. workflow_run_id = workflow_run.id
  382. workflow_run_elapsed_time = workflow_run.elapsed_time
  383. workflow_run_status = workflow_run.status
  384. workflow_run_inputs = workflow_run.inputs_dict
  385. workflow_run_outputs = workflow_run.outputs_dict
  386. workflow_run_version = workflow_run.version
  387. error = workflow_run.error or ""
  388. total_tokens = workflow_run.total_tokens
  389. file_list = workflow_run_inputs.get("sys.file") or []
  390. query = workflow_run_inputs.get("query") or workflow_run_inputs.get("sys.query") or ""
  391. # get workflow_app_log_id
  392. workflow_app_log_data_stmt = select(WorkflowAppLog.id).where(
  393. WorkflowAppLog.tenant_id == tenant_id,
  394. WorkflowAppLog.app_id == workflow_run.app_id,
  395. WorkflowAppLog.workflow_run_id == workflow_run.id,
  396. )
  397. workflow_app_log_id = session.scalar(workflow_app_log_data_stmt)
  398. # get message_id
  399. message_id = None
  400. if conversation_id:
  401. message_data_stmt = select(Message.id).where(
  402. Message.conversation_id == conversation_id,
  403. Message.workflow_run_id == workflow_run_id,
  404. )
  405. message_id = session.scalar(message_data_stmt)
  406. metadata = {
  407. "workflow_id": workflow_id,
  408. "conversation_id": conversation_id,
  409. "workflow_run_id": workflow_run_id,
  410. "tenant_id": tenant_id,
  411. "elapsed_time": workflow_run_elapsed_time,
  412. "status": workflow_run_status,
  413. "version": workflow_run_version,
  414. "total_tokens": total_tokens,
  415. "file_list": file_list,
  416. "triggered_from": workflow_run.triggered_from,
  417. "user_id": user_id,
  418. }
  419. workflow_trace_info = WorkflowTraceInfo(
  420. workflow_data=workflow_run.to_dict(),
  421. conversation_id=conversation_id,
  422. workflow_id=workflow_id,
  423. tenant_id=tenant_id,
  424. workflow_run_id=workflow_run_id,
  425. workflow_run_elapsed_time=workflow_run_elapsed_time,
  426. workflow_run_status=workflow_run_status,
  427. workflow_run_inputs=workflow_run_inputs,
  428. workflow_run_outputs=workflow_run_outputs,
  429. workflow_run_version=workflow_run_version,
  430. error=error,
  431. total_tokens=total_tokens,
  432. file_list=file_list,
  433. query=query,
  434. metadata=metadata,
  435. workflow_app_log_id=workflow_app_log_id,
  436. message_id=message_id,
  437. start_time=workflow_run.created_at,
  438. end_time=workflow_run.finished_at,
  439. )
  440. return workflow_trace_info
  441. def message_trace(self, message_id: str | None):
  442. if not message_id:
  443. return {}
  444. message_data = get_message_data(message_id)
  445. if not message_data:
  446. return {}
  447. conversation_mode_stmt = select(Conversation.mode).where(Conversation.id == message_data.conversation_id)
  448. conversation_mode = db.session.scalars(conversation_mode_stmt).all()
  449. if not conversation_mode or len(conversation_mode) == 0:
  450. return {}
  451. conversation_mode = conversation_mode[0]
  452. created_at = message_data.created_at
  453. inputs = message_data.message
  454. # get message file data
  455. message_file_data = db.session.query(MessageFile).filter_by(message_id=message_id).first()
  456. file_list = []
  457. if message_file_data and message_file_data.url is not None:
  458. file_url = f"{self.file_base_url}/{message_file_data.url}" if message_file_data else ""
  459. file_list.append(file_url)
  460. metadata = {
  461. "conversation_id": message_data.conversation_id,
  462. "ls_provider": message_data.model_provider,
  463. "ls_model_name": message_data.model_id,
  464. "status": message_data.status,
  465. "from_end_user_id": message_data.from_end_user_id,
  466. "from_account_id": message_data.from_account_id,
  467. "agent_based": message_data.agent_based,
  468. "workflow_run_id": message_data.workflow_run_id,
  469. "from_source": message_data.from_source,
  470. "message_id": message_id,
  471. }
  472. message_tokens = message_data.message_tokens
  473. message_trace_info = MessageTraceInfo(
  474. message_id=message_id,
  475. message_data=message_data.to_dict(),
  476. conversation_model=conversation_mode,
  477. message_tokens=message_tokens,
  478. answer_tokens=message_data.answer_tokens,
  479. total_tokens=message_tokens + message_data.answer_tokens,
  480. error=message_data.error or "",
  481. inputs=inputs,
  482. outputs=message_data.answer,
  483. file_list=file_list,
  484. start_time=created_at,
  485. end_time=created_at + timedelta(seconds=message_data.provider_response_latency),
  486. metadata=metadata,
  487. message_file_data=message_file_data,
  488. conversation_mode=conversation_mode,
  489. )
  490. return message_trace_info
  491. def moderation_trace(self, message_id, timer, **kwargs):
  492. moderation_result = kwargs.get("moderation_result")
  493. if not moderation_result:
  494. return {}
  495. inputs = kwargs.get("inputs")
  496. message_data = get_message_data(message_id)
  497. if not message_data:
  498. return {}
  499. metadata = {
  500. "message_id": message_id,
  501. "action": moderation_result.action,
  502. "preset_response": moderation_result.preset_response,
  503. "query": moderation_result.query,
  504. }
  505. # get workflow_app_log_id
  506. workflow_app_log_id = None
  507. if message_data.workflow_run_id:
  508. workflow_app_log_data = (
  509. db.session.query(WorkflowAppLog).filter_by(workflow_run_id=message_data.workflow_run_id).first()
  510. )
  511. workflow_app_log_id = str(workflow_app_log_data.id) if workflow_app_log_data else None
  512. moderation_trace_info = ModerationTraceInfo(
  513. message_id=workflow_app_log_id or message_id,
  514. inputs=inputs,
  515. message_data=message_data.to_dict(),
  516. flagged=moderation_result.flagged,
  517. action=moderation_result.action,
  518. preset_response=moderation_result.preset_response,
  519. query=moderation_result.query,
  520. start_time=timer.get("start"),
  521. end_time=timer.get("end"),
  522. metadata=metadata,
  523. )
  524. return moderation_trace_info
  525. def suggested_question_trace(self, message_id, timer, **kwargs):
  526. suggested_question = kwargs.get("suggested_question", [])
  527. message_data = get_message_data(message_id)
  528. if not message_data:
  529. return {}
  530. metadata = {
  531. "message_id": message_id,
  532. "ls_provider": message_data.model_provider,
  533. "ls_model_name": message_data.model_id,
  534. "status": message_data.status,
  535. "from_end_user_id": message_data.from_end_user_id,
  536. "from_account_id": message_data.from_account_id,
  537. "agent_based": message_data.agent_based,
  538. "workflow_run_id": message_data.workflow_run_id,
  539. "from_source": message_data.from_source,
  540. }
  541. # get workflow_app_log_id
  542. workflow_app_log_id = None
  543. if message_data.workflow_run_id:
  544. workflow_app_log_data = (
  545. db.session.query(WorkflowAppLog).filter_by(workflow_run_id=message_data.workflow_run_id).first()
  546. )
  547. workflow_app_log_id = str(workflow_app_log_data.id) if workflow_app_log_data else None
  548. suggested_question_trace_info = SuggestedQuestionTraceInfo(
  549. message_id=workflow_app_log_id or message_id,
  550. message_data=message_data.to_dict(),
  551. inputs=message_data.message,
  552. outputs=message_data.answer,
  553. start_time=timer.get("start"),
  554. end_time=timer.get("end"),
  555. metadata=metadata,
  556. total_tokens=message_data.message_tokens + message_data.answer_tokens,
  557. status=message_data.status,
  558. error=message_data.error,
  559. from_account_id=message_data.from_account_id,
  560. agent_based=message_data.agent_based,
  561. from_source=message_data.from_source,
  562. model_provider=message_data.model_provider,
  563. model_id=message_data.model_id,
  564. suggested_question=suggested_question,
  565. level=message_data.status,
  566. status_message=message_data.error,
  567. )
  568. return suggested_question_trace_info
  569. def dataset_retrieval_trace(self, message_id, timer, **kwargs):
  570. documents = kwargs.get("documents")
  571. message_data = get_message_data(message_id)
  572. if not message_data:
  573. return {}
  574. metadata = {
  575. "message_id": message_id,
  576. "ls_provider": message_data.model_provider,
  577. "ls_model_name": message_data.model_id,
  578. "status": message_data.status,
  579. "from_end_user_id": message_data.from_end_user_id,
  580. "from_account_id": message_data.from_account_id,
  581. "agent_based": message_data.agent_based,
  582. "workflow_run_id": message_data.workflow_run_id,
  583. "from_source": message_data.from_source,
  584. }
  585. dataset_retrieval_trace_info = DatasetRetrievalTraceInfo(
  586. message_id=message_id,
  587. inputs=message_data.query or message_data.inputs,
  588. documents=[doc.model_dump() for doc in documents] if documents else [],
  589. start_time=timer.get("start"),
  590. end_time=timer.get("end"),
  591. metadata=metadata,
  592. message_data=message_data.to_dict(),
  593. )
  594. return dataset_retrieval_trace_info
  595. def tool_trace(self, message_id, timer, **kwargs):
  596. tool_name = kwargs.get("tool_name", "")
  597. tool_inputs = kwargs.get("tool_inputs", {})
  598. tool_outputs = kwargs.get("tool_outputs", {})
  599. message_data = get_message_data(message_id)
  600. if not message_data:
  601. return {}
  602. tool_config = {}
  603. time_cost = 0
  604. error = None
  605. tool_parameters = {}
  606. created_time = message_data.created_at
  607. end_time = message_data.updated_at
  608. agent_thoughts = message_data.agent_thoughts
  609. for agent_thought in agent_thoughts:
  610. if tool_name in agent_thought.tools:
  611. created_time = agent_thought.created_at
  612. tool_meta_data = agent_thought.tool_meta.get(tool_name, {})
  613. tool_config = tool_meta_data.get("tool_config", {})
  614. time_cost = tool_meta_data.get("time_cost", 0)
  615. end_time = created_time + timedelta(seconds=time_cost)
  616. error = tool_meta_data.get("error", "")
  617. tool_parameters = tool_meta_data.get("tool_parameters", {})
  618. metadata = {
  619. "message_id": message_id,
  620. "tool_name": tool_name,
  621. "tool_inputs": tool_inputs,
  622. "tool_outputs": tool_outputs,
  623. "tool_config": tool_config,
  624. "time_cost": time_cost,
  625. "error": error,
  626. "tool_parameters": tool_parameters,
  627. }
  628. file_url = ""
  629. message_file_data = db.session.query(MessageFile).filter_by(message_id=message_id).first()
  630. if message_file_data:
  631. message_file_id = message_file_data.id if message_file_data else None
  632. type = message_file_data.type
  633. created_by_role = message_file_data.created_by_role
  634. created_user_id = message_file_data.created_by
  635. file_url = f"{self.file_base_url}/{message_file_data.url}"
  636. metadata.update(
  637. {
  638. "message_file_id": message_file_id,
  639. "created_by_role": created_by_role,
  640. "created_user_id": created_user_id,
  641. "type": type,
  642. }
  643. )
  644. tool_trace_info = ToolTraceInfo(
  645. message_id=message_id,
  646. message_data=message_data.to_dict(),
  647. tool_name=tool_name,
  648. start_time=timer.get("start") if timer else created_time,
  649. end_time=timer.get("end") if timer else end_time,
  650. tool_inputs=tool_inputs,
  651. tool_outputs=tool_outputs,
  652. metadata=metadata,
  653. message_file_data=message_file_data,
  654. error=error,
  655. inputs=message_data.message,
  656. outputs=message_data.answer,
  657. tool_config=tool_config,
  658. time_cost=time_cost,
  659. tool_parameters=tool_parameters,
  660. file_url=file_url,
  661. )
  662. return tool_trace_info
  663. def generate_name_trace(self, conversation_id, timer, **kwargs):
  664. generate_conversation_name = kwargs.get("generate_conversation_name")
  665. inputs = kwargs.get("inputs")
  666. tenant_id = kwargs.get("tenant_id")
  667. if not tenant_id:
  668. return {}
  669. start_time = timer.get("start")
  670. end_time = timer.get("end")
  671. metadata = {
  672. "conversation_id": conversation_id,
  673. "tenant_id": tenant_id,
  674. }
  675. generate_name_trace_info = GenerateNameTraceInfo(
  676. conversation_id=conversation_id,
  677. inputs=inputs,
  678. outputs=generate_conversation_name,
  679. start_time=start_time,
  680. end_time=end_time,
  681. metadata=metadata,
  682. tenant_id=tenant_id,
  683. )
  684. return generate_name_trace_info
  # State shared by every TraceQueueManager in this process: one pending-task
  # queue, one flush timer, and the flush interval (seconds) / batch size taken
  # from the environment.
  trace_manager_timer: Optional[threading.Timer] = None
  trace_manager_queue: queue.Queue = queue.Queue()
  trace_manager_interval = int(os.getenv("TRACE_QUEUE_MANAGER_INTERVAL", 5))
  trace_manager_batch_size = int(os.getenv("TRACE_QUEUE_MANAGER_BATCH_SIZE", 100))


  class TraceQueueManager:
      """Queues trace tasks for an app and flushes them in batches from a timer thread.

      Tasks go onto the module-level queue; a ``threading.Timer`` later drains
      up to ``trace_manager_batch_size`` of them, writes each one to storage
      and hands a reference to the ``process_trace_tasks`` Celery task.
      """

      def __init__(self, app_id=None, user_id=None):
          """
          :param app_id: app whose tracing settings decide whether tasks are queued
          :param user_id: user id kept on the manager
          """
          self.app_id = app_id
          self.user_id = user_id
          self.trace_instance = OpsTraceManager.get_ops_trace_instance(app_id)
          # Keep the real Flask app (not the context-local proxy) so the timer
          # thread can push its own app context later.
          self.flask_app = current_app._get_current_object()  # type: ignore
          if trace_manager_timer is None:
              self.start_timer()

      def add_trace_task(self, trace_task: "TraceTask"):
          """Queue ``trace_task`` when the app has a trace instance, then make sure a flush timer is running.

          Errors while queueing are logged, never raised.
          """
          try:
              if self.trace_instance:
                  trace_task.app_id = self.app_id
                  trace_manager_queue.put(trace_task)
          except Exception:
              logging.exception("Error adding trace task, trace_type %s", trace_task.trace_type)
          finally:
              self.start_timer()

      def collect_tasks(self):
          """Remove and return up to ``trace_manager_batch_size`` tasks from the shared queue."""
          tasks: list[TraceTask] = []
          while len(tasks) < trace_manager_batch_size:
              # Ask the queue directly instead of checking ``empty()`` first:
              # another consumer may drain it between the check and the get,
              # and the resulting ``queue.Empty`` would discard the tasks
              # already collected in this batch.
              try:
                  task = trace_manager_queue.get_nowait()
              except queue.Empty:
                  break
              tasks.append(task)
              trace_manager_queue.task_done()
          return tasks

      def run(self):
          """Timer callback: flush one batch of queued tasks; errors are logged, never raised."""
          try:
              tasks = self.collect_tasks()
              if tasks:
                  self.send_to_celery(tasks)
          except Exception:
              logging.exception("Error processing trace tasks")

      def start_timer(self):
          """Start a new flush timer unless one is already pending or running."""
          global trace_manager_timer
          if trace_manager_timer is None or not trace_manager_timer.is_alive():
              trace_manager_timer = threading.Timer(trace_manager_interval, self.run)
              trace_manager_timer.name = f"trace_manager_timer_{time.strftime('%Y-%m-%d %H:%M:%S', time.localtime())}"
              trace_manager_timer.daemon = False
              trace_manager_timer.start()

      def send_to_celery(self, tasks: list["TraceTask"]):
          """Persist each task's trace info to storage and enqueue a Celery job referencing it.

          Tasks without an ``app_id`` are skipped. A task that fails is logged
          and skipped so that it cannot discard the rest of the batch, which has
          already been removed from the queue.
          """
          with self.flask_app.app_context():
              for task in tasks:
                  if task.app_id is None:
                      continue
                  try:
                      self._send_task(task)
                  except Exception:
                      logging.exception("Error sending trace task to celery, trace_type %s", task.trace_type)

      def _send_task(self, task: "TraceTask"):
          """Build, store and dispatch the payload for a single task."""
          file_id = uuid4().hex
          trace_info = task.execute()
          task_data = TaskData(
              app_id=task.app_id,
              trace_info_type=type(trace_info).__name__,
              trace_info=trace_info.model_dump() if trace_info else None,
          )
          file_path = f"{OPS_FILE_PATH}{task.app_id}/{file_id}.json"
          storage.save(file_path, task_data.model_dump_json().encode("utf-8"))
          file_info = {
              "file_id": file_id,
              "app_id": task.app_id,
          }
          process_trace_tasks.delay(file_info)