You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

remove_app_and_related_data_task.py 12KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328
  1. import logging
  2. import time
  3. from collections.abc import Callable
  4. import click
  5. from celery import shared_task # type: ignore
  6. from sqlalchemy import delete
  7. from sqlalchemy.exc import SQLAlchemyError
  8. from core.repositories import SQLAlchemyWorkflowNodeExecutionRepository
  9. from extensions.ext_database import db
  10. from models.dataset import AppDatasetJoin
  11. from models.model import (
  12. ApiToken,
  13. AppAnnotationHitHistory,
  14. AppAnnotationSetting,
  15. AppModelConfig,
  16. Conversation,
  17. EndUser,
  18. InstalledApp,
  19. Message,
  20. MessageAgentThought,
  21. MessageAnnotation,
  22. MessageChain,
  23. MessageFeedback,
  24. MessageFile,
  25. RecommendedApp,
  26. Site,
  27. TagBinding,
  28. TraceAppConfig,
  29. )
  30. from models.tools import WorkflowToolProvider
  31. from models.web import PinnedConversation, SavedMessage
  32. from models.workflow import ConversationVariable, Workflow, WorkflowAppLog, WorkflowRun
  @shared_task(queue="app_deletion", bind=True, max_retries=3)
  def remove_app_and_related_data_task(self, tenant_id: str, app_id: str):
      """Celery task that removes an app's dependent records, one table group at a time.

      Each cleanup helper runs in a fixed order; on success the elapsed time is
      logged. Any exception is logged and the task is re-queued through
      ``self.retry`` with a 60 second countdown (the decorator sets
      ``max_retries=3``).

      Args:
          tenant_id: Tenant that owns the app.
          app_id: App whose related data is being removed.
      """
      logging.info(click.style(f"Start deleting app and related data: {tenant_id}:{app_id}", fg="green"))
      start_at = time.perf_counter()
      try:
          # Helpers that share the positional (tenant_id, app_id) signature, in execution order.
          cleanup_steps = (
              _delete_app_model_configs,
              _delete_app_site,
              _delete_app_api_tokens,
              _delete_installed_apps,
              _delete_recommended_apps,
              _delete_app_annotation_data,
              _delete_app_dataset_joins,
              _delete_app_workflows,
              _delete_app_workflow_runs,
              _delete_app_workflow_node_executions,
              _delete_app_workflow_app_logs,
              _delete_app_conversations,
              _delete_app_messages,
              _delete_workflow_tool_providers,
              _delete_app_tag_bindings,
              _delete_end_users,
              _delete_trace_app_configs,
          )
          for cleanup in cleanup_steps:
              cleanup(tenant_id, app_id)
          # Keyword-only signature, so it is called outside the loop above.
          _delete_conversation_variables(app_id=app_id)

          end_at = time.perf_counter()
          logging.info(click.style(f"App and related data deleted: {app_id} latency: {end_at - start_at}", fg="green"))
      except SQLAlchemyError as e:
          db_failure_text = f"Database error occurred while deleting app {app_id} and related data"
          logging.exception(click.style(db_failure_text, fg="red"))
          raise self.retry(exc=e, countdown=60)  # Retry after 60 seconds
      except Exception as e:
          failure_text = f"Error occurred while deleting app {app_id} and related data"
          logging.exception(click.style(failure_text, fg="red"))
          raise self.retry(exc=e, countdown=60)  # Retry after 60 seconds
  def _delete_app_model_configs(tenant_id: str, app_id: str):
      """Delete the app's ``AppModelConfig`` rows, looked up by ``app_id`` in batches of 1000.

      ``tenant_id`` is not used by the lookup query; it is part of the shared
      helper signature.
      """

      def _remove_model_config(record_id: str):
          matching = db.session.query(AppModelConfig).filter(AppModelConfig.id == record_id)
          matching.delete(synchronize_session=False)

      lookup_sql = "select id from app_model_configs where app_id=:app_id limit 1000"
      _delete_records(lookup_sql, {"app_id": app_id}, _remove_model_config, "app model config")
  def _delete_app_site(tenant_id: str, app_id: str):
      """Delete the app's ``Site`` rows, looked up by ``app_id`` in batches of 1000.

      ``tenant_id`` is not used by the lookup query.
      """

      def _remove_site(record_id: str):
          matching = db.session.query(Site).filter(Site.id == record_id)
          matching.delete(synchronize_session=False)

      lookup_sql = "select id from sites where app_id=:app_id limit 1000"
      _delete_records(lookup_sql, {"app_id": app_id}, _remove_site, "site")
  def _delete_app_api_tokens(tenant_id: str, app_id: str):
      """Delete the app's ``ApiToken`` rows, looked up by ``app_id`` in batches of 1000.

      ``tenant_id`` is not used by the lookup query.
      """

      def _remove_api_token(record_id: str):
          matching = db.session.query(ApiToken).filter(ApiToken.id == record_id)
          matching.delete(synchronize_session=False)

      lookup_sql = "select id from api_tokens where app_id=:app_id limit 1000"
      _delete_records(lookup_sql, {"app_id": app_id}, _remove_api_token, "api token")
  def _delete_installed_apps(tenant_id: str, app_id: str):
      """Delete ``InstalledApp`` rows matching both ``tenant_id`` and ``app_id``, 1000 ids per batch."""

      def _remove_installed_app(record_id: str):
          matching = db.session.query(InstalledApp).filter(InstalledApp.id == record_id)
          matching.delete(synchronize_session=False)

      lookup_sql = "select id from installed_apps where tenant_id=:tenant_id and app_id=:app_id limit 1000"
      bind_params = {"tenant_id": tenant_id, "app_id": app_id}
      _delete_records(lookup_sql, bind_params, _remove_installed_app, "installed app")
  def _delete_recommended_apps(tenant_id: str, app_id: str):
      """Delete the app's ``RecommendedApp`` rows, looked up by ``app_id`` in batches of 1000.

      ``tenant_id`` is not used by the lookup query.
      """

      def _remove_recommended_app(record_id: str):
          matching = db.session.query(RecommendedApp).filter(RecommendedApp.id == record_id)
          matching.delete(synchronize_session=False)

      lookup_sql = "select id from recommended_apps where app_id=:app_id limit 1000"
      _delete_records(lookup_sql, {"app_id": app_id}, _remove_recommended_app, "recommended app")
  def _delete_app_annotation_data(tenant_id: str, app_id: str):
      """Delete the app's annotation hit histories, then its annotation settings.

      Both lookups filter on ``app_id`` only and fetch 1000 ids per batch;
      ``tenant_id`` is not used by either query.
      """
      by_app = {"app_id": app_id}

      def _remove_hit_history(record_id: str):
          matching = db.session.query(AppAnnotationHitHistory).filter(AppAnnotationHitHistory.id == record_id)
          matching.delete(synchronize_session=False)

      def _remove_setting(record_id: str):
          matching = db.session.query(AppAnnotationSetting).filter(AppAnnotationSetting.id == record_id)
          matching.delete(synchronize_session=False)

      # Hit histories are removed first, settings second (same order as before).
      _delete_records(
          "select id from app_annotation_hit_histories where app_id=:app_id limit 1000",
          by_app,
          _remove_hit_history,
          "annotation hit history",
      )
      _delete_records(
          "select id from app_annotation_settings where app_id=:app_id limit 1000",
          by_app,
          _remove_setting,
          "annotation setting",
      )
  def _delete_app_dataset_joins(tenant_id: str, app_id: str):
      """Delete the app's ``AppDatasetJoin`` rows, looked up by ``app_id`` in batches of 1000.

      ``tenant_id`` is not used by the lookup query.
      """

      def _remove_dataset_join(record_id: str):
          matching = db.session.query(AppDatasetJoin).filter(AppDatasetJoin.id == record_id)
          matching.delete(synchronize_session=False)

      lookup_sql = "select id from app_dataset_joins where app_id=:app_id limit 1000"
      _delete_records(lookup_sql, {"app_id": app_id}, _remove_dataset_join, "dataset join")
  def _delete_app_workflows(tenant_id: str, app_id: str):
      """Delete ``Workflow`` rows matching both ``tenant_id`` and ``app_id``, 1000 ids per batch."""

      def _remove_workflow(record_id: str):
          matching = db.session.query(Workflow).filter(Workflow.id == record_id)
          matching.delete(synchronize_session=False)

      lookup_sql = "select id from workflows where tenant_id=:tenant_id and app_id=:app_id limit 1000"
      bind_params = {"tenant_id": tenant_id, "app_id": app_id}
      _delete_records(lookup_sql, bind_params, _remove_workflow, "workflow")
  def _delete_app_workflow_runs(tenant_id: str, app_id: str):
      """Delete ``WorkflowRun`` rows matching both ``tenant_id`` and ``app_id``, 1000 ids per batch."""

      def _remove_workflow_run(record_id: str):
          matching = db.session.query(WorkflowRun).filter(WorkflowRun.id == record_id)
          matching.delete(synchronize_session=False)

      lookup_sql = "select id from workflow_runs where tenant_id=:tenant_id and app_id=:app_id limit 1000"
      bind_params = {"tenant_id": tenant_id, "app_id": app_id}
      _delete_records(lookup_sql, bind_params, _remove_workflow_run, "workflow run")
  def _delete_app_workflow_node_executions(tenant_id: str, app_id: str):
      """Clear workflow node execution records for this tenant/app via the repository layer."""
      # The repository is scoped to the tenant/app pair at construction time;
      # the engine is handed over as its ``session_factory``.
      node_execution_repo = SQLAlchemyWorkflowNodeExecutionRepository(
          session_factory=db.engine,
          tenant_id=tenant_id,
          app_id=app_id,
      )

      # ``clear`` is relied on to delete all records for this tenant_id and app_id.
      node_execution_repo.clear()

      done_text = f"Deleted workflow node executions for tenant {tenant_id} and app {app_id}"
      logging.info(click.style(done_text, fg="green"))
  def _delete_app_workflow_app_logs(tenant_id: str, app_id: str):
      """Delete ``WorkflowAppLog`` rows matching both ``tenant_id`` and ``app_id``, 1000 ids per batch."""

      def _remove_app_log(record_id: str):
          matching = db.session.query(WorkflowAppLog).filter(WorkflowAppLog.id == record_id)
          matching.delete(synchronize_session=False)

      lookup_sql = "select id from workflow_app_logs where tenant_id=:tenant_id and app_id=:app_id limit 1000"
      bind_params = {"tenant_id": tenant_id, "app_id": app_id}
      _delete_records(lookup_sql, bind_params, _remove_app_log, "workflow app log")
  def _delete_app_conversations(tenant_id: str, app_id: str):
      """Delete the app's conversations together with their pinned-conversation rows.

      Conversations are looked up by ``app_id`` in batches of 1000;
      ``tenant_id`` is not used by the lookup query.
      """

      def _remove_conversation(record_id: str):
          # Remove the pin rows referencing the conversation before the conversation itself.
          pinned = db.session.query(PinnedConversation).filter(PinnedConversation.conversation_id == record_id)
          pinned.delete(synchronize_session=False)
          conversation = db.session.query(Conversation).filter(Conversation.id == record_id)
          conversation.delete(synchronize_session=False)

      lookup_sql = "select id from conversations where app_id=:app_id limit 1000"
      _delete_records(lookup_sql, {"app_id": app_id}, _remove_conversation, "conversation")
  def _delete_conversation_variables(*, app_id: str):
      """Delete all ``ConversationVariable`` rows of the app in one statement.

      Uses a dedicated engine connection (not ``db.session``) and commits
      explicitly before logging completion.

      Args:
          app_id: App whose conversation variables are removed (keyword-only).
      """
      purge_stmt = delete(ConversationVariable).where(ConversationVariable.app_id == app_id)
      with db.engine.connect() as connection:
          connection.execute(purge_stmt)
          connection.commit()
          done_text = f"Deleted conversation variables for app {app_id}"
          logging.info(click.style(done_text, fg="green"))
  def _delete_app_messages(tenant_id: str, app_id: str):
      """Delete the app's messages and the rows that reference each message.

      Messages are looked up by ``app_id`` in batches of 1000; ``tenant_id`` is
      not used by the lookup query. For every message id, rows keyed by
      ``message_id`` in the dependent tables are removed first, then the
      ``Message`` row itself.
      """
      # Dependent models filtered on ``message_id``, in deletion order.
      dependent_models = (
          MessageFeedback,
          MessageAnnotation,
          MessageChain,
          MessageAgentThought,
          MessageFile,
          SavedMessage,
      )

      def del_message(message_id: str):
          for model in dependent_models:
              db.session.query(model).filter(model.message_id == message_id).delete(synchronize_session=False)
          # Pass synchronize_session=False here as well, matching every other bulk
          # delete in this module: nothing is loaded into the session, so there is
          # no in-session state to synchronize.
          db.session.query(Message).filter(Message.id == message_id).delete(synchronize_session=False)

      _delete_records(
          """select id from messages where app_id=:app_id limit 1000""", {"app_id": app_id}, del_message, "message"
      )
  def _delete_workflow_tool_providers(tenant_id: str, app_id: str):
      """Delete ``WorkflowToolProvider`` rows matching both ``tenant_id`` and ``app_id``, 1000 ids per batch."""

      def _remove_tool_provider(record_id: str):
          matching = db.session.query(WorkflowToolProvider).filter(WorkflowToolProvider.id == record_id)
          matching.delete(synchronize_session=False)

      lookup_sql = "select id from tool_workflow_providers where tenant_id=:tenant_id and app_id=:app_id limit 1000"
      bind_params = {"tenant_id": tenant_id, "app_id": app_id}
      _delete_records(lookup_sql, bind_params, _remove_tool_provider, "tool workflow provider")
  def _delete_app_tag_bindings(tenant_id: str, app_id: str):
      """Delete ``TagBinding`` rows of the tenant whose ``target_id`` is this app, 1000 ids per batch."""

      def _remove_tag_binding(record_id: str):
          matching = db.session.query(TagBinding).filter(TagBinding.id == record_id)
          matching.delete(synchronize_session=False)

      # The tag_bindings table references the app through ``target_id``.
      lookup_sql = "select id from tag_bindings where tenant_id=:tenant_id and target_id=:app_id limit 1000"
      bind_params = {"tenant_id": tenant_id, "app_id": app_id}
      _delete_records(lookup_sql, bind_params, _remove_tag_binding, "tag binding")
  def _delete_end_users(tenant_id: str, app_id: str):
      """Delete ``EndUser`` rows matching both ``tenant_id`` and ``app_id``, 1000 ids per batch."""

      def _remove_end_user(record_id: str):
          matching = db.session.query(EndUser).filter(EndUser.id == record_id)
          matching.delete(synchronize_session=False)

      lookup_sql = "select id from end_users where tenant_id=:tenant_id and app_id=:app_id limit 1000"
      bind_params = {"tenant_id": tenant_id, "app_id": app_id}
      _delete_records(lookup_sql, bind_params, _remove_end_user, "end user")
  def _delete_trace_app_configs(tenant_id: str, app_id: str):
      """Delete the app's ``TraceAppConfig`` rows, looked up by ``app_id`` in batches of 1000.

      ``tenant_id`` is not used by the lookup query.
      """

      def _remove_trace_config(record_id: str):
          matching = db.session.query(TraceAppConfig).filter(TraceAppConfig.id == record_id)
          matching.delete(synchronize_session=False)

      lookup_sql = "select id from trace_app_config where app_id=:app_id limit 1000"
      _delete_records(lookup_sql, {"app_id": app_id}, _remove_trace_config, "trace app config")
  def _delete_records(query_sql: str, params: dict, delete_func: Callable, name: str) -> None:
      """Repeatedly select a batch of record ids and delete each one via ``delete_func``.

      Deletion is best effort per record: a failure is logged, the session is
      rolled back, and processing continues with the next id. The loop ends when
      the query returns no rows, or when a whole batch fails to delete (the same
      ids would otherwise be selected again forever).

      Args:
          query_sql: SELECT statement yielding an ``id`` column. Callers bound it
              with ``limit`` so each pass handles one batch.
          params: Bind parameters for ``query_sql``.
          delete_func: Called with the record id as ``str``; expected to issue the
              deletes on ``db.session``. The commit happens here.
          name: Human-readable record kind used in log messages.
      """
      while True:
          # Materialize the batch and release the connection before deleting, so the
          # SELECT transaction is not held open while db.session does the deletes.
          # Checking the fetched rows (not ``rowcount``) is the reliable emptiness
          # test for a SELECT.
          with db.engine.begin() as conn:
              rows = conn.execute(db.text(query_sql), params).fetchall()
          if not rows:
              break

          deleted_any = False
          for row in rows:
              record_id = str(row.id)
              try:
                  delete_func(record_id)
                  db.session.commit()
              except Exception:
                  logging.exception(f"Error occurred while deleting {name} {record_id}")
                  # Reset the failed transaction so later records can still be processed.
                  db.session.rollback()
                  continue
              deleted_any = True
              logging.info(click.style(f"Deleted {name} {record_id}", fg="green"))

          if not deleted_any:
              # Every record in this batch failed; re-running the same query would
              # return the same ids, so stop instead of spinning.
              logging.error(f"No {name} records could be deleted in the last batch; stopping to avoid an endless loop")
              break