You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

remove_app_and_related_data_task.py 13KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348
  1. import logging
  2. import time
  3. from collections.abc import Callable
  4. import click
  5. import sqlalchemy as sa
  6. from celery import shared_task # type: ignore
  7. from sqlalchemy import delete
  8. from sqlalchemy.exc import SQLAlchemyError
  9. from sqlalchemy.orm import sessionmaker
  10. from extensions.ext_database import db
  11. from models import (
  12. ApiToken,
  13. AppAnnotationHitHistory,
  14. AppAnnotationSetting,
  15. AppDatasetJoin,
  16. AppMCPServer,
  17. AppModelConfig,
  18. Conversation,
  19. EndUser,
  20. InstalledApp,
  21. Message,
  22. MessageAgentThought,
  23. MessageAnnotation,
  24. MessageChain,
  25. MessageFeedback,
  26. MessageFile,
  27. RecommendedApp,
  28. Site,
  29. TagBinding,
  30. TraceAppConfig,
  31. )
  32. from models.tools import WorkflowToolProvider
  33. from models.web import PinnedConversation, SavedMessage
  34. from models.workflow import ConversationVariable, Workflow, WorkflowAppLog
  35. from repositories.factory import DifyAPIRepositoryFactory
  36. @shared_task(queue="app_deletion", bind=True, max_retries=3)
  37. def remove_app_and_related_data_task(self, tenant_id: str, app_id: str):
  38. logging.info(click.style(f"Start deleting app and related data: {tenant_id}:{app_id}", fg="green"))
  39. start_at = time.perf_counter()
  40. try:
  41. # Delete related data
  42. _delete_app_model_configs(tenant_id, app_id)
  43. _delete_app_site(tenant_id, app_id)
  44. _delete_app_mcp_servers(tenant_id, app_id)
  45. _delete_app_api_tokens(tenant_id, app_id)
  46. _delete_installed_apps(tenant_id, app_id)
  47. _delete_recommended_apps(tenant_id, app_id)
  48. _delete_app_annotation_data(tenant_id, app_id)
  49. _delete_app_dataset_joins(tenant_id, app_id)
  50. _delete_app_workflows(tenant_id, app_id)
  51. _delete_app_workflow_runs(tenant_id, app_id)
  52. _delete_app_workflow_node_executions(tenant_id, app_id)
  53. _delete_app_workflow_app_logs(tenant_id, app_id)
  54. _delete_app_conversations(tenant_id, app_id)
  55. _delete_app_messages(tenant_id, app_id)
  56. _delete_workflow_tool_providers(tenant_id, app_id)
  57. _delete_app_tag_bindings(tenant_id, app_id)
  58. _delete_end_users(tenant_id, app_id)
  59. _delete_trace_app_configs(tenant_id, app_id)
  60. _delete_conversation_variables(app_id=app_id)
  61. end_at = time.perf_counter()
  62. logging.info(click.style(f"App and related data deleted: {app_id} latency: {end_at - start_at}", fg="green"))
  63. except SQLAlchemyError as e:
  64. logging.exception(
  65. click.style(f"Database error occurred while deleting app {app_id} and related data", fg="red")
  66. )
  67. raise self.retry(exc=e, countdown=60) # Retry after 60 seconds
  68. except Exception as e:
  69. logging.exception(click.style(f"Error occurred while deleting app {app_id} and related data", fg="red"))
  70. raise self.retry(exc=e, countdown=60) # Retry after 60 seconds
  71. def _delete_app_model_configs(tenant_id: str, app_id: str):
  72. def del_model_config(model_config_id: str):
  73. db.session.query(AppModelConfig).where(AppModelConfig.id == model_config_id).delete(synchronize_session=False)
  74. _delete_records(
  75. """select id from app_model_configs where app_id=:app_id limit 1000""",
  76. {"app_id": app_id},
  77. del_model_config,
  78. "app model config",
  79. )
  80. def _delete_app_site(tenant_id: str, app_id: str):
  81. def del_site(site_id: str):
  82. db.session.query(Site).where(Site.id == site_id).delete(synchronize_session=False)
  83. _delete_records("""select id from sites where app_id=:app_id limit 1000""", {"app_id": app_id}, del_site, "site")
  84. def _delete_app_mcp_servers(tenant_id: str, app_id: str):
  85. def del_mcp_server(mcp_server_id: str):
  86. db.session.query(AppMCPServer).where(AppMCPServer.id == mcp_server_id).delete(synchronize_session=False)
  87. _delete_records(
  88. """select id from app_mcp_servers where app_id=:app_id limit 1000""",
  89. {"app_id": app_id},
  90. del_mcp_server,
  91. "app mcp server",
  92. )
  93. def _delete_app_api_tokens(tenant_id: str, app_id: str):
  94. def del_api_token(api_token_id: str):
  95. db.session.query(ApiToken).where(ApiToken.id == api_token_id).delete(synchronize_session=False)
  96. _delete_records(
  97. """select id from api_tokens where app_id=:app_id limit 1000""", {"app_id": app_id}, del_api_token, "api token"
  98. )
  99. def _delete_installed_apps(tenant_id: str, app_id: str):
  100. def del_installed_app(installed_app_id: str):
  101. db.session.query(InstalledApp).where(InstalledApp.id == installed_app_id).delete(synchronize_session=False)
  102. _delete_records(
  103. """select id from installed_apps where tenant_id=:tenant_id and app_id=:app_id limit 1000""",
  104. {"tenant_id": tenant_id, "app_id": app_id},
  105. del_installed_app,
  106. "installed app",
  107. )
  108. def _delete_recommended_apps(tenant_id: str, app_id: str):
  109. def del_recommended_app(recommended_app_id: str):
  110. db.session.query(RecommendedApp).where(RecommendedApp.id == recommended_app_id).delete(
  111. synchronize_session=False
  112. )
  113. _delete_records(
  114. """select id from recommended_apps where app_id=:app_id limit 1000""",
  115. {"app_id": app_id},
  116. del_recommended_app,
  117. "recommended app",
  118. )
  119. def _delete_app_annotation_data(tenant_id: str, app_id: str):
  120. def del_annotation_hit_history(annotation_hit_history_id: str):
  121. db.session.query(AppAnnotationHitHistory).where(AppAnnotationHitHistory.id == annotation_hit_history_id).delete(
  122. synchronize_session=False
  123. )
  124. _delete_records(
  125. """select id from app_annotation_hit_histories where app_id=:app_id limit 1000""",
  126. {"app_id": app_id},
  127. del_annotation_hit_history,
  128. "annotation hit history",
  129. )
  130. def del_annotation_setting(annotation_setting_id: str):
  131. db.session.query(AppAnnotationSetting).where(AppAnnotationSetting.id == annotation_setting_id).delete(
  132. synchronize_session=False
  133. )
  134. _delete_records(
  135. """select id from app_annotation_settings where app_id=:app_id limit 1000""",
  136. {"app_id": app_id},
  137. del_annotation_setting,
  138. "annotation setting",
  139. )
  140. def _delete_app_dataset_joins(tenant_id: str, app_id: str):
  141. def del_dataset_join(dataset_join_id: str):
  142. db.session.query(AppDatasetJoin).where(AppDatasetJoin.id == dataset_join_id).delete(synchronize_session=False)
  143. _delete_records(
  144. """select id from app_dataset_joins where app_id=:app_id limit 1000""",
  145. {"app_id": app_id},
  146. del_dataset_join,
  147. "dataset join",
  148. )
  149. def _delete_app_workflows(tenant_id: str, app_id: str):
  150. def del_workflow(workflow_id: str):
  151. db.session.query(Workflow).where(Workflow.id == workflow_id).delete(synchronize_session=False)
  152. _delete_records(
  153. """select id from workflows where tenant_id=:tenant_id and app_id=:app_id limit 1000""",
  154. {"tenant_id": tenant_id, "app_id": app_id},
  155. del_workflow,
  156. "workflow",
  157. )
  158. def _delete_app_workflow_runs(tenant_id: str, app_id: str):
  159. """Delete all workflow runs for an app using the service repository."""
  160. session_maker = sessionmaker(bind=db.engine)
  161. workflow_run_repo = DifyAPIRepositoryFactory.create_api_workflow_run_repository(session_maker)
  162. deleted_count = workflow_run_repo.delete_runs_by_app(
  163. tenant_id=tenant_id,
  164. app_id=app_id,
  165. batch_size=1000,
  166. )
  167. logging.info("Deleted %s workflow runs for app %s", deleted_count, app_id)
  168. def _delete_app_workflow_node_executions(tenant_id: str, app_id: str):
  169. """Delete all workflow node executions for an app using the service repository."""
  170. session_maker = sessionmaker(bind=db.engine)
  171. node_execution_repo = DifyAPIRepositoryFactory.create_api_workflow_node_execution_repository(session_maker)
  172. deleted_count = node_execution_repo.delete_executions_by_app(
  173. tenant_id=tenant_id,
  174. app_id=app_id,
  175. batch_size=1000,
  176. )
  177. logging.info("Deleted %s workflow node executions for app %s", deleted_count, app_id)
  178. def _delete_app_workflow_app_logs(tenant_id: str, app_id: str):
  179. def del_workflow_app_log(workflow_app_log_id: str):
  180. db.session.query(WorkflowAppLog).where(WorkflowAppLog.id == workflow_app_log_id).delete(
  181. synchronize_session=False
  182. )
  183. _delete_records(
  184. """select id from workflow_app_logs where tenant_id=:tenant_id and app_id=:app_id limit 1000""",
  185. {"tenant_id": tenant_id, "app_id": app_id},
  186. del_workflow_app_log,
  187. "workflow app log",
  188. )
  189. def _delete_app_conversations(tenant_id: str, app_id: str):
  190. def del_conversation(conversation_id: str):
  191. db.session.query(PinnedConversation).where(PinnedConversation.conversation_id == conversation_id).delete(
  192. synchronize_session=False
  193. )
  194. db.session.query(Conversation).where(Conversation.id == conversation_id).delete(synchronize_session=False)
  195. _delete_records(
  196. """select id from conversations where app_id=:app_id limit 1000""",
  197. {"app_id": app_id},
  198. del_conversation,
  199. "conversation",
  200. )
  201. def _delete_conversation_variables(*, app_id: str):
  202. stmt = delete(ConversationVariable).where(ConversationVariable.app_id == app_id)
  203. with db.engine.connect() as conn:
  204. conn.execute(stmt)
  205. conn.commit()
  206. logging.info(click.style(f"Deleted conversation variables for app {app_id}", fg="green"))
  207. def _delete_app_messages(tenant_id: str, app_id: str):
  208. def del_message(message_id: str):
  209. db.session.query(MessageFeedback).where(MessageFeedback.message_id == message_id).delete(
  210. synchronize_session=False
  211. )
  212. db.session.query(MessageAnnotation).where(MessageAnnotation.message_id == message_id).delete(
  213. synchronize_session=False
  214. )
  215. db.session.query(MessageChain).where(MessageChain.message_id == message_id).delete(synchronize_session=False)
  216. db.session.query(MessageAgentThought).where(MessageAgentThought.message_id == message_id).delete(
  217. synchronize_session=False
  218. )
  219. db.session.query(MessageFile).where(MessageFile.message_id == message_id).delete(synchronize_session=False)
  220. db.session.query(SavedMessage).where(SavedMessage.message_id == message_id).delete(synchronize_session=False)
  221. db.session.query(Message).where(Message.id == message_id).delete()
  222. _delete_records(
  223. """select id from messages where app_id=:app_id limit 1000""", {"app_id": app_id}, del_message, "message"
  224. )
  225. def _delete_workflow_tool_providers(tenant_id: str, app_id: str):
  226. def del_tool_provider(tool_provider_id: str):
  227. db.session.query(WorkflowToolProvider).where(WorkflowToolProvider.id == tool_provider_id).delete(
  228. synchronize_session=False
  229. )
  230. _delete_records(
  231. """select id from tool_workflow_providers where tenant_id=:tenant_id and app_id=:app_id limit 1000""",
  232. {"tenant_id": tenant_id, "app_id": app_id},
  233. del_tool_provider,
  234. "tool workflow provider",
  235. )
  236. def _delete_app_tag_bindings(tenant_id: str, app_id: str):
  237. def del_tag_binding(tag_binding_id: str):
  238. db.session.query(TagBinding).where(TagBinding.id == tag_binding_id).delete(synchronize_session=False)
  239. _delete_records(
  240. """select id from tag_bindings where tenant_id=:tenant_id and target_id=:app_id limit 1000""",
  241. {"tenant_id": tenant_id, "app_id": app_id},
  242. del_tag_binding,
  243. "tag binding",
  244. )
  245. def _delete_end_users(tenant_id: str, app_id: str):
  246. def del_end_user(end_user_id: str):
  247. db.session.query(EndUser).where(EndUser.id == end_user_id).delete(synchronize_session=False)
  248. _delete_records(
  249. """select id from end_users where tenant_id=:tenant_id and app_id=:app_id limit 1000""",
  250. {"tenant_id": tenant_id, "app_id": app_id},
  251. del_end_user,
  252. "end user",
  253. )
  254. def _delete_trace_app_configs(tenant_id: str, app_id: str):
  255. def del_trace_app_config(trace_app_config_id: str):
  256. db.session.query(TraceAppConfig).where(TraceAppConfig.id == trace_app_config_id).delete(
  257. synchronize_session=False
  258. )
  259. _delete_records(
  260. """select id from trace_app_config where app_id=:app_id limit 1000""",
  261. {"app_id": app_id},
  262. del_trace_app_config,
  263. "trace app config",
  264. )
  265. def _delete_records(query_sql: str, params: dict, delete_func: Callable, name: str) -> None:
  266. while True:
  267. with db.engine.begin() as conn:
  268. rs = conn.execute(sa.text(query_sql), params)
  269. if rs.rowcount == 0:
  270. break
  271. for i in rs:
  272. record_id = str(i.id)
  273. try:
  274. delete_func(record_id)
  275. db.session.commit()
  276. logging.info(click.style(f"Deleted {name} {record_id}", fg="green"))
  277. except Exception:
  278. logging.exception("Error occurred while deleting %s %s", name, record_id)
  279. continue
  280. rs.close()