mail_clean_document_notify_task.py 4.1 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091
  1. import logging
  2. import time
  3. from collections import defaultdict
  4. import click
  5. from flask import render_template # type: ignore
  6. import app
  7. from configs import dify_config
  8. from extensions.ext_database import db
  9. from extensions.ext_mail import mail
  10. from models.account import Account, Tenant, TenantAccountJoin
  11. from models.dataset import Dataset, DatasetAutoDisableLog
  12. from services.feature_service import FeatureService
  13. @app.celery.task(queue="dataset")
  14. def send_document_clean_notify_task():
  15. """
  16. Async Send document clean notify mail
  17. Usage: send_document_clean_notify_task.delay()
  18. """
  19. if not mail.is_inited():
  20. return
  21. logging.info(click.style("Start send document clean notify mail", fg="green"))
  22. start_at = time.perf_counter()
  23. # send document clean notify mail
  24. try:
  25. dataset_auto_disable_logs = DatasetAutoDisableLog.query.filter(DatasetAutoDisableLog.notified == False).all()
  26. # group by tenant_id
  27. dataset_auto_disable_logs_map: dict[str, list[DatasetAutoDisableLog]] = defaultdict(list)
  28. for dataset_auto_disable_log in dataset_auto_disable_logs:
  29. if dataset_auto_disable_log.tenant_id not in dataset_auto_disable_logs_map:
  30. dataset_auto_disable_logs_map[dataset_auto_disable_log.tenant_id] = []
  31. dataset_auto_disable_logs_map[dataset_auto_disable_log.tenant_id].append(dataset_auto_disable_log)
  32. url = f"{dify_config.CONSOLE_WEB_URL}/datasets"
  33. for tenant_id, tenant_dataset_auto_disable_logs in dataset_auto_disable_logs_map.items():
  34. features = FeatureService.get_features(tenant_id)
  35. plan = features.billing.subscription.plan
  36. if plan != "sandbox":
  37. knowledge_details = []
  38. # check tenant
  39. tenant = Tenant.query.filter(Tenant.id == tenant_id).first()
  40. if not tenant:
  41. continue
  42. # check current owner
  43. current_owner_join = TenantAccountJoin.query.filter_by(tenant_id=tenant.id, role="owner").first()
  44. if not current_owner_join:
  45. continue
  46. account = Account.query.filter(Account.id == current_owner_join.account_id).first()
  47. if not account:
  48. continue
  49. dataset_auto_dataset_map = {} # type: ignore
  50. for dataset_auto_disable_log in tenant_dataset_auto_disable_logs:
  51. if dataset_auto_disable_log.dataset_id not in dataset_auto_dataset_map:
  52. dataset_auto_dataset_map[dataset_auto_disable_log.dataset_id] = []
  53. dataset_auto_dataset_map[dataset_auto_disable_log.dataset_id].append(
  54. dataset_auto_disable_log.document_id
  55. )
  56. for dataset_id, document_ids in dataset_auto_dataset_map.items():
  57. dataset = Dataset.query.filter(Dataset.id == dataset_id).first()
  58. if dataset:
  59. document_count = len(document_ids)
  60. knowledge_details.append(rf"Knowledge base {dataset.name}: {document_count} documents")
  61. if knowledge_details:
  62. html_content = render_template(
  63. "clean_document_job_mail_template-US.html",
  64. userName=account.email,
  65. knowledge_details=knowledge_details,
  66. url=url,
  67. )
  68. mail.send(
  69. to=account.email, subject="Dify Knowledge base auto disable notification", html=html_content
  70. )
  71. # update notified to True
  72. for dataset_auto_disable_log in tenant_dataset_auto_disable_logs:
  73. dataset_auto_disable_log.notified = True
  74. db.session.commit()
  75. end_at = time.perf_counter()
  76. logging.info(
  77. click.style("Send document clean notify mail succeeded: latency: {}".format(end_at - start_at), fg="green")
  78. )
  79. except Exception:
  80. logging.exception("Send document clean notify mail failed")