keywords.py 2.6 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970
  1. from collections.abc import Sequence
  2. from typing import Any
  3. from core.moderation.base import Moderation, ModerationAction, ModerationInputsResult, ModerationOutputsResult
  4. class KeywordsModeration(Moderation):
  5. name: str = "keywords"
  6. @classmethod
  7. def validate_config(cls, tenant_id: str, config: dict) -> None:
  8. """
  9. Validate the incoming form config data.
  10. :param tenant_id: the id of workspace
  11. :param config: the form config data
  12. :return:
  13. """
  14. cls._validate_inputs_and_outputs_config(config, True)
  15. if not config.get("keywords"):
  16. raise ValueError("keywords is required")
  17. if len(config.get("keywords")) > 10000:
  18. raise ValueError("keywords length must be less than 10000")
  19. keywords_row_len = config["keywords"].split("\n")
  20. if len(keywords_row_len) > 100:
  21. raise ValueError("the number of rows for the keywords must be less than 100")
  22. def moderation_for_inputs(self, inputs: dict, query: str = "") -> ModerationInputsResult:
  23. flagged = False
  24. preset_response = ""
  25. if self.config["inputs_config"]["enabled"]:
  26. preset_response = self.config["inputs_config"]["preset_response"]
  27. if query:
  28. inputs["query__"] = query
  29. # Filter out empty values
  30. keywords_list = [keyword for keyword in self.config["keywords"].split("\n") if keyword]
  31. flagged = self._is_violated(inputs, keywords_list)
  32. return ModerationInputsResult(
  33. flagged=flagged, action=ModerationAction.DIRECT_OUTPUT, preset_response=preset_response
  34. )
  35. def moderation_for_outputs(self, text: str) -> ModerationOutputsResult:
  36. flagged = False
  37. preset_response = ""
  38. if self.config["outputs_config"]["enabled"]:
  39. # Filter out empty values
  40. keywords_list = [keyword for keyword in self.config["keywords"].split("\n") if keyword]
  41. flagged = self._is_violated({"text": text}, keywords_list)
  42. preset_response = self.config["outputs_config"]["preset_response"]
  43. return ModerationOutputsResult(
  44. flagged=flagged, action=ModerationAction.DIRECT_OUTPUT, preset_response=preset_response
  45. )
  46. def _is_violated(self, inputs: dict, keywords_list: list) -> bool:
  47. return any(self._check_keywords_in_value(keywords_list, value) for value in inputs.values())
  48. def _check_keywords_in_value(self, keywords_list: Sequence[str], value: Any) -> bool:
  49. return any(keyword.lower() in str(value).lower() for keyword in keywords_list)