external.py 9.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263
  1. from flask import request
  2. from flask_login import current_user # type: ignore
  3. from flask_restful import Resource, marshal, reqparse # type: ignore
  4. from werkzeug.exceptions import Forbidden, InternalServerError, NotFound
  5. import services
  6. from controllers.console import api
  7. from controllers.console.datasets.error import DatasetNameDuplicateError
  8. from controllers.console.wraps import account_initialization_required, setup_required
  9. from fields.dataset_fields import dataset_detail_fields
  10. from libs.login import login_required
  11. from services.dataset_service import DatasetService
  12. from services.external_knowledge_service import ExternalDatasetService
  13. from services.hit_testing_service import HitTestingService
  14. from services.knowledge_service import ExternalDatasetTestService
  15. def _validate_name(name):
  16. if not name or len(name) < 1 or len(name) > 100:
  17. raise ValueError("Name must be between 1 to 100 characters.")
  18. return name
  19. def _validate_description_length(description):
  20. if description and len(description) > 400:
  21. raise ValueError("Description cannot exceed 400 characters.")
  22. return description
  23. class ExternalApiTemplateListApi(Resource):
  24. @setup_required
  25. @login_required
  26. @account_initialization_required
  27. def get(self):
  28. page = request.args.get("page", default=1, type=int)
  29. limit = request.args.get("limit", default=20, type=int)
  30. search = request.args.get("keyword", default=None, type=str)
  31. external_knowledge_apis, total = ExternalDatasetService.get_external_knowledge_apis(
  32. page, limit, current_user.current_tenant_id, search
  33. )
  34. response = {
  35. "data": [item.to_dict() for item in external_knowledge_apis],
  36. "has_more": len(external_knowledge_apis) == limit,
  37. "limit": limit,
  38. "total": total,
  39. "page": page,
  40. }
  41. return response, 200
  42. @setup_required
  43. @login_required
  44. @account_initialization_required
  45. def post(self):
  46. parser = reqparse.RequestParser()
  47. parser.add_argument(
  48. "name",
  49. nullable=False,
  50. required=True,
  51. help="Name is required. Name must be between 1 to 100 characters.",
  52. type=_validate_name,
  53. )
  54. parser.add_argument(
  55. "settings",
  56. type=dict,
  57. location="json",
  58. nullable=False,
  59. required=True,
  60. )
  61. args = parser.parse_args()
  62. ExternalDatasetService.validate_api_list(args["settings"])
  63. # The role of the current user in the ta table must be admin, owner, or editor, or dataset_operator
  64. if not current_user.is_dataset_editor:
  65. raise Forbidden()
  66. try:
  67. external_knowledge_api = ExternalDatasetService.create_external_knowledge_api(
  68. tenant_id=current_user.current_tenant_id, user_id=current_user.id, args=args
  69. )
  70. except services.errors.dataset.DatasetNameDuplicateError:
  71. raise DatasetNameDuplicateError()
  72. return external_knowledge_api.to_dict(), 201
  73. class ExternalApiTemplateApi(Resource):
  74. @setup_required
  75. @login_required
  76. @account_initialization_required
  77. def get(self, external_knowledge_api_id):
  78. external_knowledge_api_id = str(external_knowledge_api_id)
  79. external_knowledge_api = ExternalDatasetService.get_external_knowledge_api(external_knowledge_api_id)
  80. if external_knowledge_api is None:
  81. raise NotFound("API template not found.")
  82. return external_knowledge_api.to_dict(), 200
  83. @setup_required
  84. @login_required
  85. @account_initialization_required
  86. def patch(self, external_knowledge_api_id):
  87. external_knowledge_api_id = str(external_knowledge_api_id)
  88. parser = reqparse.RequestParser()
  89. parser.add_argument(
  90. "name",
  91. nullable=False,
  92. required=True,
  93. help="type is required. Name must be between 1 to 100 characters.",
  94. type=_validate_name,
  95. )
  96. parser.add_argument(
  97. "settings",
  98. type=dict,
  99. location="json",
  100. nullable=False,
  101. required=True,
  102. )
  103. args = parser.parse_args()
  104. ExternalDatasetService.validate_api_list(args["settings"])
  105. external_knowledge_api = ExternalDatasetService.update_external_knowledge_api(
  106. tenant_id=current_user.current_tenant_id,
  107. user_id=current_user.id,
  108. external_knowledge_api_id=external_knowledge_api_id,
  109. args=args,
  110. )
  111. return external_knowledge_api.to_dict(), 200
  112. @setup_required
  113. @login_required
  114. @account_initialization_required
  115. def delete(self, external_knowledge_api_id):
  116. external_knowledge_api_id = str(external_knowledge_api_id)
  117. # The role of the current user in the ta table must be admin, owner, or editor
  118. if not current_user.is_editor or current_user.is_dataset_operator:
  119. raise Forbidden()
  120. ExternalDatasetService.delete_external_knowledge_api(current_user.current_tenant_id, external_knowledge_api_id)
  121. return {"result": "success"}, 200
  122. class ExternalApiUseCheckApi(Resource):
  123. @setup_required
  124. @login_required
  125. @account_initialization_required
  126. def get(self, external_knowledge_api_id):
  127. external_knowledge_api_id = str(external_knowledge_api_id)
  128. external_knowledge_api_is_using, count = ExternalDatasetService.external_knowledge_api_use_check(
  129. external_knowledge_api_id
  130. )
  131. return {"is_using": external_knowledge_api_is_using, "count": count}, 200
  132. class ExternalDatasetCreateApi(Resource):
  133. @setup_required
  134. @login_required
  135. @account_initialization_required
  136. def post(self):
  137. # The role of the current user in the ta table must be admin, owner, or editor
  138. if not current_user.is_editor:
  139. raise Forbidden()
  140. parser = reqparse.RequestParser()
  141. parser.add_argument("external_knowledge_api_id", type=str, required=True, nullable=False, location="json")
  142. parser.add_argument("external_knowledge_id", type=str, required=True, nullable=False, location="json")
  143. parser.add_argument(
  144. "name",
  145. nullable=False,
  146. required=True,
  147. help="name is required. Name must be between 1 to 100 characters.",
  148. type=_validate_name,
  149. )
  150. parser.add_argument("description", type=str, required=False, nullable=True, location="json")
  151. parser.add_argument("external_retrieval_model", type=dict, required=False, location="json")
  152. args = parser.parse_args()
  153. # The role of the current user in the ta table must be admin, owner, or editor, or dataset_operator
  154. if not current_user.is_dataset_editor:
  155. raise Forbidden()
  156. try:
  157. dataset = ExternalDatasetService.create_external_dataset(
  158. tenant_id=current_user.current_tenant_id,
  159. user_id=current_user.id,
  160. args=args,
  161. )
  162. except services.errors.dataset.DatasetNameDuplicateError:
  163. raise DatasetNameDuplicateError()
  164. return marshal(dataset, dataset_detail_fields), 201
  165. class ExternalKnowledgeHitTestingApi(Resource):
  166. @setup_required
  167. @login_required
  168. @account_initialization_required
  169. def post(self, dataset_id):
  170. dataset_id_str = str(dataset_id)
  171. dataset = DatasetService.get_dataset(dataset_id_str)
  172. if dataset is None:
  173. raise NotFound("Dataset not found.")
  174. try:
  175. DatasetService.check_dataset_permission(dataset, current_user)
  176. except services.errors.account.NoPermissionError as e:
  177. raise Forbidden(str(e))
  178. parser = reqparse.RequestParser()
  179. parser.add_argument("query", type=str, location="json")
  180. parser.add_argument("external_retrieval_model", type=dict, required=False, location="json")
  181. args = parser.parse_args()
  182. HitTestingService.hit_testing_args_check(args)
  183. try:
  184. response = HitTestingService.external_retrieve(
  185. dataset=dataset,
  186. query=args["query"],
  187. account=current_user,
  188. external_retrieval_model=args["external_retrieval_model"],
  189. )
  190. return response
  191. except Exception as e:
  192. raise InternalServerError(str(e))
  193. class BedrockRetrievalApi(Resource):
  194. # this api is only for internal testing
  195. def post(self):
  196. parser = reqparse.RequestParser()
  197. parser.add_argument("retrieval_setting", nullable=False, required=True, type=dict, location="json")
  198. parser.add_argument(
  199. "query",
  200. nullable=False,
  201. required=True,
  202. type=str,
  203. )
  204. parser.add_argument("knowledge_id", nullable=False, required=True, type=str)
  205. args = parser.parse_args()
  206. # Call the knowledge retrieval service
  207. result = ExternalDatasetTestService.knowledge_retrieval(
  208. args["retrieval_setting"], args["query"], args["knowledge_id"]
  209. )
  210. return result, 200
  211. api.add_resource(ExternalKnowledgeHitTestingApi, "/datasets/<uuid:dataset_id>/external-hit-testing")
  212. api.add_resource(ExternalDatasetCreateApi, "/datasets/external")
  213. api.add_resource(ExternalApiTemplateListApi, "/datasets/external-knowledge-api")
  214. api.add_resource(ExternalApiTemplateApi, "/datasets/external-knowledge-api/<uuid:external_knowledge_api_id>")
  215. api.add_resource(ExternalApiUseCheckApi, "/datasets/external-knowledge-api/<uuid:external_knowledge_api_id>/use-check")
  216. # this api is only for internal test
  217. api.add_resource(BedrockRetrievalApi, "/test/retrieval")