tool_engine.py 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353
  1. import json
  2. from collections.abc import Generator, Iterable
  3. from copy import deepcopy
  4. from datetime import datetime, timezone
  5. from mimetypes import guess_type
  6. from typing import Any, Optional, Union, cast
  7. from yarl import URL
  8. from core.app.entities.app_invoke_entities import InvokeFrom
  9. from core.callback_handler.agent_tool_callback_handler import DifyAgentCallbackHandler
  10. from core.callback_handler.workflow_tool_callback_handler import DifyWorkflowCallbackHandler
  11. from core.file import FileType
  12. from core.file.models import FileTransferMethod
  13. from core.ops.ops_trace_manager import TraceQueueManager
  14. from core.tools.__base.tool import Tool
  15. from core.tools.entities.tool_entities import ToolInvokeMessage, ToolInvokeMessageBinary, ToolInvokeMeta, ToolParameter
  16. from core.tools.errors import (
  17. ToolEngineInvokeError,
  18. ToolInvokeError,
  19. ToolNotFoundError,
  20. ToolNotSupportedError,
  21. ToolParameterValidationError,
  22. ToolProviderCredentialValidationError,
  23. ToolProviderNotFoundError,
  24. )
  25. from core.tools.utils.message_transformer import ToolFileMessageTransformer
  26. from core.tools.workflow_as_tool.tool import WorkflowTool
  27. from extensions.ext_database import db
  28. from models.enums import CreatedByRole
  29. from models.model import Message, MessageFile
  30. class ToolEngine:
  31. """
  32. Tool runtime engine take care of the tool executions.
  33. """
  34. @staticmethod
  35. def agent_invoke(
  36. tool: Tool,
  37. tool_parameters: Union[str, dict],
  38. user_id: str,
  39. tenant_id: str,
  40. message: Message,
  41. invoke_from: InvokeFrom,
  42. agent_tool_callback: DifyAgentCallbackHandler,
  43. trace_manager: Optional[TraceQueueManager] = None,
  44. conversation_id: Optional[str] = None,
  45. app_id: Optional[str] = None,
  46. message_id: Optional[str] = None,
  47. ) -> tuple[str, list[tuple[MessageFile, str]], ToolInvokeMeta]:
  48. """
  49. Agent invokes the tool with the given arguments.
  50. """
  51. # check if arguments is a string
  52. if isinstance(tool_parameters, str):
  53. # check if this tool has only one parameter
  54. parameters = [
  55. parameter
  56. for parameter in tool.get_runtime_parameters() or []
  57. if parameter.form == ToolParameter.ToolParameterForm.LLM
  58. ]
  59. if parameters and len(parameters) == 1:
  60. tool_parameters = {parameters[0].name: tool_parameters}
  61. else:
  62. raise ValueError(f"tool_parameters should be a dict, but got a string: {tool_parameters}")
  63. # invoke the tool
  64. try:
  65. # hit the callback handler
  66. agent_tool_callback.on_tool_start(tool_name=tool.entity.identity.name, tool_inputs=tool_parameters)
  67. messages = ToolEngine._invoke(tool, tool_parameters, user_id, conversation_id, app_id, message_id)
  68. invocation_meta_dict: dict[str, ToolInvokeMeta] = {}
  69. def message_callback(
  70. invocation_meta_dict: dict, messages: Generator[ToolInvokeMessage | ToolInvokeMeta, None, None]
  71. ):
  72. for message in messages:
  73. if isinstance(message, ToolInvokeMeta):
  74. invocation_meta_dict["meta"] = message
  75. else:
  76. yield message
  77. messages = ToolFileMessageTransformer.transform_tool_invoke_messages(
  78. messages=message_callback(invocation_meta_dict, messages),
  79. user_id=user_id,
  80. tenant_id=tenant_id,
  81. conversation_id=message.conversation_id,
  82. )
  83. message_list = list(messages)
  84. # extract binary data from tool invoke message
  85. binary_files = ToolEngine._extract_tool_response_binary_and_text(message_list)
  86. # create message file
  87. message_files = ToolEngine._create_message_files(
  88. tool_messages=binary_files, agent_message=message, invoke_from=invoke_from, user_id=user_id
  89. )
  90. plain_text = ToolEngine._convert_tool_response_to_str(message_list)
  91. meta = invocation_meta_dict["meta"]
  92. # hit the callback handler
  93. agent_tool_callback.on_tool_end(
  94. tool_name=tool.entity.identity.name,
  95. tool_inputs=tool_parameters,
  96. tool_outputs=plain_text,
  97. message_id=message.id,
  98. trace_manager=trace_manager,
  99. )
  100. # transform tool invoke message to get LLM friendly message
  101. return plain_text, message_files, meta
  102. except ToolProviderCredentialValidationError as e:
  103. error_response = "Please check your tool provider credentials"
  104. agent_tool_callback.on_tool_error(e)
  105. except (ToolNotFoundError, ToolNotSupportedError, ToolProviderNotFoundError) as e:
  106. error_response = f"there is not a tool named {tool.entity.identity.name}"
  107. agent_tool_callback.on_tool_error(e)
  108. except ToolParameterValidationError as e:
  109. error_response = f"tool parameters validation error: {e}, please check your tool parameters"
  110. agent_tool_callback.on_tool_error(e)
  111. except ToolInvokeError as e:
  112. error_response = f"tool invoke error: {e}"
  113. agent_tool_callback.on_tool_error(e)
  114. except ToolEngineInvokeError as e:
  115. meta = e.args[0]
  116. error_response = f"tool invoke error: {meta.error}"
  117. agent_tool_callback.on_tool_error(e)
  118. return error_response, [], meta
  119. except Exception as e:
  120. error_response = f"unknown error: {e}"
  121. agent_tool_callback.on_tool_error(e)
  122. return error_response, [], ToolInvokeMeta.error_instance(error_response)
  123. @staticmethod
  124. def generic_invoke(
  125. tool: Tool,
  126. tool_parameters: dict[str, Any],
  127. user_id: str,
  128. workflow_tool_callback: DifyWorkflowCallbackHandler,
  129. workflow_call_depth: int,
  130. thread_pool_id: Optional[str] = None,
  131. conversation_id: Optional[str] = None,
  132. app_id: Optional[str] = None,
  133. message_id: Optional[str] = None,
  134. ) -> Generator[ToolInvokeMessage, None, None]:
  135. """
  136. Workflow invokes the tool with the given arguments.
  137. """
  138. try:
  139. # hit the callback handler
  140. workflow_tool_callback.on_tool_start(tool_name=tool.entity.identity.name, tool_inputs=tool_parameters)
  141. if isinstance(tool, WorkflowTool):
  142. tool.workflow_call_depth = workflow_call_depth + 1
  143. tool.thread_pool_id = thread_pool_id
  144. if tool.runtime and tool.runtime.runtime_parameters:
  145. tool_parameters = {**tool.runtime.runtime_parameters, **tool_parameters}
  146. response = tool.invoke(
  147. user_id=user_id,
  148. tool_parameters=tool_parameters,
  149. conversation_id=conversation_id,
  150. app_id=app_id,
  151. message_id=message_id,
  152. )
  153. # hit the callback handler
  154. response = workflow_tool_callback.on_tool_execution(
  155. tool_name=tool.entity.identity.name,
  156. tool_inputs=tool_parameters,
  157. tool_outputs=response,
  158. )
  159. return response
  160. except Exception as e:
  161. workflow_tool_callback.on_tool_error(e)
  162. raise e
  163. @staticmethod
  164. def _invoke(
  165. tool: Tool,
  166. tool_parameters: dict,
  167. user_id: str,
  168. conversation_id: Optional[str] = None,
  169. app_id: Optional[str] = None,
  170. message_id: Optional[str] = None,
  171. ) -> Generator[ToolInvokeMessage | ToolInvokeMeta, None, None]:
  172. """
  173. Invoke the tool with the given arguments.
  174. """
  175. if not tool.runtime:
  176. raise ValueError("missing runtime in tool")
  177. started_at = datetime.now(timezone.utc)
  178. meta = ToolInvokeMeta(
  179. time_cost=0.0,
  180. error=None,
  181. tool_config={
  182. "tool_name": tool.entity.identity.name,
  183. "tool_provider": tool.entity.identity.provider,
  184. "tool_provider_type": tool.tool_provider_type().value,
  185. "tool_parameters": deepcopy(tool.runtime.runtime_parameters),
  186. "tool_icon": tool.entity.identity.icon,
  187. },
  188. )
  189. try:
  190. yield from tool.invoke(user_id, tool_parameters, conversation_id, app_id, message_id)
  191. except Exception as e:
  192. meta.error = str(e)
  193. raise ToolEngineInvokeError(meta)
  194. finally:
  195. ended_at = datetime.now(timezone.utc)
  196. meta.time_cost = (ended_at - started_at).total_seconds()
  197. yield meta
  198. @staticmethod
  199. def _convert_tool_response_to_str(tool_response: list[ToolInvokeMessage]) -> str:
  200. """
  201. Handle tool response
  202. """
  203. result = ""
  204. for response in tool_response:
  205. if response.type == ToolInvokeMessage.MessageType.TEXT:
  206. result += cast(ToolInvokeMessage.TextMessage, response.message).text
  207. elif response.type == ToolInvokeMessage.MessageType.LINK:
  208. result += (
  209. f"result link: {cast(ToolInvokeMessage.TextMessage, response.message).text}."
  210. + " please tell user to check it."
  211. )
  212. elif response.type in {ToolInvokeMessage.MessageType.IMAGE_LINK, ToolInvokeMessage.MessageType.IMAGE}:
  213. result += (
  214. "image has been created and sent to user already, "
  215. + "you do not need to create it, just tell the user to check it now."
  216. )
  217. elif response.type == ToolInvokeMessage.MessageType.JSON:
  218. text = json.dumps(cast(ToolInvokeMessage.JsonMessage, response.message).json_object, ensure_ascii=False)
  219. result += f"tool response: {text}."
  220. else:
  221. result += f"tool response: {response.message}."
  222. return result
  223. @staticmethod
  224. def _extract_tool_response_binary_and_text(
  225. tool_response: list[ToolInvokeMessage],
  226. ) -> Generator[ToolInvokeMessageBinary, None, None]:
  227. """
  228. Extract tool response binary
  229. """
  230. for response in tool_response:
  231. if response.type in {ToolInvokeMessage.MessageType.IMAGE_LINK, ToolInvokeMessage.MessageType.IMAGE}:
  232. mimetype = None
  233. if not response.meta:
  234. raise ValueError("missing meta data")
  235. if response.meta.get("mime_type"):
  236. mimetype = response.meta.get("mime_type")
  237. else:
  238. try:
  239. url = URL(cast(ToolInvokeMessage.TextMessage, response.message).text)
  240. extension = url.suffix
  241. guess_type_result, _ = guess_type(f"a{extension}")
  242. if guess_type_result:
  243. mimetype = guess_type_result
  244. except Exception:
  245. pass
  246. if not mimetype:
  247. mimetype = "image/jpeg"
  248. yield ToolInvokeMessageBinary(
  249. mimetype=response.meta.get("mime_type", "image/jpeg"),
  250. url=cast(ToolInvokeMessage.TextMessage, response.message).text,
  251. save_as=response.save_as,
  252. )
  253. elif response.type == ToolInvokeMessage.MessageType.BLOB:
  254. if not response.meta:
  255. raise ValueError("missing meta data")
  256. yield ToolInvokeMessageBinary(
  257. mimetype=response.meta.get("mime_type", "octet/stream"),
  258. url=cast(ToolInvokeMessage.TextMessage, response.message).text,
  259. save_as=response.save_as,
  260. )
  261. elif response.type == ToolInvokeMessage.MessageType.LINK:
  262. # check if there is a mime type in meta
  263. if response.meta and "mime_type" in response.meta:
  264. yield ToolInvokeMessageBinary(
  265. mimetype=response.meta.get("mime_type", "octet/stream") if response.meta else "octet/stream",
  266. url=cast(ToolInvokeMessage.TextMessage, response.message).text,
  267. save_as=response.save_as,
  268. )
  269. @staticmethod
  270. def _create_message_files(
  271. tool_messages: Iterable[ToolInvokeMessageBinary],
  272. agent_message: Message,
  273. invoke_from: InvokeFrom,
  274. user_id: str,
  275. ) -> list[tuple[MessageFile, str]]:
  276. """
  277. Create message file
  278. :param messages: messages
  279. :return: message files, should save as variable
  280. """
  281. result = []
  282. for message in tool_messages:
  283. if "image" in message.mimetype:
  284. file_type = FileType.IMAGE
  285. elif "video" in message.mimetype:
  286. file_type = FileType.VIDEO
  287. elif "audio" in message.mimetype:
  288. file_type = FileType.AUDIO
  289. elif "text" in message.mimetype or "pdf" in message.mimetype:
  290. file_type = FileType.DOCUMENT
  291. else:
  292. file_type = FileType.CUSTOM
  293. # extract tool file id from url
  294. tool_file_id = message.url.split("/")[-1].split(".")[0]
  295. message_file = MessageFile(
  296. message_id=agent_message.id,
  297. type=file_type,
  298. transfer_method=FileTransferMethod.TOOL_FILE,
  299. belongs_to="assistant",
  300. url=message.url,
  301. upload_file_id=tool_file_id,
  302. created_by_role=(
  303. CreatedByRole.ACCOUNT
  304. if invoke_from in {InvokeFrom.EXPLORE, InvokeFrom.DEBUGGER}
  305. else CreatedByRole.END_USER
  306. ),
  307. created_by=user_id,
  308. )
  309. db.session.add(message_file)
  310. db.session.commit()
  311. db.session.refresh(message_file)
  312. result.append((message_file.id, message.save_as))
  313. db.session.close()
  314. return result