tool_engine.py 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327
  1. import json
  2. from collections.abc import Generator, Iterable
  3. from copy import deepcopy
  4. from datetime import datetime, timezone
  5. from mimetypes import guess_type
  6. from typing import Any, Optional, Union, cast
  7. from yarl import URL
  8. from core.app.entities.app_invoke_entities import InvokeFrom
  9. from core.callback_handler.agent_tool_callback_handler import DifyAgentCallbackHandler
  10. from core.callback_handler.workflow_tool_callback_handler import DifyWorkflowCallbackHandler
  11. from core.file.file_obj import FileTransferMethod
  12. from core.ops.ops_trace_manager import TraceQueueManager
  13. from core.tools.__base.tool import Tool
  14. from core.tools.entities.tool_entities import ToolInvokeMessage, ToolInvokeMessageBinary, ToolInvokeMeta, ToolParameter
  15. from core.tools.errors import (
  16. ToolEngineInvokeError,
  17. ToolInvokeError,
  18. ToolNotFoundError,
  19. ToolNotSupportedError,
  20. ToolParameterValidationError,
  21. ToolProviderCredentialValidationError,
  22. ToolProviderNotFoundError,
  23. )
  24. from core.tools.utils.message_transformer import ToolFileMessageTransformer
  25. from core.tools.workflow_as_tool.tool import WorkflowTool
  26. from extensions.ext_database import db
  27. from models.model import Message, MessageFile
  28. class ToolEngine:
  29. """
  30. Tool runtime engine take care of the tool executions.
  31. """
  32. @staticmethod
  33. def agent_invoke(
  34. tool: Tool,
  35. tool_parameters: Union[str, dict],
  36. user_id: str,
  37. tenant_id: str,
  38. message: Message,
  39. invoke_from: InvokeFrom,
  40. agent_tool_callback: DifyAgentCallbackHandler,
  41. trace_manager: Optional[TraceQueueManager] = None,
  42. ) -> tuple[str, list[tuple[MessageFile, str]], ToolInvokeMeta]:
  43. """
  44. Agent invokes the tool with the given arguments.
  45. """
  46. # check if arguments is a string
  47. if isinstance(tool_parameters, str):
  48. # check if this tool has only one parameter
  49. parameters = [
  50. parameter
  51. for parameter in tool.get_runtime_parameters() or []
  52. if parameter.form == ToolParameter.ToolParameterForm.LLM
  53. ]
  54. if parameters and len(parameters) == 1:
  55. tool_parameters = {parameters[0].name: tool_parameters}
  56. else:
  57. raise ValueError(f"tool_parameters should be a dict, but got a string: {tool_parameters}")
  58. # invoke the tool
  59. try:
  60. # hit the callback handler
  61. agent_tool_callback.on_tool_start(tool_name=tool.entity.identity.name, tool_inputs=tool_parameters)
  62. messages = ToolEngine._invoke(tool, tool_parameters, user_id)
  63. invocation_meta_dict: dict[str, ToolInvokeMeta] = {}
  64. def message_callback(
  65. invocation_meta_dict: dict, messages: Generator[ToolInvokeMessage | ToolInvokeMeta, None, None]
  66. ):
  67. for message in messages:
  68. if isinstance(message, ToolInvokeMeta):
  69. invocation_meta_dict["meta"] = message
  70. else:
  71. yield message
  72. messages = ToolFileMessageTransformer.transform_tool_invoke_messages(
  73. messages=message_callback(invocation_meta_dict, messages),
  74. user_id=user_id,
  75. tenant_id=tenant_id,
  76. conversation_id=message.conversation_id,
  77. )
  78. # extract binary data from tool invoke message
  79. binary_files = ToolEngine._extract_tool_response_binary(messages)
  80. # create message file
  81. message_files = ToolEngine._create_message_files(
  82. tool_messages=binary_files, agent_message=message, invoke_from=invoke_from, user_id=user_id
  83. )
  84. plain_text = ToolEngine._convert_tool_response_to_str(messages)
  85. meta = invocation_meta_dict["meta"]
  86. # hit the callback handler
  87. agent_tool_callback.on_tool_end(
  88. tool_name=tool.entity.identity.name,
  89. tool_inputs=tool_parameters,
  90. tool_outputs=plain_text,
  91. message_id=message.id,
  92. trace_manager=trace_manager,
  93. )
  94. # transform tool invoke message to get LLM friendly message
  95. return plain_text, message_files, meta
  96. except ToolProviderCredentialValidationError as e:
  97. error_response = "Please check your tool provider credentials"
  98. agent_tool_callback.on_tool_error(e)
  99. except (ToolNotFoundError, ToolNotSupportedError, ToolProviderNotFoundError) as e:
  100. error_response = f"there is not a tool named {tool.entity.identity.name}"
  101. agent_tool_callback.on_tool_error(e)
  102. except ToolParameterValidationError as e:
  103. error_response = f"tool parameters validation error: {e}, please check your tool parameters"
  104. agent_tool_callback.on_tool_error(e)
  105. except ToolInvokeError as e:
  106. error_response = f"tool invoke error: {e}"
  107. agent_tool_callback.on_tool_error(e)
  108. except ToolEngineInvokeError as e:
  109. meta = e.args[0]
  110. error_response = f"tool invoke error: {meta.error}"
  111. agent_tool_callback.on_tool_error(e)
  112. return error_response, [], meta
  113. except Exception as e:
  114. error_response = f"unknown error: {e}"
  115. agent_tool_callback.on_tool_error(e)
  116. return error_response, [], ToolInvokeMeta.error_instance(error_response)
  117. @staticmethod
  118. def workflow_invoke(
  119. tool: Tool,
  120. tool_parameters: dict[str, Any],
  121. user_id: str,
  122. workflow_tool_callback: DifyWorkflowCallbackHandler,
  123. workflow_call_depth: int,
  124. thread_pool_id: Optional[str] = None,
  125. ) -> Generator[ToolInvokeMessage, None, None]:
  126. """
  127. Workflow invokes the tool with the given arguments.
  128. """
  129. try:
  130. # hit the callback handler
  131. workflow_tool_callback.on_tool_start(tool_name=tool.entity.identity.name, tool_inputs=tool_parameters)
  132. if isinstance(tool, WorkflowTool):
  133. tool.workflow_call_depth = workflow_call_depth + 1
  134. tool.thread_pool_id = thread_pool_id
  135. if tool.runtime and tool.runtime.runtime_parameters:
  136. tool_parameters = {**tool.runtime.runtime_parameters, **tool_parameters}
  137. response = tool.invoke(user_id=user_id, tool_parameters=tool_parameters)
  138. # hit the callback handler
  139. response = workflow_tool_callback.on_tool_execution(
  140. tool_name=tool.entity.identity.name,
  141. tool_inputs=tool_parameters,
  142. tool_outputs=response,
  143. )
  144. return response
  145. except Exception as e:
  146. workflow_tool_callback.on_tool_error(e)
  147. raise e
  148. @staticmethod
  149. def _invoke(
  150. tool: Tool, tool_parameters: dict, user_id: str
  151. ) -> Generator[ToolInvokeMessage | ToolInvokeMeta, None, None]:
  152. """
  153. Invoke the tool with the given arguments.
  154. """
  155. if not tool.runtime:
  156. raise ValueError("missing runtime in tool")
  157. started_at = datetime.now(timezone.utc)
  158. meta = ToolInvokeMeta(
  159. time_cost=0.0,
  160. error=None,
  161. tool_config={
  162. "tool_name": tool.entity.identity.name,
  163. "tool_provider": tool.entity.identity.provider,
  164. "tool_provider_type": tool.tool_provider_type().value,
  165. "tool_parameters": deepcopy(tool.runtime.runtime_parameters),
  166. "tool_icon": tool.entity.identity.icon,
  167. },
  168. )
  169. try:
  170. yield from tool.invoke(user_id, tool_parameters)
  171. except Exception as e:
  172. meta.error = str(e)
  173. raise ToolEngineInvokeError(meta)
  174. finally:
  175. ended_at = datetime.now(timezone.utc)
  176. meta.time_cost = (ended_at - started_at).total_seconds()
  177. yield meta
  178. @staticmethod
  179. def _convert_tool_response_to_str(tool_response: Generator[ToolInvokeMessage, None, None]) -> str:
  180. """
  181. Handle tool response
  182. """
  183. result = ""
  184. for response in tool_response:
  185. if response.type == ToolInvokeMessage.MessageType.TEXT:
  186. result += cast(ToolInvokeMessage.TextMessage, response.message).text
  187. elif response.type == ToolInvokeMessage.MessageType.LINK:
  188. result += (
  189. f"result link: {cast(ToolInvokeMessage.TextMessage, response.message).text}."
  190. + " please tell user to check it."
  191. )
  192. elif response.type in {ToolInvokeMessage.MessageType.IMAGE_LINK, ToolInvokeMessage.MessageType.IMAGE}:
  193. result += (
  194. "image has been created and sent to user already, "
  195. + "you do not need to create it, just tell the user to check it now."
  196. )
  197. elif response.type == ToolInvokeMessage.MessageType.JSON:
  198. text = json.dumps(cast(ToolInvokeMessage.JsonMessage, response.message).json_object, ensure_ascii=False)
  199. result += f"tool response: {text}."
  200. else:
  201. result += f"tool response: {response.message}."
  202. return result
  203. @staticmethod
  204. def _extract_tool_response_binary(
  205. tool_response: Generator[ToolInvokeMessage, None, None],
  206. ) -> Generator[ToolInvokeMessageBinary, None, None]:
  207. """
  208. Extract tool response binary
  209. """
  210. for response in tool_response:
  211. if response.type in {ToolInvokeMessage.MessageType.IMAGE_LINK, ToolInvokeMessage.MessageType.IMAGE}:
  212. mimetype = None
  213. if not response.meta:
  214. raise ValueError("missing meta data")
  215. if response.meta.get("mime_type"):
  216. mimetype = response.meta.get("mime_type")
  217. else:
  218. try:
  219. url = URL(cast(ToolInvokeMessage.TextMessage, response.message).text)
  220. extension = url.suffix
  221. guess_type_result, _ = guess_type(f"a{extension}")
  222. if guess_type_result:
  223. mimetype = guess_type_result
  224. except Exception:
  225. pass
  226. if not mimetype:
  227. mimetype = "image/jpeg"
  228. yield ToolInvokeMessageBinary(
  229. mimetype=response.meta.get("mime_type", "image/jpeg"),
  230. url=cast(ToolInvokeMessage.TextMessage, response.message).text,
  231. save_as=response.save_as,
  232. )
  233. elif response.type == ToolInvokeMessage.MessageType.BLOB:
  234. if not response.meta:
  235. raise ValueError("missing meta data")
  236. yield ToolInvokeMessageBinary(
  237. mimetype=response.meta.get("mime_type", "octet/stream"),
  238. url=cast(ToolInvokeMessage.TextMessage, response.message).text,
  239. save_as=response.save_as,
  240. )
  241. elif response.type == ToolInvokeMessage.MessageType.LINK:
  242. # check if there is a mime type in meta
  243. if response.meta and "mime_type" in response.meta:
  244. yield ToolInvokeMessageBinary(
  245. mimetype=response.meta.get("mime_type", "octet/stream") if response.meta else "octet/stream",
  246. url=cast(ToolInvokeMessage.TextMessage, response.message).text,
  247. save_as=response.save_as,
  248. )
  249. @staticmethod
  250. def _create_message_files(
  251. tool_messages: Iterable[ToolInvokeMessageBinary], agent_message: Message, invoke_from: InvokeFrom, user_id: str
  252. ) -> list[tuple[MessageFile, str]]:
  253. """
  254. Create message file
  255. :param messages: messages
  256. :return: message files, should save as variable
  257. """
  258. result = []
  259. for message in tool_messages:
  260. file_type = "bin"
  261. if "image" in message.mimetype:
  262. file_type = "image"
  263. elif "video" in message.mimetype:
  264. file_type = "video"
  265. elif "audio" in message.mimetype:
  266. file_type = "audio"
  267. elif "text" in message.mimetype:
  268. file_type = "text"
  269. elif "pdf" in message.mimetype:
  270. file_type = "pdf"
  271. elif "zip" in message.mimetype:
  272. file_type = "archive"
  273. # ...
  274. message_file = MessageFile(
  275. message_id=agent_message.id,
  276. type=file_type,
  277. transfer_method=FileTransferMethod.TOOL_FILE.value,
  278. belongs_to="assistant",
  279. url=message.url,
  280. upload_file_id=None,
  281. created_by_role=("account" if invoke_from in {InvokeFrom.EXPLORE, InvokeFrom.DEBUGGER} else "end_user"),
  282. created_by=user_id,
  283. )
  284. db.session.add(message_file)
  285. db.session.commit()
  286. db.session.refresh(message_file)
  287. result.append((message_file.id, message.save_as))
  288. db.session.close()
  289. return result