tool_engine.py 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319
  1. import json
  2. from collections.abc import Mapping
  3. from copy import deepcopy
  4. from datetime import UTC, datetime
  5. from mimetypes import guess_type
  6. from typing import Any, Optional, Union
  7. from yarl import URL
  8. from core.app.entities.app_invoke_entities import InvokeFrom
  9. from core.callback_handler.agent_tool_callback_handler import DifyAgentCallbackHandler
  10. from core.callback_handler.workflow_tool_callback_handler import DifyWorkflowCallbackHandler
  11. from core.file import FileType
  12. from core.file.models import FileTransferMethod
  13. from core.ops.ops_trace_manager import TraceQueueManager
  14. from core.tools.entities.tool_entities import ToolInvokeMessage, ToolInvokeMessageBinary, ToolInvokeMeta, ToolParameter
  15. from core.tools.errors import (
  16. ToolEngineInvokeError,
  17. ToolInvokeError,
  18. ToolNotFoundError,
  19. ToolNotSupportedError,
  20. ToolParameterValidationError,
  21. ToolProviderCredentialValidationError,
  22. ToolProviderNotFoundError,
  23. )
  24. from core.tools.tool.tool import Tool
  25. from core.tools.tool.workflow_tool import WorkflowTool
  26. from core.tools.utils.message_transformer import ToolFileMessageTransformer
  27. from extensions.ext_database import db
  28. from models.enums import CreatedByRole
  29. from models.model import Message, MessageFile
  30. class ToolEngine:
  31. """
  32. Tool runtime engine take care of the tool executions.
  33. """
  34. @staticmethod
  35. def agent_invoke(
  36. tool: Tool,
  37. tool_parameters: Union[str, dict],
  38. user_id: str,
  39. tenant_id: str,
  40. message: Message,
  41. invoke_from: InvokeFrom,
  42. agent_tool_callback: DifyAgentCallbackHandler,
  43. trace_manager: Optional[TraceQueueManager] = None,
  44. ) -> tuple[str, list[tuple[MessageFile, bool]], ToolInvokeMeta]:
  45. """
  46. Agent invokes the tool with the given arguments.
  47. """
  48. # check if arguments is a string
  49. if isinstance(tool_parameters, str):
  50. # check if this tool has only one parameter
  51. parameters = [
  52. parameter
  53. for parameter in tool.get_runtime_parameters()
  54. if parameter.form == ToolParameter.ToolParameterForm.LLM
  55. ]
  56. if parameters and len(parameters) == 1:
  57. tool_parameters = {parameters[0].name: tool_parameters}
  58. else:
  59. try:
  60. tool_parameters = json.loads(tool_parameters)
  61. except Exception as e:
  62. pass
  63. if not isinstance(tool_parameters, dict):
  64. raise ValueError(f"tool_parameters should be a dict, but got a string: {tool_parameters}")
  65. # invoke the tool
  66. try:
  67. # hit the callback handler
  68. agent_tool_callback.on_tool_start(tool_name=tool.identity.name, tool_inputs=tool_parameters)
  69. meta, response = ToolEngine._invoke(tool, tool_parameters, user_id)
  70. response = ToolFileMessageTransformer.transform_tool_invoke_messages(
  71. messages=response, user_id=user_id, tenant_id=tenant_id, conversation_id=message.conversation_id
  72. )
  73. # extract binary data from tool invoke message
  74. binary_files = ToolEngine._extract_tool_response_binary(response)
  75. # create message file
  76. message_files = ToolEngine._create_message_files(
  77. tool_messages=binary_files, agent_message=message, invoke_from=invoke_from, user_id=user_id
  78. )
  79. plain_text = ToolEngine._convert_tool_response_to_str(response)
  80. # hit the callback handler
  81. agent_tool_callback.on_tool_end(
  82. tool_name=tool.identity.name,
  83. tool_inputs=tool_parameters,
  84. tool_outputs=plain_text,
  85. message_id=message.id,
  86. trace_manager=trace_manager,
  87. )
  88. # transform tool invoke message to get LLM friendly message
  89. return plain_text, message_files, meta
  90. except ToolProviderCredentialValidationError as e:
  91. error_response = "Please check your tool provider credentials"
  92. agent_tool_callback.on_tool_error(e)
  93. except (ToolNotFoundError, ToolNotSupportedError, ToolProviderNotFoundError) as e:
  94. error_response = f"there is not a tool named {tool.identity.name}"
  95. agent_tool_callback.on_tool_error(e)
  96. except ToolParameterValidationError as e:
  97. error_response = f"tool parameters validation error: {e}, please check your tool parameters"
  98. agent_tool_callback.on_tool_error(e)
  99. except ToolInvokeError as e:
  100. error_response = f"tool invoke error: {e}"
  101. agent_tool_callback.on_tool_error(e)
  102. except ToolEngineInvokeError as e:
  103. meta = e.args[0]
  104. error_response = f"tool invoke error: {meta.error}"
  105. agent_tool_callback.on_tool_error(e)
  106. return error_response, [], meta
  107. except Exception as e:
  108. error_response = f"unknown error: {e}"
  109. agent_tool_callback.on_tool_error(e)
  110. return error_response, [], ToolInvokeMeta.error_instance(error_response)
  111. @staticmethod
  112. def workflow_invoke(
  113. tool: Tool,
  114. tool_parameters: Mapping[str, Any],
  115. user_id: str,
  116. workflow_tool_callback: DifyWorkflowCallbackHandler,
  117. workflow_call_depth: int,
  118. thread_pool_id: Optional[str] = None,
  119. ) -> list[ToolInvokeMessage]:
  120. """
  121. Workflow invokes the tool with the given arguments.
  122. """
  123. try:
  124. # hit the callback handler
  125. assert tool.identity is not None
  126. workflow_tool_callback.on_tool_start(tool_name=tool.identity.name, tool_inputs=tool_parameters)
  127. if isinstance(tool, WorkflowTool):
  128. tool.workflow_call_depth = workflow_call_depth + 1
  129. tool.thread_pool_id = thread_pool_id
  130. if tool.runtime and tool.runtime.runtime_parameters:
  131. tool_parameters = {**tool.runtime.runtime_parameters, **tool_parameters}
  132. response = tool.invoke(user_id=user_id, tool_parameters=tool_parameters)
  133. # hit the callback handler
  134. workflow_tool_callback.on_tool_end(
  135. tool_name=tool.identity.name,
  136. tool_inputs=tool_parameters,
  137. tool_outputs=response,
  138. )
  139. return response
  140. except Exception as e:
  141. workflow_tool_callback.on_tool_error(e)
  142. raise e
  143. @staticmethod
  144. def _invoke(tool: Tool, tool_parameters: dict, user_id: str) -> tuple[ToolInvokeMeta, list[ToolInvokeMessage]]:
  145. """
  146. Invoke the tool with the given arguments.
  147. """
  148. started_at = datetime.now(UTC)
  149. meta = ToolInvokeMeta(
  150. time_cost=0.0,
  151. error=None,
  152. tool_config={
  153. "tool_name": tool.identity.name,
  154. "tool_provider": tool.identity.provider,
  155. "tool_provider_type": tool.tool_provider_type().value,
  156. "tool_parameters": deepcopy(tool.runtime.runtime_parameters),
  157. "tool_icon": tool.identity.icon,
  158. },
  159. )
  160. try:
  161. response = tool.invoke(user_id, tool_parameters)
  162. except Exception as e:
  163. meta.error = str(e)
  164. raise ToolEngineInvokeError(meta)
  165. finally:
  166. ended_at = datetime.now(UTC)
  167. meta.time_cost = (ended_at - started_at).total_seconds()
  168. return meta, response
  169. @staticmethod
  170. def _convert_tool_response_to_str(tool_response: list[ToolInvokeMessage]) -> str:
  171. """
  172. Handle tool response
  173. """
  174. result = ""
  175. for response in tool_response:
  176. if response.type == ToolInvokeMessage.MessageType.TEXT:
  177. result += response.message
  178. elif response.type == ToolInvokeMessage.MessageType.LINK:
  179. result += f"result link: {response.message}. please tell user to check it."
  180. elif response.type in {ToolInvokeMessage.MessageType.IMAGE_LINK, ToolInvokeMessage.MessageType.IMAGE}:
  181. result += (
  182. "image has been created and sent to user already, you do not need to create it,"
  183. " just tell the user to check it now."
  184. )
  185. elif response.type == ToolInvokeMessage.MessageType.JSON:
  186. result += f"tool response: {json.dumps(response.message, ensure_ascii=False)}."
  187. else:
  188. result += f"tool response: {response.message}."
  189. return result
  190. @staticmethod
  191. def _extract_tool_response_binary(tool_response: list[ToolInvokeMessage]) -> list[ToolInvokeMessageBinary]:
  192. """
  193. Extract tool response binary
  194. """
  195. result = []
  196. for response in tool_response:
  197. if response.type in {ToolInvokeMessage.MessageType.IMAGE_LINK, ToolInvokeMessage.MessageType.IMAGE}:
  198. mimetype = None
  199. if response.meta.get("mime_type"):
  200. mimetype = response.meta.get("mime_type")
  201. else:
  202. try:
  203. url = URL(response.message)
  204. extension = url.suffix
  205. guess_type_result, _ = guess_type(f"a{extension}")
  206. if guess_type_result:
  207. mimetype = guess_type_result
  208. except Exception:
  209. pass
  210. if not mimetype:
  211. mimetype = "image/jpeg"
  212. result.append(
  213. ToolInvokeMessageBinary(
  214. mimetype=response.meta.get("mime_type", "image/jpeg"),
  215. url=response.message,
  216. save_as=response.save_as,
  217. )
  218. )
  219. elif response.type == ToolInvokeMessage.MessageType.BLOB:
  220. result.append(
  221. ToolInvokeMessageBinary(
  222. mimetype=response.meta.get("mime_type", "octet/stream"),
  223. url=response.message,
  224. save_as=response.save_as,
  225. )
  226. )
  227. elif response.type == ToolInvokeMessage.MessageType.LINK:
  228. # check if there is a mime type in meta
  229. if response.meta and "mime_type" in response.meta:
  230. result.append(
  231. ToolInvokeMessageBinary(
  232. mimetype=response.meta.get("mime_type", "octet/stream")
  233. if response.meta
  234. else "octet/stream",
  235. url=response.message,
  236. save_as=response.save_as,
  237. )
  238. )
  239. return result
  240. @staticmethod
  241. def _create_message_files(
  242. tool_messages: list[ToolInvokeMessageBinary],
  243. agent_message: Message,
  244. invoke_from: InvokeFrom,
  245. user_id: str,
  246. ) -> list[tuple[Any, str]]:
  247. """
  248. Create message file
  249. :param messages: messages
  250. :return: message files, should save as variable
  251. """
  252. result = []
  253. for message in tool_messages:
  254. if "image" in message.mimetype:
  255. file_type = FileType.IMAGE
  256. elif "video" in message.mimetype:
  257. file_type = FileType.VIDEO
  258. elif "audio" in message.mimetype:
  259. file_type = FileType.AUDIO
  260. elif "text" in message.mimetype or "pdf" in message.mimetype:
  261. file_type = FileType.DOCUMENT
  262. else:
  263. file_type = FileType.CUSTOM
  264. # extract tool file id from url
  265. tool_file_id = message.url.split("/")[-1].split(".")[0]
  266. message_file = MessageFile(
  267. message_id=agent_message.id,
  268. type=file_type,
  269. transfer_method=FileTransferMethod.TOOL_FILE,
  270. belongs_to="assistant",
  271. url=message.url,
  272. upload_file_id=tool_file_id,
  273. created_by_role=(
  274. CreatedByRole.ACCOUNT
  275. if invoke_from in {InvokeFrom.EXPLORE, InvokeFrom.DEBUGGER}
  276. else CreatedByRole.END_USER
  277. ),
  278. created_by=user_id,
  279. )
  280. db.session.add(message_file)
  281. db.session.commit()
  282. db.session.refresh(message_file)
  283. result.append((message_file.id, message.save_as))
  284. db.session.close()
  285. return result