ops_trace_manager.py 31 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814
  1. import json
  2. import logging
  3. import os
  4. import queue
  5. import threading
  6. import time
  7. from datetime import timedelta
  8. from typing import Any, Optional, Union
  9. from uuid import UUID, uuid4
  10. from flask import current_app
  11. from sqlalchemy import select
  12. from sqlalchemy.orm import Session
  13. from core.helper.encrypter import decrypt_token, encrypt_token, obfuscated_token
  14. from core.ops.entities.config_entity import (
  15. OPS_FILE_PATH,
  16. LangfuseConfig,
  17. LangSmithConfig,
  18. OpikConfig,
  19. TracingProviderEnum,
  20. )
  21. from core.ops.entities.trace_entity import (
  22. DatasetRetrievalTraceInfo,
  23. GenerateNameTraceInfo,
  24. MessageTraceInfo,
  25. ModerationTraceInfo,
  26. SuggestedQuestionTraceInfo,
  27. TaskData,
  28. ToolTraceInfo,
  29. TraceTaskName,
  30. WorkflowTraceInfo,
  31. )
  32. from core.ops.langfuse_trace.langfuse_trace import LangFuseDataTrace
  33. from core.ops.langsmith_trace.langsmith_trace import LangSmithDataTrace
  34. from core.ops.opik_trace.opik_trace import OpikDataTrace
  35. from core.ops.utils import get_message_data
  36. from extensions.ext_database import db
  37. from extensions.ext_storage import storage
  38. from models.model import App, AppModelConfig, Conversation, Message, MessageFile, TraceAppConfig
  39. from models.workflow import WorkflowAppLog, WorkflowRun
  40. from tasks.ops_trace_task import process_trace_tasks
  41. provider_config_map: dict[str, dict[str, Any]] = {
  42. TracingProviderEnum.LANGFUSE.value: {
  43. "config_class": LangfuseConfig,
  44. "secret_keys": ["public_key", "secret_key"],
  45. "other_keys": ["host", "project_key"],
  46. "trace_instance": LangFuseDataTrace,
  47. },
  48. TracingProviderEnum.LANGSMITH.value: {
  49. "config_class": LangSmithConfig,
  50. "secret_keys": ["api_key"],
  51. "other_keys": ["project", "endpoint"],
  52. "trace_instance": LangSmithDataTrace,
  53. },
  54. TracingProviderEnum.OPIK.value: {
  55. "config_class": OpikConfig,
  56. "secret_keys": ["api_key"],
  57. "other_keys": ["project", "url", "workspace"],
  58. "trace_instance": OpikDataTrace,
  59. },
  60. }
  61. class OpsTraceManager:
  62. @classmethod
  63. def encrypt_tracing_config(
  64. cls, tenant_id: str, tracing_provider: str, tracing_config: dict, current_trace_config=None
  65. ):
  66. """
  67. Encrypt tracing config.
  68. :param tenant_id: tenant id
  69. :param tracing_provider: tracing provider
  70. :param tracing_config: tracing config dictionary to be encrypted
  71. :param current_trace_config: current tracing configuration for keeping existing values
  72. :return: encrypted tracing configuration
  73. """
  74. # Get the configuration class and the keys that require encryption
  75. config_class, secret_keys, other_keys = (
  76. provider_config_map[tracing_provider]["config_class"],
  77. provider_config_map[tracing_provider]["secret_keys"],
  78. provider_config_map[tracing_provider]["other_keys"],
  79. )
  80. new_config = {}
  81. # Encrypt necessary keys
  82. for key in secret_keys:
  83. if key in tracing_config:
  84. if "*" in tracing_config[key]:
  85. # If the key contains '*', retain the original value from the current config
  86. new_config[key] = current_trace_config.get(key, tracing_config[key])
  87. else:
  88. # Otherwise, encrypt the key
  89. new_config[key] = encrypt_token(tenant_id, tracing_config[key])
  90. for key in other_keys:
  91. new_config[key] = tracing_config.get(key, "")
  92. # Create a new instance of the config class with the new configuration
  93. encrypted_config = config_class(**new_config)
  94. return encrypted_config.model_dump()
  95. @classmethod
  96. def decrypt_tracing_config(cls, tenant_id: str, tracing_provider: str, tracing_config: dict):
  97. """
  98. Decrypt tracing config
  99. :param tenant_id: tenant id
  100. :param tracing_provider: tracing provider
  101. :param tracing_config: tracing config
  102. :return:
  103. """
  104. config_class, secret_keys, other_keys = (
  105. provider_config_map[tracing_provider]["config_class"],
  106. provider_config_map[tracing_provider]["secret_keys"],
  107. provider_config_map[tracing_provider]["other_keys"],
  108. )
  109. new_config = {}
  110. for key in secret_keys:
  111. if key in tracing_config:
  112. new_config[key] = decrypt_token(tenant_id, tracing_config[key])
  113. for key in other_keys:
  114. new_config[key] = tracing_config.get(key, "")
  115. return config_class(**new_config).model_dump()
  116. @classmethod
  117. def obfuscated_decrypt_token(cls, tracing_provider: str, decrypt_tracing_config: dict):
  118. """
  119. Decrypt tracing config
  120. :param tracing_provider: tracing provider
  121. :param decrypt_tracing_config: tracing config
  122. :return:
  123. """
  124. config_class, secret_keys, other_keys = (
  125. provider_config_map[tracing_provider]["config_class"],
  126. provider_config_map[tracing_provider]["secret_keys"],
  127. provider_config_map[tracing_provider]["other_keys"],
  128. )
  129. new_config = {}
  130. for key in secret_keys:
  131. if key in decrypt_tracing_config:
  132. new_config[key] = obfuscated_token(decrypt_tracing_config[key])
  133. for key in other_keys:
  134. new_config[key] = decrypt_tracing_config.get(key, "")
  135. return config_class(**new_config).model_dump()
  136. @classmethod
  137. def get_decrypted_tracing_config(cls, app_id: str, tracing_provider: str):
  138. """
  139. Get decrypted tracing config
  140. :param app_id: app id
  141. :param tracing_provider: tracing provider
  142. :return:
  143. """
  144. trace_config_data: Optional[TraceAppConfig] = (
  145. db.session.query(TraceAppConfig)
  146. .filter(TraceAppConfig.app_id == app_id, TraceAppConfig.tracing_provider == tracing_provider)
  147. .first()
  148. )
  149. if not trace_config_data:
  150. return None
  151. # decrypt_token
  152. app = db.session.query(App).filter(App.id == app_id).first()
  153. if not app:
  154. raise ValueError("App not found")
  155. tenant_id = app.tenant_id
  156. decrypt_tracing_config = cls.decrypt_tracing_config(
  157. tenant_id, tracing_provider, trace_config_data.tracing_config
  158. )
  159. return decrypt_tracing_config
  160. @classmethod
  161. def get_ops_trace_instance(
  162. cls,
  163. app_id: Optional[Union[UUID, str]] = None,
  164. ):
  165. """
  166. Get ops trace through model config
  167. :param app_id: app_id
  168. :return:
  169. """
  170. if isinstance(app_id, UUID):
  171. app_id = str(app_id)
  172. if app_id is None:
  173. return None
  174. app: Optional[App] = db.session.query(App).filter(App.id == app_id).first()
  175. if app is None:
  176. return None
  177. app_ops_trace_config = json.loads(app.tracing) if app.tracing else None
  178. if app_ops_trace_config is None:
  179. return None
  180. tracing_provider = app_ops_trace_config.get("tracing_provider")
  181. if tracing_provider is None or tracing_provider not in provider_config_map:
  182. return None
  183. # decrypt_token
  184. decrypt_trace_config = cls.get_decrypted_tracing_config(app_id, tracing_provider)
  185. if app_ops_trace_config.get("enabled"):
  186. trace_instance, config_class = (
  187. provider_config_map[tracing_provider]["trace_instance"],
  188. provider_config_map[tracing_provider]["config_class"],
  189. )
  190. if not decrypt_trace_config:
  191. return None
  192. tracing_instance = trace_instance(config_class(**decrypt_trace_config))
  193. return tracing_instance
  194. return None
  195. @classmethod
  196. def get_app_config_through_message_id(cls, message_id: str):
  197. app_model_config = None
  198. message_data = db.session.query(Message).filter(Message.id == message_id).first()
  199. if not message_data:
  200. return None
  201. conversation_id = message_data.conversation_id
  202. conversation_data = db.session.query(Conversation).filter(Conversation.id == conversation_id).first()
  203. if not conversation_data:
  204. return None
  205. if conversation_data.app_model_config_id:
  206. app_model_config = (
  207. db.session.query(AppModelConfig)
  208. .filter(AppModelConfig.id == conversation_data.app_model_config_id)
  209. .first()
  210. )
  211. elif conversation_data.app_model_config_id is None and conversation_data.override_model_configs:
  212. app_model_config = conversation_data.override_model_configs
  213. return app_model_config
  214. @classmethod
  215. def update_app_tracing_config(cls, app_id: str, enabled: bool, tracing_provider: str):
  216. """
  217. Update app tracing config
  218. :param app_id: app id
  219. :param enabled: enabled
  220. :param tracing_provider: tracing provider
  221. :return:
  222. """
  223. # auth check
  224. if tracing_provider not in provider_config_map and tracing_provider is not None:
  225. raise ValueError(f"Invalid tracing provider: {tracing_provider}")
  226. app_config: Optional[App] = db.session.query(App).filter(App.id == app_id).first()
  227. if not app_config:
  228. raise ValueError("App not found")
  229. app_config.tracing = json.dumps(
  230. {
  231. "enabled": enabled,
  232. "tracing_provider": tracing_provider,
  233. }
  234. )
  235. db.session.commit()
  236. @classmethod
  237. def get_app_tracing_config(cls, app_id: str):
  238. """
  239. Get app tracing config
  240. :param app_id: app id
  241. :return:
  242. """
  243. app: Optional[App] = db.session.query(App).filter(App.id == app_id).first()
  244. if not app:
  245. raise ValueError("App not found")
  246. if not app.tracing:
  247. return {"enabled": False, "tracing_provider": None}
  248. app_trace_config = json.loads(app.tracing)
  249. return app_trace_config
  250. @staticmethod
  251. def check_trace_config_is_effective(tracing_config: dict, tracing_provider: str):
  252. """
  253. Check trace config is effective
  254. :param tracing_config: tracing config
  255. :param tracing_provider: tracing provider
  256. :return:
  257. """
  258. config_type, trace_instance = (
  259. provider_config_map[tracing_provider]["config_class"],
  260. provider_config_map[tracing_provider]["trace_instance"],
  261. )
  262. tracing_config = config_type(**tracing_config)
  263. return trace_instance(tracing_config).api_check()
  264. @staticmethod
  265. def get_trace_config_project_key(tracing_config: dict, tracing_provider: str):
  266. """
  267. get trace config is project key
  268. :param tracing_config: tracing config
  269. :param tracing_provider: tracing provider
  270. :return:
  271. """
  272. config_type, trace_instance = (
  273. provider_config_map[tracing_provider]["config_class"],
  274. provider_config_map[tracing_provider]["trace_instance"],
  275. )
  276. tracing_config = config_type(**tracing_config)
  277. return trace_instance(tracing_config).get_project_key()
  278. @staticmethod
  279. def get_trace_config_project_url(tracing_config: dict, tracing_provider: str):
  280. """
  281. get trace config is project key
  282. :param tracing_config: tracing config
  283. :param tracing_provider: tracing provider
  284. :return:
  285. """
  286. config_type, trace_instance = (
  287. provider_config_map[tracing_provider]["config_class"],
  288. provider_config_map[tracing_provider]["trace_instance"],
  289. )
  290. tracing_config = config_type(**tracing_config)
  291. return trace_instance(tracing_config).get_project_url()
  292. class TraceTask:
  293. def __init__(
  294. self,
  295. trace_type: Any,
  296. message_id: Optional[str] = None,
  297. workflow_run: Optional[WorkflowRun] = None,
  298. conversation_id: Optional[str] = None,
  299. user_id: Optional[str] = None,
  300. timer: Optional[Any] = None,
  301. **kwargs,
  302. ):
  303. self.trace_type = trace_type
  304. self.message_id = message_id
  305. self.workflow_run_id = workflow_run.id if workflow_run else None
  306. self.conversation_id = conversation_id
  307. self.user_id = user_id
  308. self.timer = timer
  309. self.file_base_url = os.getenv("FILES_URL", "http://127.0.0.1:5001")
  310. self.app_id = None
  311. self.kwargs = kwargs
  312. def execute(self):
  313. return self.preprocess()
  314. def preprocess(self):
  315. preprocess_map = {
  316. TraceTaskName.CONVERSATION_TRACE: lambda: self.conversation_trace(**self.kwargs),
  317. TraceTaskName.WORKFLOW_TRACE: lambda: self.workflow_trace(
  318. workflow_run_id=self.workflow_run_id, conversation_id=self.conversation_id, user_id=self.user_id
  319. ),
  320. TraceTaskName.MESSAGE_TRACE: lambda: self.message_trace(message_id=self.message_id),
  321. TraceTaskName.MODERATION_TRACE: lambda: self.moderation_trace(
  322. message_id=self.message_id, timer=self.timer, **self.kwargs
  323. ),
  324. TraceTaskName.SUGGESTED_QUESTION_TRACE: lambda: self.suggested_question_trace(
  325. message_id=self.message_id, timer=self.timer, **self.kwargs
  326. ),
  327. TraceTaskName.DATASET_RETRIEVAL_TRACE: lambda: self.dataset_retrieval_trace(
  328. message_id=self.message_id, timer=self.timer, **self.kwargs
  329. ),
  330. TraceTaskName.TOOL_TRACE: lambda: self.tool_trace(
  331. message_id=self.message_id, timer=self.timer, **self.kwargs
  332. ),
  333. TraceTaskName.GENERATE_NAME_TRACE: lambda: self.generate_name_trace(
  334. conversation_id=self.conversation_id, timer=self.timer, **self.kwargs
  335. ),
  336. }
  337. return preprocess_map.get(self.trace_type, lambda: None)()
  338. # process methods for different trace types
  339. def conversation_trace(self, **kwargs):
  340. return kwargs
  341. def workflow_trace(
  342. self,
  343. *,
  344. workflow_run_id: str | None,
  345. conversation_id: str | None,
  346. user_id: str | None,
  347. ):
  348. if not workflow_run_id:
  349. return {}
  350. with Session(db.engine) as session:
  351. workflow_run_stmt = select(WorkflowRun).where(WorkflowRun.id == workflow_run_id)
  352. workflow_run = session.scalars(workflow_run_stmt).first()
  353. if not workflow_run:
  354. raise ValueError("Workflow run not found")
  355. workflow_id = workflow_run.workflow_id
  356. tenant_id = workflow_run.tenant_id
  357. workflow_run_id = workflow_run.id
  358. workflow_run_elapsed_time = workflow_run.elapsed_time
  359. workflow_run_status = workflow_run.status
  360. workflow_run_inputs = workflow_run.inputs_dict
  361. workflow_run_outputs = workflow_run.outputs_dict
  362. workflow_run_version = workflow_run.version
  363. error = workflow_run.error or ""
  364. total_tokens = workflow_run.total_tokens
  365. file_list = workflow_run_inputs.get("sys.file") or []
  366. query = workflow_run_inputs.get("query") or workflow_run_inputs.get("sys.query") or ""
  367. # get workflow_app_log_id
  368. workflow_app_log_data_stmt = select(WorkflowAppLog.id).where(
  369. WorkflowAppLog.tenant_id == tenant_id,
  370. WorkflowAppLog.app_id == workflow_run.app_id,
  371. WorkflowAppLog.workflow_run_id == workflow_run.id,
  372. )
  373. workflow_app_log_id = session.scalar(workflow_app_log_data_stmt)
  374. # get message_id
  375. message_id = None
  376. if conversation_id:
  377. message_data_stmt = select(Message.id).where(
  378. Message.conversation_id == conversation_id,
  379. Message.workflow_run_id == workflow_run_id,
  380. )
  381. message_id = session.scalar(message_data_stmt)
  382. metadata = {
  383. "workflow_id": workflow_id,
  384. "conversation_id": conversation_id,
  385. "workflow_run_id": workflow_run_id,
  386. "tenant_id": tenant_id,
  387. "elapsed_time": workflow_run_elapsed_time,
  388. "status": workflow_run_status,
  389. "version": workflow_run_version,
  390. "total_tokens": total_tokens,
  391. "file_list": file_list,
  392. "triggered_form": workflow_run.triggered_from,
  393. "user_id": user_id,
  394. }
  395. workflow_trace_info = WorkflowTraceInfo(
  396. workflow_data=workflow_run.to_dict(),
  397. conversation_id=conversation_id,
  398. workflow_id=workflow_id,
  399. tenant_id=tenant_id,
  400. workflow_run_id=workflow_run_id,
  401. workflow_run_elapsed_time=workflow_run_elapsed_time,
  402. workflow_run_status=workflow_run_status,
  403. workflow_run_inputs=workflow_run_inputs,
  404. workflow_run_outputs=workflow_run_outputs,
  405. workflow_run_version=workflow_run_version,
  406. error=error,
  407. total_tokens=total_tokens,
  408. file_list=file_list,
  409. query=query,
  410. metadata=metadata,
  411. workflow_app_log_id=workflow_app_log_id,
  412. message_id=message_id,
  413. start_time=workflow_run.created_at,
  414. end_time=workflow_run.finished_at,
  415. )
  416. return workflow_trace_info
  417. def message_trace(self, message_id: str | None):
  418. if not message_id:
  419. return {}
  420. message_data = get_message_data(message_id)
  421. if not message_data:
  422. return {}
  423. conversation_mode_stmt = select(Conversation.mode).where(Conversation.id == message_data.conversation_id)
  424. conversation_mode = db.session.scalars(conversation_mode_stmt).all()
  425. if not conversation_mode or len(conversation_mode) == 0:
  426. return {}
  427. conversation_mode = conversation_mode[0]
  428. created_at = message_data.created_at
  429. inputs = message_data.message
  430. # get message file data
  431. message_file_data = db.session.query(MessageFile).filter_by(message_id=message_id).first()
  432. file_list = []
  433. if message_file_data and message_file_data.url is not None:
  434. file_url = f"{self.file_base_url}/{message_file_data.url}" if message_file_data else ""
  435. file_list.append(file_url)
  436. metadata = {
  437. "conversation_id": message_data.conversation_id,
  438. "ls_provider": message_data.model_provider,
  439. "ls_model_name": message_data.model_id,
  440. "status": message_data.status,
  441. "from_end_user_id": message_data.from_end_user_id,
  442. "from_account_id": message_data.from_account_id,
  443. "agent_based": message_data.agent_based,
  444. "workflow_run_id": message_data.workflow_run_id,
  445. "from_source": message_data.from_source,
  446. "message_id": message_id,
  447. }
  448. message_tokens = message_data.message_tokens
  449. message_trace_info = MessageTraceInfo(
  450. message_id=message_id,
  451. message_data=message_data.to_dict(),
  452. conversation_model=conversation_mode,
  453. message_tokens=message_tokens,
  454. answer_tokens=message_data.answer_tokens,
  455. total_tokens=message_tokens + message_data.answer_tokens,
  456. error=message_data.error or "",
  457. inputs=inputs,
  458. outputs=message_data.answer,
  459. file_list=file_list,
  460. start_time=created_at,
  461. end_time=created_at + timedelta(seconds=message_data.provider_response_latency),
  462. metadata=metadata,
  463. message_file_data=message_file_data,
  464. conversation_mode=conversation_mode,
  465. )
  466. return message_trace_info
  467. def moderation_trace(self, message_id, timer, **kwargs):
  468. moderation_result = kwargs.get("moderation_result")
  469. if not moderation_result:
  470. return {}
  471. inputs = kwargs.get("inputs")
  472. message_data = get_message_data(message_id)
  473. if not message_data:
  474. return {}
  475. metadata = {
  476. "message_id": message_id,
  477. "action": moderation_result.action,
  478. "preset_response": moderation_result.preset_response,
  479. "query": moderation_result.query,
  480. }
  481. # get workflow_app_log_id
  482. workflow_app_log_id = None
  483. if message_data.workflow_run_id:
  484. workflow_app_log_data = (
  485. db.session.query(WorkflowAppLog).filter_by(workflow_run_id=message_data.workflow_run_id).first()
  486. )
  487. workflow_app_log_id = str(workflow_app_log_data.id) if workflow_app_log_data else None
  488. moderation_trace_info = ModerationTraceInfo(
  489. message_id=workflow_app_log_id or message_id,
  490. inputs=inputs,
  491. message_data=message_data.to_dict(),
  492. flagged=moderation_result.flagged,
  493. action=moderation_result.action,
  494. preset_response=moderation_result.preset_response,
  495. query=moderation_result.query,
  496. start_time=timer.get("start"),
  497. end_time=timer.get("end"),
  498. metadata=metadata,
  499. )
  500. return moderation_trace_info
  501. def suggested_question_trace(self, message_id, timer, **kwargs):
  502. suggested_question = kwargs.get("suggested_question", [])
  503. message_data = get_message_data(message_id)
  504. if not message_data:
  505. return {}
  506. metadata = {
  507. "message_id": message_id,
  508. "ls_provider": message_data.model_provider,
  509. "ls_model_name": message_data.model_id,
  510. "status": message_data.status,
  511. "from_end_user_id": message_data.from_end_user_id,
  512. "from_account_id": message_data.from_account_id,
  513. "agent_based": message_data.agent_based,
  514. "workflow_run_id": message_data.workflow_run_id,
  515. "from_source": message_data.from_source,
  516. }
  517. # get workflow_app_log_id
  518. workflow_app_log_id = None
  519. if message_data.workflow_run_id:
  520. workflow_app_log_data = (
  521. db.session.query(WorkflowAppLog).filter_by(workflow_run_id=message_data.workflow_run_id).first()
  522. )
  523. workflow_app_log_id = str(workflow_app_log_data.id) if workflow_app_log_data else None
  524. suggested_question_trace_info = SuggestedQuestionTraceInfo(
  525. message_id=workflow_app_log_id or message_id,
  526. message_data=message_data.to_dict(),
  527. inputs=message_data.message,
  528. outputs=message_data.answer,
  529. start_time=timer.get("start"),
  530. end_time=timer.get("end"),
  531. metadata=metadata,
  532. total_tokens=message_data.message_tokens + message_data.answer_tokens,
  533. status=message_data.status,
  534. error=message_data.error,
  535. from_account_id=message_data.from_account_id,
  536. agent_based=message_data.agent_based,
  537. from_source=message_data.from_source,
  538. model_provider=message_data.model_provider,
  539. model_id=message_data.model_id,
  540. suggested_question=suggested_question,
  541. level=message_data.status,
  542. status_message=message_data.error,
  543. )
  544. return suggested_question_trace_info
  545. def dataset_retrieval_trace(self, message_id, timer, **kwargs):
  546. documents = kwargs.get("documents")
  547. message_data = get_message_data(message_id)
  548. if not message_data:
  549. return {}
  550. metadata = {
  551. "message_id": message_id,
  552. "ls_provider": message_data.model_provider,
  553. "ls_model_name": message_data.model_id,
  554. "status": message_data.status,
  555. "from_end_user_id": message_data.from_end_user_id,
  556. "from_account_id": message_data.from_account_id,
  557. "agent_based": message_data.agent_based,
  558. "workflow_run_id": message_data.workflow_run_id,
  559. "from_source": message_data.from_source,
  560. }
  561. dataset_retrieval_trace_info = DatasetRetrievalTraceInfo(
  562. message_id=message_id,
  563. inputs=message_data.query or message_data.inputs,
  564. documents=[doc.model_dump() for doc in documents] if documents else [],
  565. start_time=timer.get("start"),
  566. end_time=timer.get("end"),
  567. metadata=metadata,
  568. message_data=message_data.to_dict(),
  569. )
  570. return dataset_retrieval_trace_info
  571. def tool_trace(self, message_id, timer, **kwargs):
  572. tool_name = kwargs.get("tool_name", "")
  573. tool_inputs = kwargs.get("tool_inputs", {})
  574. tool_outputs = kwargs.get("tool_outputs", {})
  575. message_data = get_message_data(message_id)
  576. if not message_data:
  577. return {}
  578. tool_config = {}
  579. time_cost = 0
  580. error = None
  581. tool_parameters = {}
  582. created_time = message_data.created_at
  583. end_time = message_data.updated_at
  584. agent_thoughts = message_data.agent_thoughts
  585. for agent_thought in agent_thoughts:
  586. if tool_name in agent_thought.tools:
  587. created_time = agent_thought.created_at
  588. tool_meta_data = agent_thought.tool_meta.get(tool_name, {})
  589. tool_config = tool_meta_data.get("tool_config", {})
  590. time_cost = tool_meta_data.get("time_cost", 0)
  591. end_time = created_time + timedelta(seconds=time_cost)
  592. error = tool_meta_data.get("error", "")
  593. tool_parameters = tool_meta_data.get("tool_parameters", {})
  594. metadata = {
  595. "message_id": message_id,
  596. "tool_name": tool_name,
  597. "tool_inputs": tool_inputs,
  598. "tool_outputs": tool_outputs,
  599. "tool_config": tool_config,
  600. "time_cost": time_cost,
  601. "error": error,
  602. "tool_parameters": tool_parameters,
  603. }
  604. file_url = ""
  605. message_file_data = db.session.query(MessageFile).filter_by(message_id=message_id).first()
  606. if message_file_data:
  607. message_file_id = message_file_data.id if message_file_data else None
  608. type = message_file_data.type
  609. created_by_role = message_file_data.created_by_role
  610. created_user_id = message_file_data.created_by
  611. file_url = f"{self.file_base_url}/{message_file_data.url}"
  612. metadata.update(
  613. {
  614. "message_file_id": message_file_id,
  615. "created_by_role": created_by_role,
  616. "created_user_id": created_user_id,
  617. "type": type,
  618. }
  619. )
  620. tool_trace_info = ToolTraceInfo(
  621. message_id=message_id,
  622. message_data=message_data.to_dict(),
  623. tool_name=tool_name,
  624. start_time=timer.get("start") if timer else created_time,
  625. end_time=timer.get("end") if timer else end_time,
  626. tool_inputs=tool_inputs,
  627. tool_outputs=tool_outputs,
  628. metadata=metadata,
  629. message_file_data=message_file_data,
  630. error=error,
  631. inputs=message_data.message,
  632. outputs=message_data.answer,
  633. tool_config=tool_config,
  634. time_cost=time_cost,
  635. tool_parameters=tool_parameters,
  636. file_url=file_url,
  637. )
  638. return tool_trace_info
  639. def generate_name_trace(self, conversation_id, timer, **kwargs):
  640. generate_conversation_name = kwargs.get("generate_conversation_name")
  641. inputs = kwargs.get("inputs")
  642. tenant_id = kwargs.get("tenant_id")
  643. if not tenant_id:
  644. return {}
  645. start_time = timer.get("start")
  646. end_time = timer.get("end")
  647. metadata = {
  648. "conversation_id": conversation_id,
  649. "tenant_id": tenant_id,
  650. }
  651. generate_name_trace_info = GenerateNameTraceInfo(
  652. conversation_id=conversation_id,
  653. inputs=inputs,
  654. outputs=generate_conversation_name,
  655. start_time=start_time,
  656. end_time=end_time,
  657. metadata=metadata,
  658. tenant_id=tenant_id,
  659. )
  660. return generate_name_trace_info
  661. trace_manager_timer: Optional[threading.Timer] = None
  662. trace_manager_queue: queue.Queue = queue.Queue()
  663. trace_manager_interval = int(os.getenv("TRACE_QUEUE_MANAGER_INTERVAL", 5))
  664. trace_manager_batch_size = int(os.getenv("TRACE_QUEUE_MANAGER_BATCH_SIZE", 100))
  665. class TraceQueueManager:
  666. def __init__(self, app_id=None, user_id=None):
  667. global trace_manager_timer
  668. self.app_id = app_id
  669. self.user_id = user_id
  670. self.trace_instance = OpsTraceManager.get_ops_trace_instance(app_id)
  671. self.flask_app = current_app._get_current_object() # type: ignore
  672. if trace_manager_timer is None:
  673. self.start_timer()
  674. def add_trace_task(self, trace_task: TraceTask):
  675. global trace_manager_timer, trace_manager_queue
  676. try:
  677. if self.trace_instance:
  678. trace_task.app_id = self.app_id
  679. trace_manager_queue.put(trace_task)
  680. except Exception as e:
  681. logging.exception(f"Error adding trace task, trace_type {trace_task.trace_type}")
  682. finally:
  683. self.start_timer()
  684. def collect_tasks(self):
  685. global trace_manager_queue
  686. tasks: list[TraceTask] = []
  687. while len(tasks) < trace_manager_batch_size and not trace_manager_queue.empty():
  688. task = trace_manager_queue.get_nowait()
  689. tasks.append(task)
  690. trace_manager_queue.task_done()
  691. return tasks
  692. def run(self):
  693. try:
  694. tasks = self.collect_tasks()
  695. if tasks:
  696. self.send_to_celery(tasks)
  697. except Exception as e:
  698. logging.exception("Error processing trace tasks")
  699. def start_timer(self):
  700. global trace_manager_timer
  701. if trace_manager_timer is None or not trace_manager_timer.is_alive():
  702. trace_manager_timer = threading.Timer(trace_manager_interval, self.run)
  703. trace_manager_timer.name = f"trace_manager_timer_{time.strftime('%Y-%m-%d %H:%M:%S', time.localtime())}"
  704. trace_manager_timer.daemon = False
  705. trace_manager_timer.start()
  706. def send_to_celery(self, tasks: list[TraceTask]):
  707. with self.flask_app.app_context():
  708. for task in tasks:
  709. if task.app_id is None:
  710. continue
  711. file_id = uuid4().hex
  712. trace_info = task.execute()
  713. task_data = TaskData(
  714. app_id=task.app_id,
  715. trace_info_type=type(trace_info).__name__,
  716. trace_info=trace_info.model_dump() if trace_info else None,
  717. )
  718. file_path = f"{OPS_FILE_PATH}{task.app_id}/{file_id}.json"
  719. storage.save(file_path, task_data.model_dump_json().encode("utf-8"))
  720. file_info = {
  721. "file_id": file_id,
  722. "app_id": task.app_id,
  723. }
  724. process_trace_tasks.delay(file_info)