arq.py 7.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237
  1. import sys
  2. import sentry_sdk
  3. from sentry_sdk.consts import OP, SPANSTATUS
  4. from sentry_sdk.integrations import _check_minimum_version, DidNotEnable, Integration
  5. from sentry_sdk.integrations.logging import ignore_logger
  6. from sentry_sdk.scope import should_send_default_pii
  7. from sentry_sdk.tracing import Transaction, TransactionSource
  8. from sentry_sdk.utils import (
  9. capture_internal_exceptions,
  10. ensure_integration_enabled,
  11. event_from_exception,
  12. SENSITIVE_DATA_SUBSTITUTE,
  13. parse_version,
  14. reraise,
  15. )
  16. try:
  17. import arq.worker
  18. from arq.version import VERSION as ARQ_VERSION
  19. from arq.connections import ArqRedis
  20. from arq.worker import JobExecutionFailed, Retry, RetryJob, Worker
  21. except ImportError:
  22. raise DidNotEnable("Arq is not installed")
  23. from typing import TYPE_CHECKING
  24. if TYPE_CHECKING:
  25. from typing import Any, Dict, Optional, Union
  26. from sentry_sdk._types import EventProcessor, Event, ExcInfo, Hint
  27. from arq.cron import CronJob
  28. from arq.jobs import Job
  29. from arq.typing import WorkerCoroutine
  30. from arq.worker import Function
# Exception types imported from arq.worker that `_capture_exception` treats as
# control flow: when one is raised while a transaction is active, the
# transaction status is set to "aborted" and no error event is captured.
ARQ_CONTROL_FLOW_EXCEPTIONS = (JobExecutionFailed, Retry, RetryJob)
  32. class ArqIntegration(Integration):
  33. identifier = "arq"
  34. origin = f"auto.queue.{identifier}"
  35. @staticmethod
  36. def setup_once() -> None:
  37. try:
  38. if isinstance(ARQ_VERSION, str):
  39. version = parse_version(ARQ_VERSION)
  40. else:
  41. version = ARQ_VERSION.version[:2]
  42. except (TypeError, ValueError):
  43. version = None
  44. _check_minimum_version(ArqIntegration, version)
  45. patch_enqueue_job()
  46. patch_run_job()
  47. patch_create_worker()
  48. ignore_logger("arq.worker")
  49. def patch_enqueue_job() -> None:
  50. old_enqueue_job = ArqRedis.enqueue_job
  51. original_kwdefaults = old_enqueue_job.__kwdefaults__
  52. async def _sentry_enqueue_job(
  53. self: "ArqRedis", function: str, *args: "Any", **kwargs: "Any"
  54. ) -> "Optional[Job]":
  55. integration = sentry_sdk.get_client().get_integration(ArqIntegration)
  56. if integration is None:
  57. return await old_enqueue_job(self, function, *args, **kwargs)
  58. with sentry_sdk.start_span(
  59. op=OP.QUEUE_SUBMIT_ARQ, name=function, origin=ArqIntegration.origin
  60. ):
  61. return await old_enqueue_job(self, function, *args, **kwargs)
  62. _sentry_enqueue_job.__kwdefaults__ = original_kwdefaults
  63. ArqRedis.enqueue_job = _sentry_enqueue_job
  64. def patch_run_job() -> None:
  65. old_run_job = Worker.run_job
  66. async def _sentry_run_job(self: "Worker", job_id: str, score: int) -> None:
  67. integration = sentry_sdk.get_client().get_integration(ArqIntegration)
  68. if integration is None:
  69. return await old_run_job(self, job_id, score)
  70. with sentry_sdk.isolation_scope() as scope:
  71. scope._name = "arq"
  72. scope.clear_breadcrumbs()
  73. transaction = Transaction(
  74. name="unknown arq task",
  75. status="ok",
  76. op=OP.QUEUE_TASK_ARQ,
  77. source=TransactionSource.TASK,
  78. origin=ArqIntegration.origin,
  79. )
  80. with sentry_sdk.start_transaction(transaction):
  81. return await old_run_job(self, job_id, score)
  82. Worker.run_job = _sentry_run_job
  83. def _capture_exception(exc_info: "ExcInfo") -> None:
  84. scope = sentry_sdk.get_current_scope()
  85. if scope.transaction is not None:
  86. if exc_info[0] in ARQ_CONTROL_FLOW_EXCEPTIONS:
  87. scope.transaction.set_status(SPANSTATUS.ABORTED)
  88. return
  89. scope.transaction.set_status(SPANSTATUS.INTERNAL_ERROR)
  90. event, hint = event_from_exception(
  91. exc_info,
  92. client_options=sentry_sdk.get_client().options,
  93. mechanism={"type": ArqIntegration.identifier, "handled": False},
  94. )
  95. sentry_sdk.capture_event(event, hint=hint)
  96. def _make_event_processor(
  97. ctx: "Dict[Any, Any]", *args: "Any", **kwargs: "Any"
  98. ) -> "EventProcessor":
  99. def event_processor(event: "Event", hint: "Hint") -> "Optional[Event]":
  100. with capture_internal_exceptions():
  101. scope = sentry_sdk.get_current_scope()
  102. if scope.transaction is not None:
  103. scope.transaction.name = ctx["job_name"]
  104. event["transaction"] = ctx["job_name"]
  105. tags = event.setdefault("tags", {})
  106. tags["arq_task_id"] = ctx["job_id"]
  107. tags["arq_task_retry"] = ctx["job_try"] > 1
  108. extra = event.setdefault("extra", {})
  109. extra["arq-job"] = {
  110. "task": ctx["job_name"],
  111. "args": (
  112. args if should_send_default_pii() else SENSITIVE_DATA_SUBSTITUTE
  113. ),
  114. "kwargs": (
  115. kwargs if should_send_default_pii() else SENSITIVE_DATA_SUBSTITUTE
  116. ),
  117. "retry": ctx["job_try"],
  118. }
  119. return event
  120. return event_processor
  121. def _wrap_coroutine(name: str, coroutine: "WorkerCoroutine") -> "WorkerCoroutine":
  122. async def _sentry_coroutine(
  123. ctx: "Dict[Any, Any]", *args: "Any", **kwargs: "Any"
  124. ) -> "Any":
  125. integration = sentry_sdk.get_client().get_integration(ArqIntegration)
  126. if integration is None:
  127. return await coroutine(ctx, *args, **kwargs)
  128. sentry_sdk.get_isolation_scope().add_event_processor(
  129. _make_event_processor({**ctx, "job_name": name}, *args, **kwargs)
  130. )
  131. try:
  132. result = await coroutine(ctx, *args, **kwargs)
  133. except Exception:
  134. exc_info = sys.exc_info()
  135. _capture_exception(exc_info)
  136. reraise(*exc_info)
  137. return result
  138. return _sentry_coroutine
  139. def patch_create_worker() -> None:
  140. old_create_worker = arq.worker.create_worker
  141. @ensure_integration_enabled(ArqIntegration, old_create_worker)
  142. def _sentry_create_worker(*args: "Any", **kwargs: "Any") -> "Worker":
  143. settings_cls = args[0] if args else kwargs.get("settings_cls")
  144. if isinstance(settings_cls, dict):
  145. if "functions" in settings_cls:
  146. settings_cls["functions"] = [
  147. _get_arq_function(func)
  148. for func in settings_cls.get("functions", [])
  149. ]
  150. if "cron_jobs" in settings_cls:
  151. settings_cls["cron_jobs"] = [
  152. _get_arq_cron_job(cron_job)
  153. for cron_job in settings_cls.get("cron_jobs", [])
  154. ]
  155. if hasattr(settings_cls, "functions"):
  156. settings_cls.functions = [ # type: ignore[union-attr]
  157. _get_arq_function(func)
  158. for func in settings_cls.functions # type: ignore[union-attr]
  159. ]
  160. if hasattr(settings_cls, "cron_jobs"):
  161. settings_cls.cron_jobs = [ # type: ignore[union-attr]
  162. _get_arq_cron_job(cron_job)
  163. for cron_job in (settings_cls.cron_jobs or []) # type: ignore[union-attr]
  164. ]
  165. if "functions" in kwargs:
  166. kwargs["functions"] = [
  167. _get_arq_function(func) for func in kwargs.get("functions", [])
  168. ]
  169. if "cron_jobs" in kwargs:
  170. kwargs["cron_jobs"] = [
  171. _get_arq_cron_job(cron_job) for cron_job in kwargs.get("cron_jobs", [])
  172. ]
  173. return old_create_worker(*args, **kwargs)
  174. arq.worker.create_worker = _sentry_create_worker
  175. def _get_arq_function(func: "Union[str, Function, WorkerCoroutine]") -> "Function":
  176. arq_func = arq.worker.func(func)
  177. arq_func.coroutine = _wrap_coroutine(arq_func.name, arq_func.coroutine)
  178. return arq_func
  179. def _get_arq_cron_job(cron_job: "CronJob") -> "CronJob":
  180. cron_job.coroutine = _wrap_coroutine(cron_job.name, cron_job.coroutine)
  181. return cron_job