jamtur01's picture
Upload folder using huggingface_hub
9c6594c verified
from __future__ import annotations
__all__ = ("Sentry",)
import atexit
import functools
import os
import pathlib
import sys
from types import TracebackType
from typing import TYPE_CHECKING, Any, Callable, Literal
from urllib.parse import quote
import sentry_sdk # type: ignore
import sentry_sdk.scope # type: ignore
import sentry_sdk.utils # type: ignore
import wandb
import wandb.env
import wandb.util
if TYPE_CHECKING:
import wandb.sdk.internal.settings_static
SENTRY_DEFAULT_DSN = (
"https://2592b1968ea94cca9b5ef5e348e094a7@o151352.ingest.sentry.io/4504800232407040"
)
SessionStatus = Literal["ok", "exited", "crashed", "abnormal"]
def _safe_noop(func: Callable) -> Callable:
"""Decorator to ensure that Sentry methods do nothing if disabled and don't raise."""
@functools.wraps(func)
def wrapper(self: type[Sentry], *args: Any, **kwargs: Any) -> Any:
if self._disabled:
return None
try:
return func(self, *args, **kwargs)
except Exception as e:
# do not call self.exception here to avoid infinite recursion
if func.__name__ != "exception":
self.exception(f"Error in {func.__name__}: {e}")
return None
return wrapper
class Sentry:
_disabled: bool
def __init__(self) -> None:
self._disabled = not wandb.env.error_reporting_enabled()
self._sent_messages: set = set()
self.dsn = os.environ.get(wandb.env.SENTRY_DSN, SENTRY_DEFAULT_DSN)
self.scope: sentry_sdk.scope.Scope | None = None
# ensure we always end the Sentry session
atexit.register(self.end_session)
@property
def environment(self) -> str:
"""Return the environment we're running in."""
# check if we're in a git repo
is_git = pathlib.Path(__file__).parent.parent.parent.joinpath(".git").exists()
# these match the environments for gorilla
return "development" if is_git else "production"
@_safe_noop
def setup(self) -> None:
"""Setup Sentry SDK.
We use lower-level APIs (i.e., not sentry_sdk.init) here
to avoid the possibility of interfering with the user's
own Sentry SDK setup.
"""
client = sentry_sdk.Client(
dsn=self.dsn,
default_integrations=False,
environment=self.environment,
release=wandb.__version__,
)
self.scope = sentry_sdk.get_global_scope().fork()
self.scope.clear()
self.scope.set_client(client)
@_safe_noop
def message(self, message: str, repeat: bool = True) -> str | None:
"""Send a message to Sentry."""
if not repeat and message in self._sent_messages:
return None
self._sent_messages.add(message)
with sentry_sdk.scope.use_isolation_scope(self.scope): # type: ignore
return sentry_sdk.capture_message(message) # type: ignore
@_safe_noop
def exception(
self,
exc: str
| BaseException
| tuple[
type[BaseException] | None,
BaseException | None,
TracebackType | None,
]
| None,
handled: bool = False,
status: SessionStatus | None = None,
) -> str | None:
"""Log an exception to Sentry."""
if isinstance(exc, str):
exc_info = sentry_sdk.utils.exc_info_from_error(Exception(exc))
elif isinstance(exc, BaseException):
exc_info = sentry_sdk.utils.exc_info_from_error(exc)
else:
exc_info = sys.exc_info()
event, _ = sentry_sdk.utils.event_from_exception(
exc_info,
client_options=self.scope.get_client().options, # type: ignore
mechanism={"type": "generic", "handled": handled},
)
event_id = None
try:
with sentry_sdk.scope.use_isolation_scope(self.scope): # type: ignore
event_id = sentry_sdk.capture_event(event) # type: ignore
except Exception:
pass
# if the status is not explicitly set, we'll set it to "crashed" if the exception
# was unhandled, or "errored" if it was handled
status = status or ("crashed" if not handled else "errored") # type: ignore
self.mark_session(status=status)
client = self.scope.get_client() # type: ignore
if client is not None:
client.flush()
return event_id
def reraise(self, exc: Any) -> None:
"""Re-raise an exception after logging it to Sentry.
Use this for top-level exceptions when you want the user to see the traceback.
Must be called from within an exception handler.
"""
self.exception(exc)
# this will messily add this "reraise" function to the stack trace,
# but hopefully it's not too bad
raise exc.with_traceback(sys.exc_info()[2])
@_safe_noop
def start_session(self) -> None:
"""Start a new session."""
assert self.scope is not None
# get the current client and scope
session = self.scope._session
# if there's no session, start one
if session is None:
self.scope.start_session()
@_safe_noop
def end_session(self) -> None:
"""End the current session."""
assert self.scope is not None
# get the current client and scope
client = self.scope.get_client()
session = self.scope._session
if session is not None and client is not None:
self.scope.end_session()
client.flush()
@_safe_noop
def mark_session(self, status: SessionStatus | None = None) -> None:
"""Mark the current session with a status."""
assert self.scope is not None
session = self.scope._session
if session is not None:
session.update(status=status)
@_safe_noop
def configure_scope(
self,
tags: dict[str, Any] | None = None,
process_context: str | None = None,
) -> None:
"""Configure the Sentry scope for the current thread.
This function should be called at the beginning of every thread that
will send events to Sentry. It sets the tags that will be applied to
all events sent from this thread. It also tries to start a session
if one doesn't already exist for this thread.
"""
assert self.scope is not None
settings_tags = (
"entity",
"project",
"run_id",
"run_url",
"sweep_url",
"sweep_id",
"deployment",
"x_require_legacy_service",
"launch",
"_platform",
)
# set context
if process_context:
self.scope.set_tag("process_context", process_context)
# apply settings tags
if tags is None:
return None
for tag in settings_tags:
val = tags.get(tag, None)
if val not in (None, ""):
self.scope.set_tag(tag, val)
if tags.get("_colab", None):
python_runtime = "colab"
elif tags.get("_jupyter", None):
python_runtime = "jupyter"
elif tags.get("_ipython", None):
python_runtime = "ipython"
else:
python_runtime = "python"
self.scope.set_tag("python_runtime", python_runtime)
# Construct run_url and sweep_url given run_id and sweep_id
for obj in ("run", "sweep"):
obj_id, obj_url = f"{obj}_id", f"{obj}_url"
if tags.get(obj_url, None):
continue
try:
app_url = wandb.util.app_url(tags["base_url"]) # type: ignore
entity, project = (quote(tags[k]) for k in ("entity", "project")) # type: ignore
self.scope.set_tag(
obj_url,
f"{app_url}/{entity}/{project}/{obj}s/{tags[obj_id]}",
)
except Exception:
pass
email = tags.get("email")
if email:
self.scope.user = {"email": email}
# todo: add back the option to pass general tags see: c645f625d1c1a3db4a6b0e2aa8e924fee101904c (wandb/util.py)
self.start_session()