jamtur01's picture
Upload folder using huggingface_hub
9c6594c verified
"""All of W&B's environment variables.
Getters and putters for all of them should go here. That way it'll be easier to
avoid typos with names and be consistent about environment variables' semantics.
Environment variables are not the authoritative source for these values in many
cases.
"""
from __future__ import annotations
import json
import os
import sys
from pathlib import Path
from typing import MutableMapping
import platformdirs
# Names of the W&B environment variables, one module-level constant per
# variable. The accessor functions in this module look variables up through
# these constants rather than through string literals.
CONFIG_PATHS = "WANDB_CONFIG_PATHS"
SWEEP_PARAM_PATH = "WANDB_SWEEP_PARAM_PATH"
SHOW_RUN = "WANDB_SHOW_RUN"
DEBUG = "WANDB_DEBUG"
SILENT = "WANDB_SILENT"
QUIET = "WANDB_QUIET"
INITED = "WANDB_INITED"
DIR = "WANDB_DIR"
# Deprecate DESCRIPTION in a future release
DESCRIPTION = "WANDB_DESCRIPTION"
NAME = "WANDB_NAME"
NOTEBOOK_NAME = "WANDB_NOTEBOOK_NAME"
NOTES = "WANDB_NOTES"
USERNAME = "WANDB_USERNAME"
USER_EMAIL = "WANDB_USER_EMAIL"
PROJECT = "WANDB_PROJECT"
ENTITY = "WANDB_ENTITY"
ORGANIZATION = "WANDB_ORGANIZATION"
BASE_URL = "WANDB_BASE_URL"
APP_URL = "WANDB_APP_URL"
PROGRAM = "WANDB_PROGRAM"
ARGS = "WANDB_ARGS"
MODE = "WANDB_MODE"
START_METHOD = "WANDB_START_METHOD"
RESUME = "WANDB_RESUME"
RUN_ID = "WANDB_RUN_ID"
RUN_STORAGE_ID = "WANDB_RUN_STORAGE_ID"
RUN_GROUP = "WANDB_RUN_GROUP"
RUN_DIR = "WANDB_RUN_DIR"
SWEEP_ID = "WANDB_SWEEP_ID"
HTTP_TIMEOUT = "WANDB_HTTP_TIMEOUT"
FILE_PUSHER_TIMEOUT = "WANDB_FILE_PUSHER_TIMEOUT"
API_KEY = "WANDB_API_KEY"
IDENTITY_TOKEN_FILE = "WANDB_IDENTITY_TOKEN_FILE"
CREDENTIALS_FILE = "WANDB_CREDENTIALS_FILE"
JOB_TYPE = "WANDB_JOB_TYPE"
DISABLE_CODE = "WANDB_DISABLE_CODE"
DISABLE_GIT = "WANDB_DISABLE_GIT"
GIT_ROOT = "WANDB_GIT_ROOT"
SAVE_CODE = "WANDB_SAVE_CODE"
TAGS = "WANDB_TAGS"
# Note: the constant is IGNORE but the variable name is WANDB_IGNORE_GLOBS.
IGNORE = "WANDB_IGNORE_GLOBS"
ERROR_REPORTING = "WANDB_ERROR_REPORTING"
CORE_DEBUG = "WANDB_CORE_DEBUG"
DOCKER = "WANDB_DOCKER"
AGENT_REPORT_INTERVAL = "WANDB_AGENT_REPORT_INTERVAL"
AGENT_KILL_DELAY = "WANDB_AGENT_KILL_DELAY"
AGENT_DISABLE_FLAPPING = "WANDB_AGENT_DISABLE_FLAPPING"
AGENT_MAX_INITIAL_FAILURES = "WANDB_AGENT_MAX_INITIAL_FAILURES"
CRASH_NOSYNC_TIME = "WANDB_CRASH_NOSYNC_TIME"
MAGIC = "WANDB_MAGIC"
HOST = "WANDB_HOST"
ANONYMOUS = "WANDB_ANONYMOUS"
JUPYTER = "WANDB_JUPYTER"
CONFIG_DIR = "WANDB_CONFIG_DIR"
DATA_DIR = "WANDB_DATA_DIR"
ARTIFACT_DIR = "WANDB_ARTIFACT_DIR"
ARTIFACT_FETCH_FILE_URL_BATCH_SIZE = "WANDB_ARTIFACT_FETCH_FILE_URL_BATCH_SIZE"
CACHE_DIR = "WANDB_CACHE_DIR"
# Note: the constant is DISABLE_SSL but the variable name carries an
# INSECURE_ prefix (WANDB_INSECURE_DISABLE_SSL).
DISABLE_SSL = "WANDB_INSECURE_DISABLE_SSL"
SERVICE = "WANDB_SERVICE"
SENTRY_DSN = "WANDB_SENTRY_DSN"
INIT_TIMEOUT = "WANDB_INIT_TIMEOUT"
GIT_COMMIT = "WANDB_GIT_COMMIT"
GIT_REMOTE_URL = "WANDB_GIT_REMOTE_URL"
# Underscore-prefixed constants below map to WANDB_X_-prefixed variables.
_EXECUTABLE = "WANDB_X_EXECUTABLE"
LAUNCH_QUEUE_NAME = "WANDB_LAUNCH_QUEUE_NAME"
LAUNCH_QUEUE_ENTITY = "WANDB_LAUNCH_QUEUE_ENTITY"
LAUNCH_TRACE_ID = "WANDB_LAUNCH_TRACE_ID"
_REQUIRE_LEGACY_SERVICE = "WANDB_X_REQUIRE_LEGACY_SERVICE"
ENABLE_DCGM_PROFILING = "WANDB_ENABLE_DCGM_PROFILING"
# For testing, to be removed in future version
USE_V1_ARTIFACTS = "_WANDB_USE_V1_ARTIFACTS"
def immutable_keys() -> list[str]:
    """Return the env keys that shouldn't change within a single process.

    We use this to maintain certain values between multiple calls to
    wandb.init within a single process.

    Returns:
        A new list of environment variable names; each name appears once.
    """
    # DIR used to be listed twice; the redundant second entry was dropped.
    return [
        DIR,
        ENTITY,
        PROJECT,
        API_KEY,
        IGNORE,
        DISABLE_CODE,
        DISABLE_GIT,
        DOCKER,
        MODE,
        BASE_URL,
        ERROR_REPORTING,
        CRASH_NOSYNC_TIME,
        MAGIC,
        USERNAME,
        USER_EMAIL,
        SILENT,
        CONFIG_PATHS,
        ANONYMOUS,
        RUN_GROUP,
        JOB_TYPE,
        TAGS,
        RESUME,
        AGENT_REPORT_INTERVAL,
        HTTP_TIMEOUT,
        HOST,
        DATA_DIR,
        ARTIFACT_DIR,
        ARTIFACT_FETCH_FILE_URL_BATCH_SIZE,
        CACHE_DIR,
        USE_V1_ARTIFACTS,
        DISABLE_SSL,
        IDENTITY_TOKEN_FILE,
        CREDENTIALS_FILE,
    ]
def _env_as_bool(
    var: str, default: str | None = None, env: MutableMapping | None = None
) -> bool:
    """Interpret the environment variable ``var`` as a boolean.

    Args:
        var: Name of the variable to look up.
        default: Value used when ``var`` is not present in the mapping.
        env: Mapping to read from; ``os.environ`` when None.

    Returns:
        The result of ``strtobool`` on the looked-up value. False when the
        value is not a string or is a string ``strtobool`` rejects.
    """
    source = os.environ if env is None else env
    raw = source.get(var, default)
    if isinstance(raw, str):
        try:
            return strtobool(raw)
        except ValueError:
            # Unrecognised spellings are treated as "not set to true".
            pass
    return False
def is_require_legacy_service(env: MutableMapping | None = None) -> bool:
    """Report whether the legacy service was requested.

    This is the flag set when wandb.require("legacy-service") was used.
    Reads ``_REQUIRE_LEGACY_SERVICE`` from ``env`` (``os.environ`` when
    None) and treats an unset variable as "False".
    """
    legacy_requested = _env_as_bool(
        _REQUIRE_LEGACY_SERVICE,
        default="False",
        env=env,
    )
    return legacy_requested
def is_debug(default: str | None = None, env: MutableMapping | None = None) -> bool:
    """Return the boolean reading of the ``DEBUG`` variable.

    ``default`` is the string used when the variable is unset; ``env`` is
    the mapping to read from (``os.environ`` when None).
    """
    debug_enabled = _env_as_bool(DEBUG, default=default, env=env)
    return debug_enabled
def is_offline(env: MutableMapping | None = None) -> bool:
    """Return True when the ``MODE`` variable is exactly ``"offline"``.

    The comparison is case-sensitive; an unset variable yields False.
    """
    source = os.environ if env is None else env
    mode = source.get(MODE)
    return mode == "offline"
def error_reporting_enabled() -> bool:
    """Return the boolean reading of ``ERROR_REPORTING`` from ``os.environ``.

    An unset variable is treated as "True".
    """
    reporting_on = _env_as_bool(ERROR_REPORTING, default="True")
    return reporting_on
def core_debug(default: str | None = None) -> bool:
    """Return True when either ``CORE_DEBUG`` or ``DEBUG`` reads as true.

    ``default`` applies only to the ``CORE_DEBUG`` lookup; the ``DEBUG``
    lookup is consulted only if ``CORE_DEBUG`` is not true.
    """
    if _env_as_bool(CORE_DEBUG, default=default):
        return True
    return is_debug()
def ssl_disabled() -> bool:
    """Return the boolean reading of ``DISABLE_SSL`` from ``os.environ``.

    An unset variable is treated as "False".
    """
    insecure = _env_as_bool(DISABLE_SSL, default="False")
    return insecure
def dcgm_profiling_enabled() -> bool:
    """Report whether DCGM-based profiling of Nvidia GPUs was requested.

    Note: Turning this on can increase resource usage compared to standard
    monitoring, and it requires the `nvidia-dcgm` service to be running on
    the machine.

    Returns:
        The boolean reading of ``ENABLE_DCGM_PROFILING`` from ``os.environ``,
        with an unset variable treated as "False".
    """
    profiling_requested = _env_as_bool(ENABLE_DCGM_PROFILING, default="False")
    return profiling_requested
def get_error_reporting(
    default: bool | str = True,
    env: MutableMapping | None = None,
) -> bool | str:
    """Return the raw ``ERROR_REPORTING`` value, or ``default`` when unset.

    The value is returned as stored in the mapping, without conversion to a
    boolean.
    """
    source = os.environ if env is None else env
    return source.get(ERROR_REPORTING, default)
def get_run(
    default: str | None = None, env: MutableMapping | None = None
) -> str | None:
    """Return the ``RUN_ID`` variable, or ``default`` when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(RUN_ID, default)
def get_args(
    default: list[str] | None = None, env: MutableMapping | None = None
) -> list[str] | None:
    """Return the program arguments recorded in the ``ARGS`` variable.

    Args:
        default: Used when ``ARGS`` is unset or empty; if this is also
            falsy, ``sys.argv[1:]`` is returned instead.
        env: Mapping to read from; ``os.environ`` when None.

    Returns:
        The JSON-decoded value of ``ARGS`` when it is set and non-empty,
        None when that value is not valid JSON, otherwise the fallback
        described above.
    """
    source = os.environ if env is None else env
    encoded = source.get(ARGS)
    if not encoded:
        return default or sys.argv[1:]
    try:
        return json.loads(encoded)  # type: ignore
    except ValueError:
        # Malformed JSON is reported as "no args" rather than raised.
        return None
def get_docker(
    default: str | None = None, env: MutableMapping | None = None
) -> str | None:
    """Return the ``DOCKER`` variable, or ``default`` when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(DOCKER, default)
def get_http_timeout(default: int = 20, env: MutableMapping | None = None) -> int:
    """Return ``HTTP_TIMEOUT`` converted to ``int``.

    Args:
        default: Value used when the variable is unset.
        env: Mapping to read from; ``os.environ`` when None.

    Raises:
        ValueError: If the stored value cannot be parsed by ``int``.
    """
    source = os.environ if env is None else env
    raw_timeout = source.get(HTTP_TIMEOUT, default)
    return int(raw_timeout)
def get_file_pusher_timeout(
    default: int | None = None,
    env: MutableMapping | None = None,
) -> int | None:
    """Return ``FILE_PUSHER_TIMEOUT`` converted to ``int``, or None.

    None is returned whenever the looked-up value (or ``default``) is falsy,
    e.g. unset, an empty string, or a ``default`` of 0.

    Raises:
        ValueError: If a non-empty stored value cannot be parsed by ``int``.
    """
    source = os.environ if env is None else env
    raw_timeout = source.get(FILE_PUSHER_TIMEOUT, default)
    if not raw_timeout:
        return None
    return int(raw_timeout)
def get_ignore(
    default: list[str] | None = None, env: MutableMapping | None = None
) -> list[str] | None:
    """Return the ``IGNORE`` variable split on commas.

    When the variable is unset, ``default`` is returned unchanged. An empty
    string value yields ``[""]`` because it is split like any other value.
    """
    source = os.environ if env is None else env
    globs = source.get(IGNORE)
    return default if globs is None else globs.split(",")
def get_project(
    default: str | None = None, env: MutableMapping | None = None
) -> str | None:
    """Return the ``PROJECT`` variable, or ``default`` when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(PROJECT, default)
def get_username(
    default: str | None = None, env: MutableMapping | None = None
) -> str | None:
    """Return the ``USERNAME`` variable, or ``default`` when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(USERNAME, default)
def get_user_email(
    default: str | None = None, env: MutableMapping | None = None
) -> str | None:
    """Return the ``USER_EMAIL`` variable, or ``default`` when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(USER_EMAIL, default)
def get_entity(
    default: str | None = None, env: MutableMapping | None = None
) -> str | None:
    """Return the ``ENTITY`` variable, or ``default`` when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(ENTITY, default)
def get_organization(
    default: str | None = None, env: MutableMapping | None = None
) -> str | None:
    """Return the ``ORGANIZATION`` variable, or ``default`` when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(ORGANIZATION, default)
def get_base_url(
    default: str | None = None, env: MutableMapping | None = None
) -> str | None:
    """Return the ``BASE_URL`` variable, or ``default`` when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(BASE_URL, default)
def get_app_url(
    default: str | None = None, env: MutableMapping | None = None
) -> str | None:
    """Return the ``APP_URL`` variable, or ``default`` when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(APP_URL, default)
def get_show_run(default: str | None = None, env: MutableMapping | None = None) -> bool:
    """Return the truthiness of the ``SHOW_RUN`` variable.

    The value is not parsed: any non-empty string (including "false" or "0")
    yields True, and an unset variable with a falsy ``default`` yields False.
    """
    source = os.environ if env is None else env
    flag = source.get(SHOW_RUN, default)
    return True if flag else False
def get_description(
    default: str | None = None, env: MutableMapping | None = None
) -> str | None:
    """Return the ``DESCRIPTION`` variable, or ``default`` when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(DESCRIPTION, default)
def get_tags(default: str = "", env: MutableMapping | None = None) -> list[str]:
    """Return the comma-separated ``TAGS`` variable as a list.

    Empty segments (from leading, trailing, or doubled commas) are dropped.
    ``default`` is the comma-separated string used when the variable is
    unset.
    """
    source = os.environ if env is None else env
    raw_tags = source.get(TAGS, default)
    return list(filter(None, raw_tags.split(",")))
def get_dir(
    default: str | None = None, env: MutableMapping | None = None
) -> str | None:
    """Return the ``DIR`` variable, or ``default`` when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(DIR, default)
def get_config_paths(
    default: str | None = None, env: MutableMapping | None = None
) -> str | None:
    """Return the ``CONFIG_PATHS`` variable, or ``default`` when it is unset.

    The value is returned as a single string; it is not split here.
    """
    source = os.environ if env is None else env
    return source.get(CONFIG_PATHS, default)
def get_agent_report_interval(
    default: str | None = None, env: MutableMapping | None = None
) -> int | None:
    """Return ``AGENT_REPORT_INTERVAL`` converted to ``int``.

    Args:
        default: Value used when the variable is unset.
        env: Mapping to read from; ``os.environ`` when None.

    Returns:
        The integer value, or None when the variable is unset with no
        default or when the value cannot be parsed as an integer.
    """
    if env is None:
        env = os.environ
    val = env.get(AGENT_REPORT_INTERVAL, default)
    try:
        return int(val)  # type: ignore
    except (TypeError, ValueError):
        # ValueError: malformed string. TypeError: int(None) when the
        # variable is unset and no default was given. Both are silently
        # ignored; the caller should handle None.
        return None
def get_agent_kill_delay(
    default: str | None = None, env: MutableMapping | None = None
) -> int | None:
    """Return ``AGENT_KILL_DELAY`` converted to ``int``.

    Args:
        default: Value used when the variable is unset.
        env: Mapping to read from; ``os.environ`` when None.

    Returns:
        The integer value, or None when the variable is unset with no
        default or when the value cannot be parsed as an integer.
    """
    if env is None:
        env = os.environ
    val = env.get(AGENT_KILL_DELAY, default)
    try:
        return int(val)  # type: ignore
    except (TypeError, ValueError):
        # ValueError: malformed string. TypeError: int(None) when the
        # variable is unset and no default was given. Both are silently
        # ignored; the caller should handle None.
        return None
def get_crash_nosync_time(
    default: str | None = None, env: MutableMapping | None = None
) -> int | None:
    """Return ``CRASH_NOSYNC_TIME`` converted to ``int``.

    Args:
        default: Value used when the variable is unset.
        env: Mapping to read from; ``os.environ`` when None.

    Returns:
        The integer value, or None when the variable is unset with no
        default or when the value cannot be parsed as an integer.
    """
    if env is None:
        env = os.environ
    val = env.get(CRASH_NOSYNC_TIME, default)
    try:
        return int(val)  # type: ignore
    except (TypeError, ValueError):
        # ValueError: malformed string. TypeError: int(None) when the
        # variable is unset and no default was given. Both are silently
        # ignored; the caller should handle None.
        return None
def get_magic(
    default: str | None = None, env: MutableMapping | None = None
) -> str | None:
    """Return the ``MAGIC`` variable, or ``default`` when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(MAGIC, default)
def get_data_dir(env: MutableMapping | None = None) -> str:
    """Return the ``DATA_DIR`` variable, or the platform default.

    The fallback is ``platformdirs.user_data_dir("wandb")``; it is computed
    on every call, whether or not the variable is set.
    """
    source = os.environ if env is None else env
    return source.get(DATA_DIR, platformdirs.user_data_dir("wandb"))
def get_artifact_dir(env: MutableMapping | None = None) -> str:
    """Return the absolute path of the artifact directory.

    Uses the ``ARTIFACT_DIR`` variable when set, otherwise ``./artifacts``.
    Relative paths are resolved with ``os.path.abspath``.
    """
    source = os.environ if env is None else env
    configured = source.get(ARTIFACT_DIR, os.path.join(".", "artifacts"))
    return os.path.abspath(str(configured))
def get_artifact_fetch_file_url_batch_size(env: MutableMapping | None = None) -> int:
    """Return ``ARTIFACT_FETCH_FILE_URL_BATCH_SIZE`` converted to ``int``.

    Defaults to 5000 when the variable is unset.

    Raises:
        ValueError: If the stored value cannot be parsed by ``int``.
    """
    source = os.environ if env is None else env
    raw_size = source.get(ARTIFACT_FETCH_FILE_URL_BATCH_SIZE, 5000)
    return int(raw_size)
def get_cache_dir(env: MutableMapping | None = None) -> Path:
    """Return the cache directory as a ``Path``.

    Uses the ``CACHE_DIR`` variable when set, otherwise
    ``platformdirs.user_cache_dir("wandb")``.

    Args:
        env: Mapping to read from; ``os.environ`` when None. An explicitly
            passed empty mapping is honoured rather than replaced by
            ``os.environ``, matching the other accessors in this module.
    """
    # `env or os.environ` would discard an empty mapping the caller passed.
    if env is None:
        env = os.environ
    return Path(env.get(CACHE_DIR, platformdirs.user_cache_dir("wandb")))
def get_use_v1_artifacts(env: MutableMapping | None = None) -> bool:
    """Return the truthiness of the ``USE_V1_ARTIFACTS`` variable.

    The value is not parsed: any non-empty string yields True, and an unset
    variable yields False.
    """
    source = os.environ if env is None else env
    return bool(source.get(USE_V1_ARTIFACTS, False))
def get_agent_max_initial_failures(
    default: int | None = None, env: MutableMapping | None = None
) -> int | None:
    """Return ``AGENT_MAX_INITIAL_FAILURES`` converted to ``int``.

    Args:
        default: Value used when the variable is unset or unparseable.
        env: Mapping to read from; ``os.environ`` when None.

    Returns:
        The integer value, or ``default`` when the stored value cannot be
        converted (including the unset-with-no-default case).
    """
    if env is None:
        env = os.environ
    val = env.get(AGENT_MAX_INITIAL_FAILURES, default)
    try:
        return int(val)  # type: ignore
    except (TypeError, ValueError):
        # TypeError covers int(None) when the variable is unset and
        # default is None; ValueError covers malformed strings.
        return default
def set_entity(value: str, env: MutableMapping | None = None) -> None:
    """Store ``value`` under the ``ENTITY`` variable.

    Writes to ``env``, or to ``os.environ`` when ``env`` is None.
    """
    target = os.environ if env is None else env
    target[ENTITY] = value
def set_project(value: str, env: MutableMapping | None = None) -> None:
    """Store ``value`` under the ``PROJECT`` variable.

    A falsy ``value`` (e.g. an empty string) is replaced by
    "uncategorized". Writes to ``env``, or to ``os.environ`` when ``env`` is
    None.
    """
    target = os.environ if env is None else env
    target[PROJECT] = value if value else "uncategorized"
def should_save_code() -> bool:
    """Return True when code saving is requested and not disabled.

    ``SAVE_CODE`` must read as true and ``DISABLE_CODE`` must not; both
    default to "False" when unset and are read from ``os.environ``.
    """
    if _env_as_bool(DISABLE_CODE, default="False"):
        # An explicit disable always wins over SAVE_CODE.
        return False
    return _env_as_bool(SAVE_CODE, default="False")
def disable_git(env: MutableMapping | None = None) -> bool:
    """Return whether git integration is disabled via ``DISABLE_GIT``.

    Args:
        env: Mapping to read from; ``os.environ`` when None.

    Returns:
        False when the variable is unset or equals "false" in any letter
        case; True for any other string. A non-string value stored in a
        custom mapping is returned unchanged.
    """
    if env is None:
        env = os.environ
    # The default must be positional: dict.get() takes no keyword
    # arguments, so `default="False"` raised TypeError for plain dicts.
    val = env.get(DISABLE_GIT, "False")
    if isinstance(val, str):
        return val.lower() != "false"
    return val
def get_launch_queue_name(env: MutableMapping | None = None) -> str | None:
    """Return the ``LAUNCH_QUEUE_NAME`` variable, or None when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(LAUNCH_QUEUE_NAME, None)
def get_launch_queue_entity(env: MutableMapping | None = None) -> str | None:
    """Return the ``LAUNCH_QUEUE_ENTITY`` variable, or None when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(LAUNCH_QUEUE_ENTITY, None)
def get_launch_trace_id(env: MutableMapping | None = None) -> str | None:
    """Return the ``LAUNCH_TRACE_ID`` variable, or None when it is unset.

    Reads from ``env``, falling back to ``os.environ`` when ``env`` is None.
    """
    source = os.environ if env is None else env
    return source.get(LAUNCH_TRACE_ID, None)
def get_credentials_file(default: str, env: MutableMapping | None = None) -> Path:
    """Return the path of the credentials file used to save access tokens.

    Args:
        default: Path used when the ``CREDENTIALS_FILE`` variable is unset.
        env: Mapping to read from; ``os.environ`` when None.

    Returns:
        The configured or default location wrapped in a ``Path``.
    """
    source = os.environ if env is None else env
    location = source.get(CREDENTIALS_FILE, default)
    return Path(location)
def strtobool(val: str) -> bool:
    """Convert a string representation of truth to True or False.

    Matching is case-insensitive. "y", "yes", "t", "true", "on" and "1" map
    to True; "n", "no", "f", "false", "off" and "0" map to False.

    Copied from distutils, which was removed in Python 3.12.

    Raises:
        ValueError: If ``val`` is none of the recognised spellings. The
            message quotes the lower-cased input.
    """
    lowered = val.lower()
    if lowered in {"y", "yes", "t", "true", "on", "1"}:
        return True
    if lowered in {"n", "no", "f", "false", "off", "0"}:
        return False
    raise ValueError(f"invalid truth value {lowered!r}")