mirror of
https://github.com/vale981/ray
synced 2025-03-05 18:11:42 -05:00

This limits the maximum number of HTTP requests the dashboard (API server) will accept; once the limit is reached, further requests are rejected. This ensures that observability requests do not overload the downstream systems (raylet/GCS) when too many concurrent state observability requests are delegated to the cluster.
53 lines
2.3 KiB
Python
53 lines
2.3 KiB
Python
from ray._private.ray_constants import env_integer
|
|
|
|
# Log file names for the dashboard and the dashboard agent.
DASHBOARD_LOG_FILENAME = "dashboard.log"
DASHBOARD_AGENT_LOG_FILENAME = "dashboard_agent.log"

# Prefix string associated with the dashboard agent port.
# NOTE(review): presumably marks the output line on which the agent reports
# its port -- confirm against the code that reads it.
DASHBOARD_AGENT_PORT_PREFIX = "DASHBOARD_AGENT_PORT_PREFIX:"

# Per the name, the period (in seconds) of the agent's parent check.
DASHBOARD_AGENT_CHECK_PARENT_INTERVAL_SECONDS = 2

# Name of the environment variable that overrides the default below.
RAY_STATE_SERVER_MAX_HTTP_REQUEST_ENV_NAME = "RAY_STATE_SERVER_MAX_HTTP_REQUEST"
# Default number of in-progress requests to the state api server.
# NOTE(review): env_integer is defined in ray._private.ray_constants;
# presumably it returns the integer value of the named environment variable,
# or the given default (100) when the variable is unset -- confirm there.
RAY_STATE_SERVER_MAX_HTTP_REQUEST = env_integer(
    RAY_STATE_SERVER_MAX_HTTP_REQUEST_ENV_NAME, 100
)
# Upper bound on the number of in-progress requests that may be configured.
RAY_STATE_SERVER_MAX_HTTP_REQUEST_ALLOWED = 1000

# Redis connection retry settings.
RETRY_REDIS_CONNECTION_TIMES = 10
# NOTE(review): the name says INTERNAL; presumably INTERVAL was intended.
# The name is kept unchanged because other modules may reference it.
CONNECT_REDIS_INTERNAL_SECONDS = 2

# Data maintenance periods, in seconds.
PURGE_DATA_INTERVAL_SECONDS = 60 * 10  # 10 minutes
ORGANIZE_DATA_INTERVAL_SECONDS = 2

# String identifiers for the dashboard RPC address and the GCS server address.
# NOTE(review): presumably used as lookup keys -- confirm against callers.
DASHBOARD_RPC_ADDRESS = "dashboard_rpc"
GCS_SERVER_ADDRESS = "GcsServerAddress"

# GCS check alive
# Each setting is read through env_integer under the environment variable of
# the same name, with the second argument as the default.
# NOTE(review): env_integer is defined in ray._private.ray_constants; the
# override-from-environment behavior is assumed from its name -- confirm there.
GCS_CHECK_ALIVE_MAX_COUNT_OF_RPC_ERROR = env_integer(
    "GCS_CHECK_ALIVE_MAX_COUNT_OF_RPC_ERROR", 10
)
GCS_CHECK_ALIVE_INTERVAL_SECONDS = env_integer("GCS_CHECK_ALIVE_INTERVAL_SECONDS", 5)
# NOTE(review): unit is presumably seconds, like the sibling settings -- confirm.
GCS_CHECK_ALIVE_RPC_TIMEOUT = env_integer("GCS_CHECK_ALIVE_RPC_TIMEOUT", 10)
GCS_RETRY_CONNECT_INTERVAL_SECONDS = env_integer(
    "GCS_RETRY_CONNECT_INTERVAL_SECONDS", 2
)

# aiohttp_cache
# Time-to-live (seconds) and maximum size of the cache.
AIOHTTP_CACHE_TTL_SECONDS = 2
AIOHTTP_CACHE_MAX_SIZE = 128
# Name of the environment variable associated with disabling the cache.
# NOTE(review): which values count as "disabled" is decided by the reader of
# this variable, not here -- confirm against the caller.
AIOHTTP_CACHE_DISABLE_ENVIRONMENT_KEY = "RAY_DASHBOARD_NO_CACHE"

# Named signals
# String names of the signals; each value is the lowercase form of the
# constant's suffix.
SIGNAL_NODE_INFO_FETCHED = "node_info_fetched"
SIGNAL_NODE_SUMMARY_FETCHED = "node_summary_fetched"
SIGNAL_JOB_INFO_FETCHED = "job_info_fetched"
SIGNAL_WORKER_INFO_FETCHED = "worker_info_fetched"

# Default value for datacenter (the default value in protobuf)
# NOTE(review): the comment above mentions "datacenter", but the constants
# below are a default language and a default job id -- confirm the intended
# wording against the protobuf definitions.
DEFAULT_LANGUAGE = "PYTHON"
DEFAULT_JOB_ID = "ffff"

# Cache TTL for a bad runtime env. After this time, the cache entry is deleted
# and creation of the runtime env is retried if needed.
# The default passed to env_integer is 60 * 10 seconds (10 minutes).
# NOTE(review): env_integer is defined in ray._private.ray_constants; the
# override via the same-named environment variable is assumed -- confirm there.
BAD_RUNTIME_ENV_CACHE_TTL_SECONDS = env_integer(
    "BAD_RUNTIME_ENV_CACHE_TTL_SECONDS", 60 * 10
)

# Hook that is invoked on the dashboard `/api/component_activities` endpoint.
# The environment variable named here should reference a callable that does
# not take any arguments and returns a dictionary mapping
# activity component type (str) to
# ray.dashboard.modules.snapshot.snapshot_head.RayActivityResponse.
# Example: "your.module.ray_cluster_activity_hook".
RAY_CLUSTER_ACTIVITY_HOOK = "RAY_CLUSTER_ACTIVITY_HOOK"