[serve] Add run, delete, and status to Serve CLI (#22714)

This change adds `run`, `delete`, and `status` commands to the CLI introduced in #22648. * `serve run`: Blocking command that allows users to deploy a YAML configuration or a class/function via import path. When terminated, the deployment(s) is torn down. Prints status info while running. Supports interactive development. * `serve delete`: Shuts down a Serve application and deletes all its running deployments. * `serve status`: Displays the status of a Serve application's deployments.
2025-03-06 10:31:39 -05:00 · 2022-03-03 07:50:36 -08:00 · 2022-03-03 07:50:36 -08:00 · 71a493cf1f
commit 71a493cf1f
parent 76dc4ccbfd
2 changed files with 235 additions and 6 deletions
--- a/python/ray/serve/scripts.py
+++ b/python/ray/serve/scripts.py
@ -2,11 +2,14 @@
 import json
 import yaml
 import os
 import sys
 import pathlib
 import requests
 import click
 import time
 import ray
-from ray.serve.api import Deployment
+from ray.serve.api import Deployment, deploy_group, get_deployment_statuses
 from ray.serve.config import DeploymentMode
 from ray._private.utils import import_attr
 from ray import serve
@ -15,7 +18,11 @@ from ray.serve.constants import (
    DEFAULT_HTTP_HOST,
    DEFAULT_HTTP_PORT,
 )
-from ray.dashboard.modules.serve.schema import ServeApplicationSchema
+from ray.dashboard.modules.serve.schema import (
    ServeApplicationSchema,
    schema_to_serve_application,
    serve_application_status_to_schema,
 )
 from ray.autoscaler._private.cli_logger import cli_logger
@ -52,9 +59,7 @@ def log_failed_request(response: requests.models.Response, address: str):
    default=r"{}",
    required=False,
    type=str,
-    help=(
+    help=("Runtime environment dictionary to pass into ray.init. Defaults to empty."),
        "Runtime environment dictionary to pass into ray.init. " "Defaults to empty."
    ),
 )
 def cli(address, namespace, runtime_env_json):
    ray.init(
@ -176,6 +181,91 @@ def deploy(config_file_name: str, address: str):
        log_failed_request(response, address)
@cli.command(
    help="[Experimental] Run deployments via Serve's Python API.",
    hidden=True,
 )
@click.argument("config_or_import_path")
@click.option(
    "--config_or_import_path",
    default=None,
    required=False,
    type=str,
    help="Either a Serve YAML configuration file path or an import path to "
    "a class or function to deploy. Import paths must be of the form "
    '"module.submodule_1...submodule_n.MyClassOrFunction".',
 )
@click.option(
    "--address",
    "-a",
    default=None,
    required=False,
    type=str,
    help="Address of the running Ray cluster to connect to. " 'Defaults to "auto".',
 )
 def run(config_or_import_path: str, address: str):
    """
    Deploys deployment(s) from CONFIG_OR_IMPORT_PATH, which must be either a
    Serve YAML configuration file path or an import path to
    a class or function to deploy. Import paths must be of the form
    "module.submodule_1...submodule_n.MyClassOrFunction".
    """
    try:
        # Check if path provided is for config or import
        is_config = pathlib.Path(config_or_import_path).is_file()
        if address is not None:
            ray.init(address=address, namespace="serve")
        serve.start()
        if is_config:
            cli_logger.print(
                "Deploying application in config file at " f"{config_or_import_path}."
            )
            with open(config_or_import_path, "r") as config_file:
                config = yaml.safe_load(config_file)
            schematized_config = ServeApplicationSchema.parse_obj(config)
            deployments = schema_to_serve_application(schematized_config)
            deploy_group(deployments)
            cli_logger.newline()
            cli_logger.success(
                f'\nDeployments from config file at "{config_or_import_path}" '
                "deployed successfully!\n"
            )
            cli_logger.newline()
        if not is_config:
            cli_logger.print(
                "Deploying function or class imported from " f"{config_or_import_path}."
            )
            func_or_class = import_attr(config_or_import_path)
            if not isinstance(func_or_class, Deployment):
                func_or_class = serve.deployment(func_or_class)
            func_or_class.deploy()
            cli_logger.newline()
            cli_logger.print(
                f"\nDeployed import at {config_or_import_path} successfully!\n"
            )
            cli_logger.newline()
        while True:
            statuses = serve_application_status_to_schema(
                get_deployment_statuses()
            ).json(indent=4)
            cli_logger.newline()
            cli_logger.print(f"\n{statuses}", no_format=True)
            cli_logger.newline()
            time.sleep(10)
    except KeyboardInterrupt:
        cli_logger.print("Got SIGINT (KeyboardInterrupt). Shutting down Serve.")
        sys.exit()
@cli.command(
    help="[Experimental] Get info about your Serve application's config.",
    hidden=True,
@ -195,3 +285,56 @@ def info(address: str):
        print(json.dumps(response.json(), indent=4))
    else:
        log_failed_request(response, address)
@cli.command(
    help="[Experimental] Get your Serve application's status.",
    hidden=True,
 )
@click.option(
    "--address",
    "-a",
    default=os.environ.get("RAY_ADDRESS", "http://localhost:8265"),
    required=False,
    type=str,
    help='Address of the Ray dashboard to query. For example, "http://localhost:8265".',
 )
 def status(address: str):
    full_address_path = f"{address}/api/serve/deployments/status"
    response = requests.get(full_address_path)
    if response.status_code == 200:
        print(json.dumps(response.json(), indent=4))
    else:
        log_failed_request(response, address)
@cli.command(
    help="[Experimental] Get info about your Serve application's config.",
    hidden=True,
 )
@click.option(
    "--address",
    "-a",
    default=os.environ.get("RAY_ADDRESS", "http://localhost:8265"),
    required=False,
    type=str,
    help='Address of the Ray dashboard to query. For example, "http://localhost:8265".',
 )
@click.option("--yes", "-y", is_flag=True, help="Bypass confirmation prompt.")
 def delete(address: str, yes: bool):
    if not yes:
        click.confirm(
            f"\nThis will shutdown the Serve application at address "
            f'"{address}" and delete all deployments there. Do you '
            "want to continue?",
            abort=True,
        )
    full_address_path = f"{address}/api/serve/deployments/"
    response = requests.delete(full_address_path)
    if response.status_code == 200:
        cli_logger.newline()
        cli_logger.success("\nSent delete request successfully!\n")
        cli_logger.newline()
    else:
        log_failed_request(response, address)
--- a/python/ray/serve/tests/test_cli.py
+++ b/python/ray/serve/tests/test_cli.py
@ -3,13 +3,14 @@ import os
 from pathlib import Path
 import subprocess
 import sys
-
+import signal
 import pytest
 import requests
 import ray
 from ray import serve
 from ray.tests.conftest import tmp_working_dir  # noqa: F401, E501
 from ray._private.test_utils import wait_for_condition
 from ray.dashboard.optional_utils import RAY_INTERNAL_DASHBOARD_NAMESPACE
@ -164,6 +165,8 @@ def test_deploy(ray_start_stop):
                == deployment_config["response"]
            )
    ray.shutdown()
@pytest.mark.skipif(sys.platform == "win32", reason="File path incorrect on Windows.")
 def test_info(ray_start_stop):
@ -222,5 +225,88 @@ def test_info(ray_start_stop):
    )
@pytest.mark.skipif(sys.platform == "win32", reason="File path incorrect on Windows.")
 def test_status(ray_start_stop):
    # Deploys a config file and checks its status
    config_file_name = os.path.join(
        os.path.dirname(__file__), "test_config_files", "three_deployments.yaml"
    )
    subprocess.check_output(["serve", "deploy", config_file_name])
    status_response = subprocess.check_output(["serve", "status"])
    statuses = json.loads(status_response)["statuses"]
    expected_deployments = {"shallow", "deep", "one"}
    for status in statuses:
        expected_deployments.remove(status["name"])
        assert status["status"] in {"HEALTHY", "UPDATING"}
        assert "message" in status
    assert len(expected_deployments) == 0
@pytest.mark.skipif(sys.platform == "win32", reason="File path incorrect on Windows.")
 def test_delete(ray_start_stop):
    # Deploys a config file and deletes it
    def get_num_deployments():
        info_response = subprocess.check_output(["serve", "info"])
        info = json.loads(info_response)
        return len(info["deployments"])
    config_file_name = os.path.join(
        os.path.dirname(__file__), "test_config_files", "two_deployments.yaml"
    )
    # Check idempotence
    for _ in range(2):
        subprocess.check_output(["serve", "deploy", config_file_name])
        wait_for_condition(lambda: get_num_deployments() == 2, timeout=35)
        subprocess.check_output(["serve", "delete", "-y"])
        wait_for_condition(lambda: get_num_deployments() == 0, timeout=35)
 def parrot(request):
    return request.query_params["sound"]
@pytest.mark.skipif(sys.platform == "win32", reason="File path incorrect on Windows.")
 def test_run(ray_start_stop):
    # Deploys valid config file and import path via serve run
    def ping_endpoint(endpoint: str, params: str = ""):
        try:
            return requests.get(f"http://localhost:8000/{endpoint}{params}").text
        except requests.exceptions.ConnectionError:
            return "connection error"
    # Deploy via config file
    config_file_name = os.path.join(
        os.path.dirname(__file__), "test_config_files", "two_deployments.yaml"
    )
    p = subprocess.Popen(["serve", "run", config_file_name])
    wait_for_condition(lambda: ping_endpoint("one") == "2", timeout=10)
    wait_for_condition(
        lambda: ping_endpoint("shallow") == "Hello shallow world!", timeout=10
    )
    p.send_signal(signal.SIGINT)  # Equivalent to ctrl-C
    p.wait()
    assert ping_endpoint("one") == "connection error"
    assert ping_endpoint("shallow") == "connection error"
    # Deploy via import path
    p = subprocess.Popen(["serve", "run", "ray.serve.tests.test_cli.parrot"])
    wait_for_condition(
        lambda: ping_endpoint("parrot", params="?sound=squawk") == "squawk", timeout=10
    )
    p.send_signal(signal.SIGINT)  # Equivalent to ctrl-C
    p.wait()
    assert ping_endpoint("parrot", params="?sound=squawk") == "connection error"
 if __name__ == "__main__":
    sys.exit(pytest.main(["-v", "-s", __file__]))