mirror of
https://github.com/vale981/ray
synced 2025-03-07 02:51:39 -05:00

The concept of a Serve Application, a data structure containing all information needed to deploy Serve on a Ray cluster, has surfaced during recent design discussions. This change introduces a formal Application data structure and refactors existing code to use it.
75 lines
2.5 KiB
Python
75 lines
2.5 KiB
Python
from aiohttp.web import Request, Response
|
|
import logging
|
|
|
|
import ray.dashboard.utils as dashboard_utils
|
|
import ray.dashboard.optional_utils as optional_utils
|
|
|
|
from ray import serve
|
|
from ray.serve.application import Application
|
|
from ray.serve.schema import (
|
|
serve_application_to_schema,
|
|
serve_application_status_to_schema,
|
|
)
|
|
from ray.serve.api import get_deployment_statuses
|
|
|
|
logger = logging.getLogger(__name__)
|
|
logger.setLevel(logging.INFO)
|
|
|
|
routes = optional_utils.ClassMethodRouteTable
|
|
|
|
|
|
class ServeHead(dashboard_utils.DashboardHeadModule):
|
|
def __init__(self, dashboard_head):
|
|
super().__init__(dashboard_head)
|
|
|
|
@routes.get("/api/serve/deployments/")
|
|
@optional_utils.init_ray_and_catch_exceptions(connect_to_serve=True)
|
|
async def get_all_deployments(self, req: Request) -> Response:
|
|
deployments = list(serve.list_deployments().values())
|
|
serve_application_schema = serve_application_to_schema(deployments=deployments)
|
|
return Response(
|
|
text=serve_application_schema.json(),
|
|
content_type="application/json",
|
|
)
|
|
|
|
@routes.get("/api/serve/deployments/status")
|
|
@optional_utils.init_ray_and_catch_exceptions(connect_to_serve=True)
|
|
async def get_all_deployment_statuses(self, req: Request) -> Response:
|
|
serve_application_status_schema = serve_application_status_to_schema(
|
|
get_deployment_statuses()
|
|
)
|
|
return Response(
|
|
text=serve_application_status_schema.json(),
|
|
content_type="application/json",
|
|
)
|
|
|
|
@routes.delete("/api/serve/deployments/")
|
|
@optional_utils.init_ray_and_catch_exceptions(connect_to_serve=True)
|
|
async def delete_serve_application(self, req: Request) -> Response:
|
|
serve.shutdown()
|
|
return Response()
|
|
|
|
@routes.put("/api/serve/deployments/")
|
|
@optional_utils.init_ray_and_catch_exceptions(connect_to_serve=True)
|
|
async def put_all_deployments(self, req: Request) -> Response:
|
|
app = Application.from_dict(await req.json())
|
|
app.deploy(blocking=False)
|
|
|
|
new_names = set()
|
|
for deployment in app:
|
|
new_names.add(deployment.name)
|
|
|
|
all_deployments = serve.list_deployments()
|
|
all_names = set(all_deployments.keys())
|
|
names_to_delete = all_names.difference(new_names)
|
|
for name in names_to_delete:
|
|
all_deployments[name].delete()
|
|
|
|
return Response()
|
|
|
|
async def run(self, server):
|
|
pass
|
|
|
|
@staticmethod
|
|
def is_minimal_module():
|
|
return False
|