Mirror of https://github.com/vale981/ray (synced 2025-03-05 18:11:42 -05:00)
[Serve] Add serve failure test to CI (#20392)
This commit is contained in:
parent 693063d6f8
commit ca90c63483
3 changed files with 34 additions and 3 deletions
|
@@ -222,6 +222,9 @@
|
||||||
- bazel test --config=ci $(./scripts/bazel_export_options)
|
- bazel test --config=ci $(./scripts/bazel_export_options)
|
||||||
--test_tag_filters=-post_wheel_build
|
--test_tag_filters=-post_wheel_build
|
||||||
python/ray/serve/...
|
python/ray/serve/...
|
||||||
|
- bazel test --config=ci $(./scripts/bazel_export_options)
|
||||||
|
--test_tag_filters=team:serve
|
||||||
|
release/...
|
||||||
|
|
||||||
- label: ":python: Minimal install"
|
- label: ":python: Minimal install"
|
||||||
conditions: ["RAY_CI_PYTHON_AFFECTED"]
|
conditions: ["RAY_CI_PYTHON_AFFECTED"]
|
||||||
|
|
21
release/BUILD
Normal file
21
release/BUILD
Normal file
|
@@ -0,0 +1,21 @@
|
||||||
|
load("@rules_python//python:defs.bzl", "py_test")
|
||||||
|
|
||||||
|
test_srcs = glob(["**/*.py"])
|
||||||
|
|
||||||
|
py_test(
|
||||||
|
name = "serve_failure_smoke_test",
|
||||||
|
size = "medium",
|
||||||
|
srcs = test_srcs,
|
||||||
|
env = {
|
||||||
|
"IS_SMOKE_TEST": "1",
|
||||||
|
},
|
||||||
|
main = "serve_failure.py",
|
||||||
|
tags = [
|
||||||
|
"exclusive",
|
||||||
|
"team:serve",
|
||||||
|
],
|
||||||
|
deps = [
|
||||||
|
"//:ray_lib",
|
||||||
|
"//python/ray/serve:serve_lib",
|
||||||
|
],
|
||||||
|
)
|
|
@@ -24,6 +24,8 @@ NUM_NODES = 4
|
||||||
# RandomTest setup constants
|
# RandomTest setup constants
|
||||||
CPUS_PER_NODE = 10
|
CPUS_PER_NODE = 10
|
||||||
|
|
||||||
|
IS_SMOKE_TEST = "IS_SMOKE_TEST" in os.environ
|
||||||
|
|
||||||
|
|
||||||
def update_progress(result):
|
def update_progress(result):
|
||||||
"""
|
"""
|
||||||
|
@@ -54,7 +56,8 @@ ray.init(
|
||||||
namespace="serve_failure_test",
|
namespace="serve_failure_test",
|
||||||
address=cluster.address,
|
address=cluster.address,
|
||||||
dashboard_host="0.0.0.0",
|
dashboard_host="0.0.0.0",
|
||||||
log_to_driver=True)
|
log_to_driver=True,
|
||||||
|
)
|
||||||
serve.start(detached=True)
|
serve.start(detached=True)
|
||||||
|
|
||||||
|
|
||||||
|
@@ -124,7 +127,7 @@ class RandomTest:
|
||||||
start_time = time.time()
|
start_time = time.time()
|
||||||
previous_time = start_time
|
previous_time = start_time
|
||||||
while True:
|
while True:
|
||||||
for _ in range(100):
|
for _ in range(20):
|
||||||
actions, weights = zip(*self.weighted_actions)
|
actions, weights = zip(*self.weighted_actions)
|
||||||
action_chosen = random.choices(actions, weights=weights)[0]
|
action_chosen = random.choices(actions, weights=weights)[0]
|
||||||
print(f"Executing {action_chosen}")
|
print(f"Executing {action_chosen}")
|
||||||
|
@@ -146,7 +149,11 @@ class RandomTest:
|
||||||
previous_time = new_time
|
previous_time = new_time
|
||||||
iteration += 1
|
iteration += 1
|
||||||
|
|
||||||
|
if IS_SMOKE_TEST:
|
||||||
|
break
|
||||||
|
|
||||||
|
|
||||||
|
tester = RandomTest(max_deployments=NUM_NODES * CPUS_PER_NODE)
|
||||||
random_killer = RandomKiller.remote()
|
random_killer = RandomKiller.remote()
|
||||||
random_killer.run.remote()
|
random_killer.run.remote()
|
||||||
RandomTest(max_deployments=NUM_NODES * CPUS_PER_NODE).run()
|
tester.run()
|
||||||
|
|
Loading…
Add table
Reference in a new issue