ray/release/long_running_tests/workloads/serve.py

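"""Long-running Ray Serve workload.

Stands up a simulated multi-node Ray cluster, deploys a trivial batched
echo backend, and drives load at the /echo route with wrk in endless
60-minute rounds.
"""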
import time
import subprocess
from subprocess import PIPE

import requests

import ray
from ray import serve
from ray.cluster_utils import Cluster
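
# Cluster sizing knobs; the two memory limits are in bytes (10**8 = 100 MB).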
num_redis_shards = 1
redis_max_memory = 10**8
object_store_memory = 10**8
num_nodes = 4
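
# Build a simulated multi-node cluster in a single process. Only the head
# node (i == 0) runs Redis; each node also advertises a custom resource
# named after its index.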
cluster = Cluster()
for i in range(num_nodes):
    cluster.add_node(
        redis_port=6379 if i == 0 else None,
        num_redis_shards=num_redis_shards if i == 0 else None,
        num_cpus=8,
        num_gpus=0,
        resources={str(i): 2},
        object_store_memory=object_store_memory,
        redis_max_memory=redis_max_memory,
        dashboard_host="0.0.0.0",
    )
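
# Connect the driver to the simulated cluster; binding the dashboard to
# 0.0.0.0 makes it reachable from outside the machine.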
ray.init(address=cluster.address, dashboard_host="0.0.0.0")
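
# In the Serve API of this vintage, serve.start() returns a client handle
# through which backends and endpoints are managed.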
client = serve.start()
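

# accept_batch marks the backend as batch-capable: Serve coalesces up to
# max_batch_size queued requests and calls echo once with the whole list.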
@serve.accept_batch
def echo(requests_batch):
    time.sleep(0.01)  # Sleep for 10ms
    return ["hi" for _ in range(len(requests_batch))]
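

# Seven replicas, each handling batches of up to 16 requests.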
config = {"num_replicas": 7, "max_batch_size": 16}
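
# Wire the backend to an HTTP route: requests to /echo fan out across the
# "echo:v1" replicas.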
client.create_backend("echo:v1", echo, config=config)
client.create_endpoint("echo", backend="echo:v1", route="/echo")
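
# Issue a few requests up front so all replicas are serving before the
# load test begins.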
print("Warming up")
for _ in range(5):
    resp = requests.get("http://127.0.0.1:8000/echo").text
    print(resp)
    time.sleep(0.5)
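
# Size the load at 75% of theoretical capacity (num_replicas * max_batch_size):
# int(7 * 16 * 0.75) = 84 concurrent connections.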
connections = int(config["num_replicas"] * config["max_batch_size"] * 0.75)
num_threads = 2
time_to_run = "60m"
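
# Run wrk indefinitely in 60-minute rounds, printing its report after each.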
while True:
    proc = subprocess.Popen(
        [
            "wrk",
            "-c",
            str(connections),
            "-t",
            str(num_threads),
            "-d",
            time_to_run,
            "http://127.0.0.1:8000/echo",
        ],
        stdout=PIPE,
        stderr=PIPE,
    )
    print("started load testing")
    # communicate() both waits for wrk to exit and drains its pipes; calling
    # proc.wait() first can deadlock once a pipe buffer fills.
    out, err = proc.communicate()
    print(out.decode())
    print(err.decode())