ray/benchmarks/benchmark_tests.yaml
Yi Cheng 72c9fef5f3
[nightly] Enable GCS HA nightly test with bootstrap (#21389)
After https://github.com/ray-project/ray/pull/21232, we are able to start Ray without Redis. We need to bake the tests for a while before turning the flag on by default.
This PR adds tests for this.
2022-01-05 10:53:07 -08:00

210 lines
4.7 KiB
YAML

# single_node: runs single_node/test_single_node.py on the cluster described by
# single_node.yaml. `prepare` is `sleep 0`, i.e. effectively a no-op; there is
# no wait_cluster.py step as in the multi-node entries.
- name: single_node
  owner:
    mail: "core@anyscale.com"
    slack: "@Alex Wu"
  cluster:
    app_config: app_config.yaml
    compute_template: single_node.yaml
  run:
    # Seconds, going by the `3600 # 1hr` annotations used elsewhere in this file.
    timeout: 12000  # 3h20m
    prepare: sleep 0
    script: python single_node/test_single_node.py
# object_store: runs object_store/test_object_store.py on the cluster described
# by object_store.yaml. The prepare step calls distributed/wait_cluster.py with
# --num-nodes=50 before the script starts (presumably blocking until 50 nodes
# are up -- confirm against wait_cluster.py).
- name: object_store
  owner:
    mail: "core@anyscale.com"
    slack: "@Alex Wu"
  cluster:
    app_config: app_config.yaml
    compute_template: object_store.yaml
  run:
    timeout: 3600  # 1hr
    prepare: python distributed/wait_cluster.py --num-nodes=50
    script: python object_store/test_object_store.py
# many_actors: runs distributed/test_many_actors.py on the distributed.yaml
# compute template. The prepare step calls wait_cluster.py with --num-nodes=65.
- name: many_actors
  owner:
    mail: "core@anyscale.com"
    slack: "@Alex Wu"
  cluster:
    app_config: app_config.yaml
    compute_template: distributed.yaml
  run:
    timeout: 3600  # 1hr
    prepare: python distributed/wait_cluster.py --num-nodes=65
    script: python distributed/test_many_actors.py
# many_actors_smoke_test: same script as many_actors, but launched with
# SMOKE_TEST=1 in its environment, on the distributed_smoke_test.yaml compute
# template, and with wait_cluster.py asked for only 2 nodes.
- name: many_actors_smoke_test
  owner:
    mail: "core@anyscale.com"
    slack: "@Alex Wu"
  cluster:
    app_config: app_config.yaml
    compute_template: distributed_smoke_test.yaml
  run:
    timeout: 3600  # 1hr
    prepare: python distributed/wait_cluster.py --num-nodes=2
    script: SMOKE_TEST=1 python distributed/test_many_actors.py
# many_tasks: runs distributed/test_many_tasks.py with --num-tasks=10000 on the
# distributed.yaml compute template. The prepare step calls wait_cluster.py
# with --num-nodes=65.
- name: many_tasks
  owner:
    mail: "core@anyscale.com"
    slack: "@Alex Wu"
  cluster:
    app_config: app_config.yaml
    compute_template: distributed.yaml
  run:
    timeout: 3600  # 1hr
    prepare: python distributed/wait_cluster.py --num-nodes=65
    script: python distributed/test_many_tasks.py --num-tasks=10000
# many_tasks_smoke_test: same script as many_tasks on the
# distributed_smoke_test.yaml compute template, with a 2-node wait.
# Unlike the other *_smoke_test entries this one does not set SMOKE_TEST=1;
# the workload is reduced through --num-tasks=100 instead.
- name: many_tasks_smoke_test
  owner:
    mail: "core@anyscale.com"
    slack: "@Alex Wu"
  cluster:
    app_config: app_config.yaml
    compute_template: distributed_smoke_test.yaml
  run:
    timeout: 3600  # 1hr
    prepare: python distributed/wait_cluster.py --num-nodes=2
    script: python distributed/test_many_tasks.py --num-tasks=100
# many_pgs: runs distributed/test_many_pgs.py on the distributed.yaml compute
# template. The prepare step calls wait_cluster.py with --num-nodes=65.
- name: many_pgs
  owner:
    mail: "core@anyscale.com"
    slack: "@Alex Wu"
  cluster:
    app_config: app_config.yaml
    compute_template: distributed.yaml
  run:
    timeout: 3600  # 1hr
    prepare: python distributed/wait_cluster.py --num-nodes=65
    script: python distributed/test_many_pgs.py
# many_pgs_smoke_test: same script as many_pgs, but launched with SMOKE_TEST=1
# in its environment, on the distributed_smoke_test.yaml compute template, and
# with wait_cluster.py asked for only 2 nodes.
- name: many_pgs_smoke_test
  owner:
    mail: "core@anyscale.com"
    slack: "@Alex Wu"
  cluster:
    app_config: app_config.yaml
    compute_template: distributed_smoke_test.yaml
  run:
    timeout: 3600  # 1hr
    prepare: python distributed/wait_cluster.py --num-nodes=2
    script: SMOKE_TEST=1 python distributed/test_many_pgs.py
# many_nodes: runs distributed/test_many_tasks.py with --num-tasks=1000 on the
# many_nodes.yaml compute template. The prepare step calls wait_cluster.py with
# --num-nodes=250.
# NOTE: No smoke test for this entry, since it shares its script with
# many_tasks_smoke_test.
- name: many_nodes
  owner:
    mail: "core@anyscale.com"
    slack: "@Alex Wu"
  cluster:
    app_config: app_config.yaml
    compute_template: many_nodes.yaml
  run:
    timeout: 3600  # 1hr
    prepare: python distributed/wait_cluster.py --num-nodes=250
    script: python distributed/test_many_tasks.py --num-tasks=1000
# many_tasks_redis_ha: same compute template, prepare step and script as
# many_tasks, plus three RAY_* overrides listed under app_env_vars.
# NOTE(review): app_env_vars and stable are placed as entry-level keys
# (siblings of run); confirm this is where the release-test runner reads them.
- name: many_tasks_redis_ha
  owner:
    mail: "core@anyscale.com"
    slack: "@Yi Cheng"
  cluster:
    app_config: app_config.yaml
    compute_template: distributed.yaml
  run:
    timeout: 3600  # 1hr
    prepare: python distributed/wait_cluster.py --num-nodes=65
    script: python distributed/test_many_tasks.py --num-tasks=10000
  # Values are quoted so they stay strings rather than YAML ints/bools.
  app_env_vars:
    RAY_gcs_grpc_based_pubsub: "1"
    RAY_gcs_storage: "memory"
    RAY_bootstrap_with_gcs: "1"
  # Presumably marks this variant as not yet stable while it bakes; verify
  # how the runner interprets the flag.
  stable: false
# many_actors_redis_ha: same compute template, prepare step and script as
# many_actors, plus three RAY_* overrides listed under app_env_vars.
# NOTE(review): app_env_vars and stable are placed as entry-level keys
# (siblings of run); confirm this is where the release-test runner reads them.
- name: many_actors_redis_ha
  owner:
    mail: "core@anyscale.com"
    slack: "@Yi Cheng"
  cluster:
    app_config: app_config.yaml
    compute_template: distributed.yaml
  run:
    timeout: 3600  # 1hr
    prepare: python distributed/wait_cluster.py --num-nodes=65
    script: python distributed/test_many_actors.py
  # Values are quoted so they stay strings rather than YAML ints/bools.
  app_env_vars:
    RAY_gcs_grpc_based_pubsub: "1"
    RAY_gcs_storage: "memory"
    RAY_bootstrap_with_gcs: "1"
  # Presumably marks this variant as not yet stable while it bakes; verify
  # how the runner interprets the flag.
  stable: false
# many_nodes_redis_ha: same compute template, prepare step and script as
# many_nodes, plus three RAY_* overrides listed under app_env_vars.
# NOTE(review): app_env_vars and stable are placed as entry-level keys
# (siblings of run); confirm this is where the release-test runner reads them.
- name: many_nodes_redis_ha
  owner:
    mail: "core@anyscale.com"
    slack: "@Yi Cheng"
  cluster:
    app_config: app_config.yaml
    compute_template: many_nodes.yaml
  run:
    timeout: 3600  # 1hr
    prepare: python distributed/wait_cluster.py --num-nodes=250
    script: python distributed/test_many_tasks.py --num-tasks=1000
  # Values are quoted so they stay strings rather than YAML ints/bools.
  app_env_vars:
    RAY_gcs_grpc_based_pubsub: "1"
    RAY_gcs_storage: "memory"
    RAY_bootstrap_with_gcs: "1"
  # Presumably marks this variant as not yet stable while it bakes; verify
  # how the runner interprets the flag.
  stable: false
# many_pgs_redis_ha: same compute template, prepare step and script as
# many_pgs, plus three RAY_* overrides listed under app_env_vars.
# NOTE(review): app_env_vars and stable are placed as entry-level keys
# (siblings of run); confirm this is where the release-test runner reads them.
- name: many_pgs_redis_ha
  owner:
    mail: "core@anyscale.com"
    slack: "@Yi Cheng"
  cluster:
    app_config: app_config.yaml
    compute_template: distributed.yaml
  run:
    timeout: 3600  # 1hr
    prepare: python distributed/wait_cluster.py --num-nodes=65
    script: python distributed/test_many_pgs.py
  # Values are quoted so they stay strings rather than YAML ints/bools.
  app_env_vars:
    RAY_gcs_grpc_based_pubsub: "1"
    RAY_gcs_storage: "memory"
    RAY_bootstrap_with_gcs: "1"
  # Presumably marks this variant as not yet stable while it bakes; verify
  # how the runner interprets the flag.
  stable: false