mirror of
https://github.com/vale981/ray
synced 2025-03-06 10:31:39 -05:00

* Add scalability tests * Network overhead cluster * Update xgboost tests * Document release tests * Don't raise on failed trial * Update to multi node yamls * Update yamls * Revert xgboost test changes * Fix import * Update release/tune_tests/scalability_tests/workloads/test_bookkeeping_overhead.py Co-authored-by: Richard Liaw <rliaw@berkeley.edu> * Pass aws credentials (WIP) * Update durable trainable example * Update xgboost sweep * Change xgboost scope, fix durable trainable stop condition * Fix max depth to limit total test length * Add cluster information to test descriptions. Update release checklist/process docs Co-authored-by: Richard Liaw <rliaw@berkeley.edu>
42 lines
867 B
YAML
42 lines
867 B
YAML
# Ray autoscaler cluster definition for the Tune scalability tests.
# Layout: one on-demand head node plus up to 15 spot workers; both node
# types use m5.16xlarge instances and declare 64 CPUs each.
cluster_name: ray-tune-scalability-tests-16x64

# Top-level worker limit; matches max_workers of the cpu_64_spot type below.
max_workers: 15
upscaling_speed: 15

idle_timeout_minutes: 0

# Container settings: image, container name, and pull-before-run flag.
docker:
  image: anyscale/ray:nightly
  container_name: ray_container
  pull_before_run: true

# Cloud provider settings (AWS, pinned to one region / availability zone).
provider:
  type: aws
  region: us-west-2
  availability_zone: us-west-2a
  cache_stopped_nodes: false

available_node_types:
  # On-demand type; referenced by head_node_type below. Its worker counts
  # are both zero.
  cpu_64_ondemand:
    node_config:
      InstanceType: m5.16xlarge
    resources:
      CPU: 64
    min_workers: 0
    max_workers: 0
  # Spot type; referenced by worker_default_node_type below. min_workers
  # and max_workers are both 15.
  cpu_64_spot:
    node_config:
      InstanceType: m5.16xlarge
      InstanceMarketOptions:
        MarketType: spot
    resources:
      CPU: 64
    min_workers: 15
    max_workers: 15

auth:
  ssh_user: ubuntu

head_node_type: cpu_64_ondemand
worker_default_node_type: cpu_64_spot

setup_commands:
  - ray install-nightly