Mirror of https://github.com/vale981/ray (synced 2025-03-06 18:41:40 -05:00)

* Add scalability tests
* Network overhead cluster
* Update xgboost tests
* Document release tests
* Don't raise on failed trial
* Update to multi node yamls
* Update yamls
* Revert xgboost test changes
* Fix import
* Update release/tune_tests/scalability_tests/workloads/test_bookkeeping_overhead.py
  Co-authored-by: Richard Liaw <rliaw@berkeley.edu>
* Pass aws credentials (WIP)
* Update durable trainable example
* Update xgboost sweep
* Change xgboost scope, fix durable trainable stop condition
* Fix max depth to limit total test length
* Add cluster information to test descriptions. Update release checklist/process docs

Co-authored-by: Richard Liaw <rliaw@berkeley.edu>
40 lines
809 B
YAML
40 lines
809 B
YAML
# Cluster configuration for the Ray Tune scalability release tests.
# Defines a single node type (m5.8xlarge, 32 CPUs) that is used for both the
# head node and the default worker type; every max_workers setting is 0.
cluster_name: ray-tune-scalability-tests-1x32_hd

# Cluster-wide worker cap. The per-node-type cap further down is also 0.
max_workers: 0
upscaling_speed: 1

idle_timeout_minutes: 0

# Container settings: image, container name, and whether to pull before run.
docker:
  image: anyscale/ray:nightly
  container_name: ray_container
  pull_before_run: true

# Cloud provider and placement.
provider:
  type: aws
  region: us-west-2
  availability_zone: us-west-2a
  cache_stopped_nodes: false

available_node_types:
  cpu_32_hd_ondemand:
    # NOTE(review): node_config keys look like EC2 launch parameters passed
    # through to the provider - confirm against the Ray AWS provider docs.
    node_config:
      InstanceType: m5.8xlarge

      # VolumeSize presumably in GiB (EC2 convention) - TODO confirm.
      BlockDeviceMappings:
        - DeviceName: /dev/sda1
          Ebs:
            VolumeSize: 160

    resources: {"CPU": 32}  # 128 GB memory
    min_workers: 0
    max_workers: 0

auth:
  ssh_user: ubuntu

# Both roles reference the single node type declared above.
head_node_type: cpu_32_hd_ondemand
# NOTE(review): worker_default_node_type may be deprecated in newer Ray
# releases - confirm before upgrading the autoscaler schema.
worker_default_node_type: cpu_32_hd_ondemand

setup_commands:
  - ray install-nightly