# ray/release/ml_user_tests/ml_user_tests.yaml
# Source-viewer metadata: 124 lines, 2.7 KiB, YAML.

# Horovod user test, "latest" variant (per the entry name).
# NOTE(review): indentation was lost in the copy under review; the nesting
# below is reconstructed from key order - confirm against the upstream file.
- name: horovod_user_test_latest
  team: ml
  cluster:
    app_config: horovod/app_config.yaml
    compute_template: horovod/compute_tpl.yaml
  # NOTE(review): placed as a sibling of cluster/run; it may instead belong
  # under cluster - verify against the release test runner.
  driver_setup: horovod/driver_setup_latest.sh
  run:
    use_connect: true
    autosuspend_mins: 10
    # presumably seconds - TODO confirm
    timeout: 1200
    script: python horovod/horovod_user_test.py
# Horovod user test, "master" variant (per the entry name). Runs the same
# script as horovod_user_test_latest but with a different app_config and
# driver_setup script.
# NOTE(review): indentation was lost in the copy under review; the nesting
# below is reconstructed from key order - confirm against the upstream file.
- name: horovod_user_test_master
  team: ml
  cluster:
    # Lives outside this directory, under ../horovod_tests.
    app_config: ../horovod_tests/app_config_master.yaml
    compute_template: horovod/compute_tpl.yaml
  # NOTE(review): placed as a sibling of cluster/run; it may instead belong
  # under cluster - verify against the release test runner.
  driver_setup: horovod/driver_setup_master.sh
  run:
    use_connect: true
    autosuspend_mins: 10
    # presumably seconds - TODO confirm
    timeout: 1200
    script: python horovod/horovod_user_test.py
# TensorFlow MNIST training test (per the entry name and script path).
# NOTE(review): indentation was lost in the copy under review; the nesting
# below is reconstructed from key order - confirm against the upstream file.
- name: train_tensorflow_mnist_test
  team: ml
  cluster:
    app_config: train/app_config.yaml
    compute_template: train/compute_tpl.yaml
  # NOTE(review): placed as a sibling of cluster/run; it may instead belong
  # under cluster - verify against the release test runner.
  driver_setup: train/driver_setup.sh
  run:
    use_connect: true
    # NOTE(review): 30x the 1200 used by most other entries in this file and
    # no autosuspend_mins is set - confirm both are intentional.
    timeout: 36000
    script: python train/train_tensorflow_mnist_test.py
# Torch linear training test (per the entry name and script path). Uses the
# same cluster config and driver_setup script as train_tensorflow_mnist_test.
# NOTE(review): indentation was lost in the copy under review; the nesting
# below is reconstructed from key order - confirm against the upstream file.
- name: train_torch_linear_test
  team: ml
  cluster:
    app_config: train/app_config.yaml
    compute_template: train/compute_tpl.yaml
  # NOTE(review): placed as a sibling of cluster/run; it may instead belong
  # under cluster - verify against the release test runner.
  driver_setup: train/driver_setup.sh
  run:
    use_connect: true
    # NOTE(review): 30x the 1200 used by most other entries in this file and
    # no autosuspend_mins is set - confirm both are intentional.
    timeout: 36000
    script: python train/train_torch_linear_test.py
# XGBoost GPU connect test, "latest" variant (per the entry name).
# This entry defines no driver_setup script.
# NOTE(review): indentation was lost in the copy under review; the nesting
# below is reconstructed from key order - confirm against the upstream file.
- name: xgboost_gpu_connect_latest
  team: ml
  cluster:
    app_config: xgboost/app_config_gpu.yaml
    compute_template: xgboost/tpl_gpu_small_scaling.yaml
  run:
    use_connect: true
    # presumably seconds - TODO confirm
    timeout: 1200
    script: python xgboost/train_gpu_connect.py
# XGBoost GPU connect test, "master" variant (per the entry name). Differs
# from xgboost_gpu_connect_latest only in its app_config file.
# This entry defines no driver_setup script.
# NOTE(review): indentation was lost in the copy under review; the nesting
# below is reconstructed from key order - confirm against the upstream file.
- name: xgboost_gpu_connect_master
  team: ml
  cluster:
    app_config: xgboost/app_config_gpu_master.yaml
    compute_template: xgboost/tpl_gpu_small_scaling.yaml
  run:
    use_connect: true
    # presumably seconds - TODO confirm
    timeout: 1200
    script: python xgboost/train_gpu_connect.py
# Ray Lightning user test, "latest" variant (per the entry name).
# NOTE(review): indentation was lost in the copy under review; the nesting
# below is reconstructed from key order - confirm against the upstream file.
- name: ray_lightning_user_test_latest
  team: ml
  cluster:
    app_config: ray-lightning/app_config.yaml
    compute_template: ray-lightning/compute_tpl.yaml
  # NOTE(review): placed as a sibling of cluster/run; it may instead belong
  # under cluster - verify against the release test runner.
  driver_setup: ray-lightning/driver_setup.sh
  run:
    use_connect: true
    autosuspend_mins: 10
    # presumably seconds - TODO confirm
    timeout: 1200
    script: python ray-lightning/ray_lightning_user_test.py
# Ray Lightning user test, "master" variant (per the entry name). Differs
# from ray_lightning_user_test_latest only in its app_config file.
# NOTE(review): indentation was lost in the copy under review; the nesting
# below is reconstructed from key order - confirm against the upstream file.
- name: ray_lightning_user_test_master
  team: ml
  cluster:
    app_config: ray-lightning/app_config_master.yaml
    compute_template: ray-lightning/compute_tpl.yaml
  # NOTE(review): placed as a sibling of cluster/run; it may instead belong
  # under cluster - verify against the release test runner.
  driver_setup: ray-lightning/driver_setup.sh
  run:
    use_connect: true
    autosuspend_mins: 10
    # presumably seconds - TODO confirm
    timeout: 1200
    script: python ray-lightning/ray_lightning_user_test.py
# Tune + RLlib connect test (per the entry name and script path).
# NOTE(review): indentation was lost in the copy under review; the nesting
# below is reconstructed from key order - confirm against the upstream file.
- name: tune_rllib_connect_test
  team: ml
  cluster:
    # Lives outside this directory, under ../rllib_tests.
    app_config: ../rllib_tests/app_config.yaml
    compute_template: tune_rllib/compute_tpl.yaml
  # NOTE(review): placed as a sibling of cluster/run; it may instead belong
  # under cluster - verify against the release test runner.
  driver_setup: tune_rllib/driver_setup.sh
  run:
    use_connect: true
    autosuspend_mins: 10
    # presumably seconds - TODO confirm
    timeout: 1200
    script: python tune_rllib/run_connect_tests.py