[ci/release/ml] Run ML release tests on staging (#26168)

This moves all ML release tests to staging.

Signed-off-by: Kai Fricke <kai@anyscale.com>
This commit is contained in:
Kai Fricke 2022-06-30 13:24:28 -07:00 committed by GitHub
parent ac831fded4
commit e2d8e7a6ae
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
3 changed files with 70 additions and 5 deletions

View file

@ -7,11 +7,13 @@ python:
pip_packages: pip_packages:
- ray-lightning - ray-lightning
- tblib - tblib
- torch==1.9.0
conda_packages: [] conda_packages: []
post_build_cmds: post_build_cmds:
- pip uninstall -y ray || true && pip3 install -U {{ env["RAY_WHEELS"] | default("ray") }}
- {{ env["RAY_WHEELS_SANITY_CHECK"] | default("echo No Ray wheels sanity check") }}
# Upgrade the Ray Lightning version, otherwise it will be cached in the Anyscale Docker image. # Upgrade the Ray Lightning version, otherwise it will be cached in the Anyscale Docker image.
- echo {{ env["TIMESTAMP"] }} - echo {{ env["TIMESTAMP"] }}
- pip3 install -U ray-lightning - pip3 install -U --force-reinstall ray-lightning pytorch-lightning lightning-bolts
- pip3 install --force-reinstall torch==1.9.0
- pip uninstall -y ray || true && pip3 install -U {{ env["RAY_WHEELS"] | default("ray") }}
- {{ env["RAY_WHEELS_SANITY_CHECK"] | default("echo No Ray wheels sanity check") }}

View file

@ -8,12 +8,15 @@ python:
- tblib - tblib
# Need to have in pip_packages so it is installed on the driver. # Need to have in pip_packages so it is installed on the driver.
- git+https://github.com/ray-project/ray_lightning#ray_lightning - git+https://github.com/ray-project/ray_lightning#ray_lightning
- torch==1.9.0
conda_packages: [] conda_packages: []
post_build_cmds: post_build_cmds:
- pip uninstall -y ray || true && pip3 install -U {{ env["RAY_WHEELS"] | default("ray") }}
- {{ env["RAY_WHEELS_SANITY_CHECK"] | default("echo No Ray wheels sanity check") }}
# Upgrade the Ray Lightning version in post build commands, otherwise it will be cached in the Anyscale Docker image. # Upgrade the Ray Lightning version in post build commands, otherwise it will be cached in the Anyscale Docker image.
- echo {{ env["TIMESTAMP"] }} - echo {{ env["TIMESTAMP"] }}
- pip3 install -U --force-reinstall pytorch-lightning lightning-bolts
- pip uninstall ray_lightning -y # Uninstall first so pip does a reinstall. - pip uninstall ray_lightning -y # Uninstall first so pip does a reinstall.
- pip3 install -U --no-cache-dir git+https://github.com/ray-project/ray_lightning#ray_lightning - pip3 install -U --no-cache-dir git+https://github.com/ray-project/ray_lightning#ray_lightning
- pip3 install --force-reinstall torch==1.9.0
- pip uninstall -y ray || true && pip3 install -U {{ env["RAY_WHEELS"] | default("ray") }}
- {{ env["RAY_WHEELS_SANITY_CHECK"] | default("echo No Ray wheels sanity check") }}

View file

@ -104,6 +104,7 @@
frequency: weekly frequency: weekly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: horovod/app_config_master.yaml cluster_env: horovod/app_config_master.yaml
@ -141,6 +142,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -167,6 +169,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -194,6 +197,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config_gpu.yaml cluster_env: app_config_gpu.yaml
@ -221,6 +225,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -247,6 +252,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -274,6 +280,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -301,6 +308,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -328,6 +336,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -355,6 +364,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -385,6 +395,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -410,6 +421,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -436,6 +448,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -463,6 +476,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -490,6 +504,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -516,6 +531,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -542,6 +558,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -572,6 +589,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: horovod/app_config.yaml cluster_env: horovod/app_config.yaml
@ -595,6 +613,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: horovod/app_config_master.yaml cluster_env: horovod/app_config_master.yaml
@ -618,6 +637,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: train/app_config.yaml cluster_env: train/app_config.yaml
@ -641,6 +661,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: train/app_config.yaml cluster_env: train/app_config.yaml
@ -664,6 +685,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: xgboost/app_config_gpu.yaml cluster_env: xgboost/app_config_gpu.yaml
@ -686,6 +708,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: xgboost/app_config_gpu_master.yaml cluster_env: xgboost/app_config_gpu_master.yaml
@ -708,6 +731,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: ray-lightning/app_config.yaml cluster_env: ray-lightning/app_config.yaml
@ -731,6 +755,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: ray-lightning/app_config_master.yaml cluster_env: ray-lightning/app_config_master.yaml
@ -754,6 +779,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: ../rllib_tests/app_config.yaml cluster_env: ../rllib_tests/app_config.yaml
@ -782,6 +808,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -811,6 +838,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -840,6 +868,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -869,6 +898,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config_ml.yaml cluster_env: app_config_ml.yaml
@ -900,6 +930,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config_ml.yaml cluster_env: app_config_ml.yaml
@ -930,11 +961,13 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
cluster_compute: tpl_gcp_k8s_4x8.yaml cluster_compute: tpl_gcp_k8s_4x8.yaml
cloud_id: cld_k8WcxPgjUtSE8RVmfZpTLuKM # anyscale_k8s_gcp_cloud cloud_id: cld_k8WcxPgjUtSE8RVmfZpTLuKM # anyscale_k8s_gcp_cloud
autosuspend_mins: 60
run: run:
timeout: 600 timeout: 600
@ -958,11 +991,13 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
cluster_compute: tpl_gcp_k8s_4x8.yaml cluster_compute: tpl_gcp_k8s_4x8.yaml
cloud_id: cld_k8WcxPgjUtSE8RVmfZpTLuKM # anyscale_k8s_gcp_cloud cloud_id: cld_k8WcxPgjUtSE8RVmfZpTLuKM # anyscale_k8s_gcp_cloud
autosuspend_mins: 60
run: run:
timeout: 600 timeout: 600
@ -986,11 +1021,13 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
cluster_compute: tpl_gcp_k8s_4x8.yaml cluster_compute: tpl_gcp_k8s_4x8.yaml
cloud_id: cld_k8WcxPgjUtSE8RVmfZpTLuKM # anyscale_k8s_gcp_cloud cloud_id: cld_k8WcxPgjUtSE8RVmfZpTLuKM # anyscale_k8s_gcp_cloud
autosuspend_mins: 60
run: run:
timeout: 600 timeout: 600
@ -1017,6 +1054,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -1040,6 +1078,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -1066,6 +1105,7 @@
frequency: weekly frequency: weekly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -1095,6 +1135,7 @@
frequency: weekly frequency: weekly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -1134,6 +1175,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -1161,6 +1203,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -1184,6 +1227,7 @@
frequency: weekly frequency: weekly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config_data.yaml cluster_env: app_config_data.yaml
@ -1215,6 +1259,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: dask_xgboost_app_config.yaml cluster_env: dask_xgboost_app_config.yaml
@ -1240,6 +1285,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: modin_xgboost_app_config.yaml cluster_env: modin_xgboost_app_config.yaml
@ -1265,6 +1311,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: torch_tune_serve_app_config.yaml cluster_env: torch_tune_serve_app_config.yaml
@ -1320,6 +1367,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: ../rllib_tests/app_config.yaml cluster_env: ../rllib_tests/app_config.yaml
cluster_compute: tpl_cpu_3.yaml cluster_compute: tpl_cpu_3.yaml
@ -1351,6 +1399,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config_np.yaml cluster_env: app_config_np.yaml
cluster_compute: tpl_cpu_1_large.yaml cluster_compute: tpl_cpu_1_large.yaml
@ -1437,6 +1486,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: ../rllib_tests/app_config.yaml cluster_env: ../rllib_tests/app_config.yaml
cluster_compute: many_ppo.yaml cluster_compute: many_ppo.yaml
@ -1555,6 +1605,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: ../rllib_tests/app_config.yaml cluster_env: ../rllib_tests/app_config.yaml
cluster_compute: tpl_cpu_1.yaml cluster_compute: tpl_cpu_1.yaml
@ -1646,6 +1697,7 @@
frequency: weekly frequency: weekly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
cluster_compute: compute_tpl.yaml cluster_compute: compute_tpl.yaml
@ -2083,6 +2135,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -2114,6 +2167,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -2137,6 +2191,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -2160,6 +2215,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -2183,6 +2239,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -2206,6 +2263,7 @@
frequency: nightly frequency: nightly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -2229,6 +2287,7 @@
frequency: weekly frequency: weekly
team: ml team: ml
env: staging
cluster: cluster:
cluster_env: app_config.yaml cluster_env: app_config.yaml
@ -2579,6 +2638,7 @@
team: core team: core
frequency: nightly frequency: nightly
working_dir: microbenchmark working_dir: microbenchmark
env: prod
python: "3.7" python: "3.7"