[release] Migrate Tune + XGBoost tests to new infrastructure (#22705)

Migrate the XGBoost and Tune tests to the new release testing infrastructure.

Buildkite build: https://buildkite.com/ray-project/release-tests-branch/builds/50
This commit is contained in:
Kai Fricke 2022-03-01 08:10:06 +01:00 committed by GitHub
parent 7b22d662df
commit d06c3ffd6f
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
2 changed files with 59 additions and 59 deletions

View file

@ -207,33 +207,33 @@ NIGHTLY_TESTS = {
"~/ray/release/sgd_tests/sgd_tests.yaml": [
"sgd_gpu",
],
"~/ray/release/tune_tests/cloud_tests/tune_cloud_tests.yaml": [
"aws_no_sync_down",
"aws_ssh_sync",
"aws_durable_upload",
"aws_durable_upload_rllib_str",
"aws_durable_upload_rllib_trainer",
"gcp_k8s_durable_upload",
],
"~/ray/release/tune_tests/scalability_tests/tune_tests.yaml": [
"bookkeeping_overhead",
"durable_trainable",
SmokeTest("long_running_large_checkpoints"),
SmokeTest("network_overhead"),
"result_throughput_cluster",
"result_throughput_single_node",
],
"~/ray/release/xgboost_tests/xgboost_tests.yaml": [
"train_small",
"train_moderate",
"train_gpu",
"tune_small",
"tune_4x32",
"tune_32x4",
"ft_small_elastic",
"ft_small_non_elastic",
"distributed_api_test",
],
# "~/ray/release/tune_tests/cloud_tests/tune_cloud_tests.yaml": [
# "aws_no_sync_down",
# "aws_ssh_sync",
# "aws_durable_upload",
# "aws_durable_upload_rllib_str",
# "aws_durable_upload_rllib_trainer",
# "gcp_k8s_durable_upload",
# ],
# "~/ray/release/tune_tests/scalability_tests/tune_tests.yaml": [
# "bookkeeping_overhead",
# "durable_trainable",
# SmokeTest("long_running_large_checkpoints"),
# SmokeTest("network_overhead"),
# "result_throughput_cluster",
# "result_throughput_single_node",
# ],
# "~/ray/release/xgboost_tests/xgboost_tests.yaml": [
# "train_small",
# "train_moderate",
# "train_gpu",
# "tune_small",
# "tune_4x32",
# "tune_32x4",
# "ft_small_elastic",
# "ft_small_non_elastic",
# "distributed_api_test",
# ],
"~/ray/release/rllib_tests/rllib_tests.yaml": [
SmokeTest("learning_tests"),
SmokeTest("stress_tests"),
@ -259,11 +259,11 @@ WEEKLY_TESTS = {
"/long_running_distributed.yaml": [
"pytorch_pbt_failure",
],
"~/ray/release/tune_tests/scalability_tests/tune_tests.yaml": [
"network_overhead",
"long_running_large_checkpoints",
"xgboost_sweep",
],
# "~/ray/release/tune_tests/scalability_tests/tune_tests.yaml": [
# "network_overhead",
# "long_running_large_checkpoints",
# "xgboost_sweep",
# ],
"~/ray/release/rllib_tests/rllib_tests.yaml": [
"learning_tests",
"stress_tests",

View file

@ -17,7 +17,7 @@
#
# # How often to run the tests.
# # One of [disabled, any, multi, nightly, weekly].
# frequency: disabled # weekly
# frequency: weekly
# # Owning team. This field will be persisted to the database
# team: ml
#
@ -77,7 +77,7 @@
# smoke_test:
# # Smoke tests can have different frequencies. A smoke test is only triggered
# # when the regular test is not matched.
# frequency: disabled # nightly
# frequency: nightly
# # Here we adjust the run timeout down and run on less nodes. The test script
# # remains the same.
# run:
@ -130,7 +130,7 @@
test_name: train_moderate
test_suite: xgboost_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -158,7 +158,7 @@
test_name: train_gpu
test_suite: xgboost_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -186,7 +186,7 @@
test_name: distributed_api_test
test_suite: xgboost_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -213,7 +213,7 @@
test_name: ft_small_elastic
test_suite: xgboost_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -241,7 +241,7 @@
test_name: ft_small_non_elastic
test_suite: xgboost_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -269,7 +269,7 @@
test_name: tune_small
test_suite: xgboost_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -297,7 +297,7 @@
test_name: tune_32x4
test_suite: xgboost_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -325,7 +325,7 @@
test_name: tune_4x32
test_suite: xgboost_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -356,7 +356,7 @@
test_name: aws_no_sync_down
test_suite: tune_cloud_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -384,7 +384,7 @@
test_name: aws_ssh_sync
test_suite: tune_cloud_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -412,7 +412,7 @@
test_name: aws_durable_upload
test_suite: tune_cloud_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -440,7 +440,7 @@
test_name: aws_durable_upload_rllib_str
test_suite: tune_cloud_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -470,7 +470,7 @@
test_name: aws_durable_upload_rllib_trainer
test_suite: tune_cloud_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -499,7 +499,7 @@
test_name: gcp_k8s_no_sync_down
test_suite: tune_cloud_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -522,7 +522,7 @@
test_name: gcp_k8s_ssh_sync
test_suite: tune_cloud_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -545,7 +545,7 @@
test_name: gcp_k8s_durable_upload
test_suite: tune_cloud_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -573,7 +573,7 @@
test_name: bookkeeping_overhead
test_suite: tune_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -596,7 +596,7 @@
test_name: durable_trainable
test_suite: tune_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -623,7 +623,7 @@
test_name: long_running_large_checkpoints
test_suite: tune_tests
frequency: disabled # weekly
frequency: weekly
team: ml
cluster:
cluster_env: app_config.yaml
@ -637,7 +637,7 @@
file_manager: sdk
smoke_test:
frequency: disabled # nightly
frequency: nightly
run:
timeout: 3600
@ -651,7 +651,7 @@
test_name: network_overhead
test_suite: tune_tests
frequency: disabled # weekly
frequency: weekly
team: ml
cluster:
cluster_env: app_config.yaml
@ -669,7 +669,7 @@
file_manager: sdk
smoke_test:
frequency: disabled # nightly
frequency: nightly
cluster:
compute_template: tpl_20x2.yaml
@ -691,7 +691,7 @@
test_name: result_throughput_cluster
test_suite: tune_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
cluster_env: app_config.yaml
@ -718,7 +718,7 @@
test_name: result_throughput_single_node
test_suite: tune_tests
frequency: disabled # nightly
frequency: nightly
team: ml
cluster:
@ -741,7 +741,7 @@
test_name: xgboost_sweep
test_suite: tune_tests
frequency: disabled # weekly
frequency: weekly
team: ml
cluster: