[Test] Handle flaky tests (#16602)

* Handle flaky tests.

* lint

* tag more

* add test_scheduling

* Remove global gc

Co-authored-by: Amog Kamsetty <amogkamsetty@yahoo.com>
This commit is contained in:
SangBin Cho 2021-06-23 16:24:12 -07:00 committed by GitHub
parent b9e5ca4c18
commit f816f613c7
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
4 changed files with 69 additions and 41 deletions

View file

@ -25,7 +25,7 @@ steps:
commands:
- *prelude_commands
- TORCH_VERSION=1.6 ./ci/travis/install-dependencies.sh
- bazel test --config=ci $(./scripts/bazel_export_options) --build_tests_only --test_tag_filters=-flaky --
- bazel test --config=ci $(./scripts/bazel_export_options) --build_tests_only --test_tag_filters=-flaky,-flaky-mac --
//:all python/ray/serve/... python/ray/new_dashboard/... -rllib/... -core_worker_test
- label: ":mac: :apple: Small and Large"
@ -35,7 +35,7 @@ steps:
- bazel test $(./scripts/bazel_export_options) --config=ci
--test_env=CONDA_EXE --test_env=CONDA_PYTHON_EXE --test_env=CONDA_SHLVL --test_env=CONDA_PREFIX
--test_env=CONDA_DEFAULT_ENV --test_env=CONDA_PROMPT_MODIFIER
--test_tag_filters=-kubernetes,-jenkins_only,-medium_size_python_tests_a_to_j,-medium_size_python_tests_k_to_z,-flaky
--test_tag_filters=-kubernetes,-jenkins_only,-medium_size_python_tests_a_to_j,-medium_size_python_tests_k_to_z,-flaky,-flaky-mac
python/ray/tests/...
- label: ":mac: :apple: Medium A-J"
@ -43,7 +43,7 @@ steps:
commands:
- *prelude_commands
- bazel test --config=ci $(./scripts/bazel_export_options)
--test_tag_filters=-kubernetes,-jenkins_only,medium_size_python_tests_a_to_j,-flaky
--test_tag_filters=-kubernetes,-jenkins_only,medium_size_python_tests_a_to_j,-flaky,-flaky-mac
python/ray/tests/...
- label: ":mac: :apple: Medium K-Z"
@ -51,7 +51,7 @@ steps:
commands:
- *prelude_commands
- bazel test --config=ci $(./scripts/bazel_export_options)
--test_tag_filters=-kubernetes,-jenkins_only,medium_size_python_tests_k_to_z,-flaky
--test_tag_filters=-kubernetes,-jenkins_only,medium_size_python_tests_k_to_z,-flaky,-flaky-mac
python/ray/tests/...
- label: ":mac: :apple: :snowflake: Flaky"
@ -60,7 +60,7 @@ steps:
- *prelude_commands
- RLLIB_TESTING=1 ./ci/travis/install-dependencies.sh
- bazel test --config=ci $(./scripts/bazel_export_options)
--test_tag_filters=-kubernetes,-jenkins_only,flaky
--test_tag_filters=-kubernetes,-jenkins_only,flaky,flaky-mac
--test_env=CONDA_EXE
--test_env=CONDA_PYTHON_EXE
--test_env=CONDA_SHLVL

View file

@ -52,17 +52,6 @@ py_test_module_list(
deps = ["//:ray_lib"],
)
py_test_module_list(
files = [
"test_actor.py",
"test_memstat.py",
],
size = "medium",
extra_srcs = SRCS,
tags = ["exclusive", "medium_size_python_tests_a_to_j", "flaky"],
deps = ["//:ray_lib"],
)
py_test_module_list(
files = [
"test_memory_scheduling.py",
@ -80,7 +69,6 @@ py_test_module_list(
"test_resource_demand_scheduler.py",
"test_runtime_env_env_vars.py",
"test_runtime_env_fork_process.py",
"test_scheduling.py",
"test_serialization.py",
"test_shuffle.py",
"test_stress.py",
@ -94,28 +82,6 @@ py_test_module_list(
deps = ["//:ray_lib"],
)
py_test_module_list(
files = [
"test_object_spilling_2.py",
"test_object_manager.py",
"test_multi_tenancy.py",
],
size = "medium",
extra_srcs = SRCS,
tags = ["exclusive", "medium_size_python_tests_k_to_z", "flaky"],
deps = ["//:ray_lib"],
)
py_test_module_list(
files = [
"test_runtime_env_complicated.py"
],
size = "large",
extra_srcs = SRCS,
tags = ["exclusive", "post_wheel_build", "flaky"],
deps = ["//:ray_lib"],
)
py_test_module_list(
files = [
"test_args.py",
@ -168,9 +134,7 @@ py_test_module_list(
py_test_module_list(
files = [
"test_failure_2.py",
"test_failure_3.py",
"test_failure_4.py",
"test_reference_counting_2.py",
"test_object_spilling.py",
],
size = "large",
@ -179,16 +143,78 @@ py_test_module_list(
deps = ["//:ray_lib"],
)
# Flaky tests.
py_test_module_list(
files = [
"test_runtime_env_complicated.py"
],
size = "large",
extra_srcs = SRCS,
tags = ["exclusive", "post_wheel_build", "flaky"],
deps = ["//:ray_lib"],
)
py_test_module_list(
files = [
"test_actor.py",
"test_memstat.py",
],
size = "medium",
extra_srcs = SRCS,
tags = ["exclusive", "medium_size_python_tests_a_to_j", "flaky"],
deps = ["//:ray_lib"],
)
py_test_module_list(
files = [
"test_object_spilling_2.py",
"test_object_manager.py",
"test_multi_tenancy.py",
"test_scheduling.py",
],
size = "medium",
extra_srcs = SRCS,
tags = ["exclusive", "medium_size_python_tests_k_to_z", "flaky"],
deps = ["//:ray_lib"],
)
py_test_module_list(
files = [
"test_failure_3.py",
"test_reference_counting_2.py",
],
size = "large",
extra_srcs = SRCS,
tags = ["exclusive", "flaky"],
deps = ["//:ray_lib"],
)
# Flaky tests only on Mac.
py_test_module_list(
files = [
"test_placement_group.py",
],
size = "large",
extra_srcs = SRCS,
tags = ["exclusive", "flaky-mac"],
deps = ["//:ray_lib"],
)
py_test_module_list(
files = [
"test_runtime_env.py"
],
size = "large",
extra_srcs = SRCS,
tags = ["flaky-mac"],
deps = ["//:ray_lib"],
)
# TODO(barakmich): aws/ might want its own buildfile, or
# py_test_module_list should support subdirectories.
py_test(

View file

@ -55,6 +55,7 @@ def test_distributed_array_assemble(ray_start_2_cpus, reload_modules):
]))
@pytest.mark.skipif(sys.platform == "win32", reason="Failing on Windows.")
@pytest.mark.parametrize(
"ray_start_cluster_2_nodes",
[{

View file

@ -543,6 +543,7 @@ def _all_actors_dead():
for actor in list(ray.state.actors().values()))
@pytest.mark.skipif(sys.platform == "win32", reason="Failing on Windows.")
def test_kill_actor_immediately_after_creation(ray_start_regular):
@ray.remote
class A: