2020-01-23 02:02:58 +01:00
|
|
|
# --------------------------------------------------------------------
|
|
|
|
# BAZEL/Travis-ci test cases.
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# To add new RLlib tests, first find the correct category of your new test
|
|
|
|
# within this file.
|
|
|
|
|
|
|
|
# All new tests - within their category - should be added alphabetically!
|
|
|
|
# Do not just add tests to the bottom of the file.
|
|
|
|
|
|
|
|
# Currently we have the following categories:
|
|
|
|
|
|
|
|
# a) Learning tests/regression, tagged: "learning_tests"
|
|
|
|
# b) Quick agent compilation/tune-train tests, tagged "quick_train"
|
|
|
|
# c-e) Utils, Models, Agents, tagged "utils", "models", and "agents_dir".
|
|
|
|
# f) Tests directory (everything in rllib/tests/...), tagged: "tests_dir"
|
|
|
|
# g) Examples directory (everything in rllib/examples/...), tagged: "examples"
|
2020-01-23 02:02:58 +01:00
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# The "examples" and "tests_dir" tags have further sub-tags going by the
|
|
|
|
# starting letter of the test name (e.g. "examples_A", or "tests_dir_F") for
|
|
|
|
# split-up purposes in travis, which doesn't like tests that run for too long
|
|
|
|
# (problems: 10min timeout, not respecting ray/ci/keep_alive.sh, or even
|
|
|
|
# `travis_wait n`, etc.).
|
2020-01-23 02:02:58 +01:00
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# Our travis.yml file executes all these tests in 6 different jobs, which are:
|
|
|
|
# 1) everything in a) using tf2.x
|
|
|
|
# 2) everything in a) using tf1.x
|
|
|
|
# 3) everything in b) c) d) and e)
|
|
|
|
# 4) everything in g)
|
2020-05-12 08:23:10 +02:00
|
|
|
# 5) f), BUT only those tagged `tests_dir_A` to `tests_dir_L`
|
|
|
|
# 6) f), BUT only those tagged `tests_dir_M` to `tests_dir_Z`
|
2020-02-15 23:50:44 +01:00
|
|
|
|
|
|
|
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
# Agents learning regression tests.
|
|
|
|
#
|
|
|
|
# Tag: learning_tests
|
|
|
|
#
|
|
|
|
# This will test all yaml files (via `rllib train`)
|
2020-05-26 11:10:27 +02:00
|
|
|
# inside rllib/tuned_examples/[algo-name] for actual learning success.
|
2020-02-15 23:50:44 +01:00
|
|
|
# --------------------------------------------------------------------
|
2020-01-23 02:02:58 +01:00
|
|
|
|
2020-05-26 11:10:27 +02:00
|
|
|
# A2C/A3C
|
2020-02-15 23:50:44 +01:00
|
|
|
# A2C CartPole learning regression test (tagged learning_tests_tf).
py_test(
    name = "regression_test_a2c_cartpole_tf",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/a3c"],
    data = ["tuned_examples/a3c/cartpole-a2c.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# A2C CartPole learning regression test, run with the --torch flag.
py_test(
    name = "regression_test_a2c_cartpole_torch",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/a3c", "--torch"],
    data = ["tuned_examples/a3c/cartpole-a2c.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# A3C CartPole learning regression test (tagged learning_tests_tf).
py_test(
    name = "regression_test_a3c_cartpole_tf",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/a3c"],
    data = ["tuned_examples/a3c/cartpole-a3c.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# A3C CartPole learning regression test, run with the --torch flag.
py_test(
    name = "regression_test_a3c_cartpole_torch",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/a3c", "--torch"],
    data = ["tuned_examples/a3c/cartpole-a3c.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch", "learning_tests_cartpole"],
)
|
|
|
|
|
2020-05-26 11:10:27 +02:00
|
|
|
# APPO
|
2020-05-11 20:24:43 -07:00
|
|
|
# APPO CartPole learning regression test (plain and vtrace yamls; tf tag).
py_test(
    name = "run_regression_tests_cartpole_appo_tf",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/ppo"],
    data = [
        "tuned_examples/ppo/cartpole-appo.yaml",
        "tuned_examples/ppo/cartpole-appo-vtrace.yaml",
    ],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# APPO CartPole learning regression test (plain and vtrace yamls; --torch).
py_test(
    name = "run_regression_tests_cartpole_appo_torch",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/ppo", "--torch"],
    data = [
        "tuned_examples/ppo/cartpole-appo.yaml",
        "tuned_examples/ppo/cartpole-appo-vtrace.yaml",
    ],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch", "learning_tests_cartpole"],
)
|
|
|
|
|
2020-05-26 11:10:27 +02:00
|
|
|
# ARS
|
2020-05-11 20:24:43 -07:00
|
|
|
# ARS CartPole learning regression test (tagged learning_tests_tf).
py_test(
    name = "run_regression_tests_cartpole_ars_tf",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/ars"],
    data = ["tuned_examples/ars/cartpole-ars.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# ARS CartPole learning regression test, run with the --torch flag.
py_test(
    name = "run_regression_tests_cartpole_ars_torch",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/ars", "--torch"],
    data = ["tuned_examples/ars/cartpole-ars.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch", "learning_tests_cartpole"],
)
|
|
|
|
|
2020-05-26 11:10:27 +02:00
|
|
|
# DDPG
|
2020-05-11 20:24:43 -07:00
|
|
|
# DDPG Pendulum learning regression test (tagged learning_tests_tf).
# The yaml is listed as an explicit label rather than via glob(): the path
# has no wildcard, and an explicit label makes a missing/renamed file a
# build error instead of a silently empty `data` list.
py_test(
    name = "run_regression_tests_pendulum_ddpg_tf",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/ddpg"],
    data = ["tuned_examples/ddpg/pendulum-ddpg.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf", "learning_tests_pendulum"],
)
|
|
|
|
|
|
|
|
# DDPG Pendulum learning regression test, run with the --torch flag.
# The yaml is listed as an explicit label rather than via glob(): the path
# has no wildcard, and an explicit label makes a missing/renamed file a
# build error instead of a silently empty `data` list.
py_test(
    name = "run_regression_tests_pendulum_ddpg_torch",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--torch", "--yaml-dir=tuned_examples/ddpg"],
    data = ["tuned_examples/ddpg/pendulum-ddpg.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch", "learning_tests_pendulum"],
)
|
|
|
|
|
2020-05-26 11:10:27 +02:00
|
|
|
# DQN/Simple-Q
|
2020-05-11 20:24:43 -07:00
|
|
|
# DQN/Simple-Q CartPole learning regression test (tagged learning_tests_tf).
py_test(
    name = "run_regression_tests_cartpole_dqn_tf",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/dqn"],
    data = [
        "tuned_examples/dqn/cartpole-simpleq.yaml",
        "tuned_examples/dqn/cartpole-dqn.yaml",
        "tuned_examples/dqn/cartpole-dqn-param-noise.yaml",
    ],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# DQN/Simple-Q CartPole learning regression test, run with the --torch flag.
py_test(
    name = "run_regression_tests_cartpole_dqn_torch",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/dqn", "--torch"],
    data = [
        "tuned_examples/dqn/cartpole-simpleq.yaml",
        "tuned_examples/dqn/cartpole-dqn.yaml",
        "tuned_examples/dqn/cartpole-dqn-param-noise.yaml",
    ],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch", "learning_tests_cartpole"],
)
|
|
|
|
|
2020-05-26 11:10:27 +02:00
|
|
|
# ES
|
2020-05-11 20:24:43 -07:00
|
|
|
# ES CartPole learning regression test (tagged learning_tests_tf).
py_test(
    name = "run_regression_tests_cartpole_es_tf",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/es"],
    data = ["tuned_examples/es/cartpole-es.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# ES CartPole learning regression test, run with the --torch flag.
py_test(
    name = "run_regression_tests_cartpole_es_torch",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/es", "--torch"],
    data = ["tuned_examples/es/cartpole-es.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch", "learning_tests_cartpole"],
)
|
|
|
|
|
2020-05-26 11:10:27 +02:00
|
|
|
# IMPALA
|
2020-05-11 20:24:43 -07:00
|
|
|
# IMPALA CartPole learning regression test (tagged learning_tests_tf).
py_test(
    name = "run_regression_tests_cartpole_impala_tf",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/impala"],
    data = ["tuned_examples/impala/cartpole-impala.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# IMPALA CartPole learning regression test, run with the --torch flag.
py_test(
    name = "run_regression_tests_cartpole_impala_torch",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/impala", "--torch"],
    data = ["tuned_examples/impala/cartpole-impala.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# PG
|
|
|
|
# PG CartPole learning regression test (tagged learning_tests_tf).
py_test(
    name = "run_regression_tests_cartpole_pg_tf",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/pg"],
    data = ["tuned_examples/pg/cartpole-pg.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# PG CartPole learning regression test, run with the --torch flag.
py_test(
    name = "run_regression_tests_cartpole_pg_torch",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/pg", "--torch"],
    data = ["tuned_examples/pg/cartpole-pg.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# PPO
|
|
|
|
# PPO CartPole learning regression test (tagged learning_tests_tf).
py_test(
    name = "run_regression_tests_cartpole_ppo_tf",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/ppo"],
    data = ["tuned_examples/ppo/cartpole-ppo.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# PPO CartPole learning regression test, run with the --torch flag.
py_test(
    name = "run_regression_tests_cartpole_ppo_torch",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/ppo", "--torch"],
    data = ["tuned_examples/ppo/cartpole-ppo.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# PPO Pendulum learning regression test (tagged learning_tests_tf).
py_test(
    name = "run_regression_tests_pendulum_ppo_tf",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/ppo"],
    data = ["tuned_examples/ppo/pendulum-ppo.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf", "learning_tests_pendulum"],
)
|
|
|
|
|
|
|
|
# PPO Pendulum learning regression test, run with the --torch flag.
py_test(
    name = "run_regression_tests_pendulum_ppo_torch",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--torch", "--yaml-dir=tuned_examples/ppo"],
    data = ["tuned_examples/ppo/pendulum-ppo.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch", "learning_tests_pendulum"],
)
|
|
|
|
|
2020-06-05 15:40:30 +02:00
|
|
|
# PPO (LSTM) RepeatAfterMe learning regression test (tagged learning_tests_tf).
py_test(
    name = "run_regression_tests_repeat_after_me_tf",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/ppo"],
    data = ["tuned_examples/ppo/repeatafterme-ppo-lstm.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf"],
)
|
|
|
|
|
|
|
|
# PPO (LSTM) RepeatAfterMe learning regression test, run with --torch.
py_test(
    name = "run_regression_tests_repeat_after_me_torch",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--torch", "--yaml-dir=tuned_examples/ppo"],
    data = ["tuned_examples/ppo/repeatafterme-ppo-lstm.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch"],
)
|
|
|
|
|
2020-05-26 11:10:27 +02:00
|
|
|
# SAC
|
|
|
|
# SAC CartPole learning regression test (tagged learning_tests_tf).
py_test(
    name = "run_regression_tests_cartpole_sac_tf",
    size = "medium",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/sac"],
    data = ["tuned_examples/sac/cartpole-sac.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# SAC CartPole learning regression test, run with the --torch flag.
py_test(
    name = "run_regression_tests_cartpole_sac_torch",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/sac", "--torch"],
    data = ["tuned_examples/sac/cartpole-sac.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch", "learning_tests_cartpole"],
)
|
|
|
|
|
|
|
|
# SAC Pendulum learning regression test (tagged learning_tests_tf).
py_test(
    name = "run_regression_tests_pendulum_sac_tf",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/sac"],
    data = ["tuned_examples/sac/pendulum-sac.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf", "learning_tests_pendulum"],
)
|
|
|
|
|
|
|
|
# SAC Pendulum learning regression test, run with the --torch flag.
py_test(
    name = "run_regression_tests_pendulum_sac_torch",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/sac", "--torch"],
    data = ["tuned_examples/sac/pendulum-sac.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch", "learning_tests_pendulum"],
)
|
|
|
|
|
2020-05-26 11:10:27 +02:00
|
|
|
# TD3
|
2020-04-30 15:48:11 +02:00
|
|
|
# TD3 Pendulum learning regression test (yaml lives under tuned_examples/ddpg).
py_test(
    name = "run_regression_tests_pendulum_td3_tf",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/ddpg"],
    data = ["tuned_examples/ddpg/pendulum-td3.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_tf", "learning_tests_pendulum"],
)
|
|
|
|
|
|
|
|
# TD3 Pendulum learning regression test, run with the --torch flag
# (yaml lives under tuned_examples/ddpg).
py_test(
    name = "run_regression_tests_pendulum_td3_torch",
    size = "large",
    srcs = ["tests/run_regression_tests.py"],
    args = ["--yaml-dir=tuned_examples/ddpg", "--torch"],
    data = ["tuned_examples/ddpg/pendulum-td3.yaml"],
    main = "tests/run_regression_tests.py",
    tags = ["learning_tests_torch", "learning_tests_pendulum"],
)
|
|
|
|
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
# Agents (Compilation, Losses, simple agent functionality tests)
|
|
|
|
# rllib/agents/
|
|
|
|
#
|
|
|
|
# Tag: agents_dir
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
|
2020-05-27 16:19:13 +02:00
|
|
|
# A2CTrainer/A3CTrainer
|
2020-03-01 20:53:35 +01:00
|
|
|
# Agent test for A2C (agents/a3c/tests/test_a2c.py).
py_test(
    name = "test_a2c",
    size = "medium",
    srcs = ["agents/a3c/tests/test_a2c.py"],
    tags = ["agents_dir"],
)
|
|
|
|
|
2020-05-27 16:19:13 +02:00
|
|
|
# Agent test for A3C (agents/a3c/tests/test_a3c.py).
py_test(
    name = "test_a3c",
    size = "medium",
    srcs = ["agents/a3c/tests/test_a3c.py"],
    tags = ["agents_dir"],
)
|
|
|
|
|
2020-05-04 09:36:27 +02:00
|
|
|
# APEXTrainer (DQN)
|
|
|
|
# Agent test for APEX-DQN (agents/dqn/tests/test_apex_dqn.py).
py_test(
    name = "test_apex_dqn",
    size = "large",
    srcs = ["agents/dqn/tests/test_apex_dqn.py"],
    tags = ["agents_dir"],
)
|
|
|
|
|
|
|
|
# APEXDDPGTrainer
|
|
|
|
# Agent test for APEX-DDPG (agents/ddpg/tests/test_apex_ddpg.py).
py_test(
    name = "test_apex_ddpg",
    size = "small",
    srcs = ["agents/ddpg/tests/test_apex_ddpg.py"],
    tags = ["agents_dir"],
)
|
|
|
|
|
2020-05-08 16:31:31 +02:00
|
|
|
# ARS
|
|
|
|
# Agent test for ARS (agents/ars/tests/test_ars.py).
py_test(
    name = "test_ars",
    size = "medium",
    srcs = ["agents/ars/tests/test_ars.py"],
    tags = ["agents_dir"],
)
|
|
|
|
|
2020-03-01 20:53:35 +01:00
|
|
|
# DDPGTrainer
|
|
|
|
# Agent test for DDPG (agents/ddpg/tests/test_ddpg.py).
py_test(
    name = "test_ddpg",
    size = "medium",
    srcs = ["agents/ddpg/tests/test_ddpg.py"],
    tags = ["agents_dir"],
)
|
|
|
|
|
2020-04-06 20:56:16 +02:00
|
|
|
# DQNTrainer/SimpleQTrainer
|
2020-02-15 23:50:44 +01:00
|
|
|
# Agent test for DQN (agents/dqn/tests/test_dqn.py).
py_test(
    name = "test_dqn",
    size = "medium",
    srcs = ["agents/dqn/tests/test_dqn.py"],
    tags = ["agents_dir"],
)
|
2020-04-06 20:56:16 +02:00
|
|
|
# Agent test for Simple-Q (agents/dqn/tests/test_simple_q.py).
py_test(
    name = "test_simple_q",
    size = "medium",
    srcs = ["agents/dqn/tests/test_simple_q.py"],
    tags = ["agents_dir"],
)
|
2020-01-23 02:02:58 +01:00
|
|
|
|
2020-06-16 09:01:20 +02:00
|
|
|
# DYNATrainer
|
|
|
|
# Agent test for DYNA (agents/dyna/tests/test_dyna.py).
py_test(
    name = "test_dyna",
    size = "small",
    srcs = ["agents/dyna/tests/test_dyna.py"],
    tags = ["agents_dir"],
)
|
|
|
|
|
2020-05-08 16:31:31 +02:00
|
|
|
# ES
|
2020-02-19 16:07:37 -08:00
|
|
|
# Agent test for ES (agents/es/tests/test_es.py).
py_test(
    name = "test_es",
    size = "medium",
    srcs = ["agents/es/tests/test_es.py"],
    tags = ["agents_dir"],
)
|
2020-05-08 16:31:31 +02:00
|
|
|
|
|
|
|
# IMPALA
|
2020-05-03 13:44:25 +02:00
|
|
|
# Agent test for IMPALA (agents/impala/tests/test_impala.py).
py_test(
    name = "test_impala",
    size = "medium",
    srcs = ["agents/impala/tests/test_impala.py"],
    tags = ["agents_dir"],
)
|
2020-05-08 16:31:31 +02:00
|
|
|
# Agent test for vtrace (agents/impala/tests/test_vtrace.py).
py_test(
    name = "test_vtrace",
    size = "small",
    srcs = ["agents/impala/tests/test_vtrace.py"],
    tags = ["agents_dir"],
)
|
2020-02-19 16:07:37 -08:00
|
|
|
|
2020-04-07 01:38:50 +02:00
|
|
|
# MARWILTrainer
|
|
|
|
# Agent test for MARWIL (agents/marwil/tests/test_marwil.py).
py_test(
    name = "test_marwil",
    size = "small",
    srcs = ["agents/marwil/tests/test_marwil.py"],
    tags = ["agents_dir"],
)
|
|
|
|
|
|
|
|
# MAMLTrainer
|
|
|
|
# Agent test for MAML (agents/maml/tests/test_maml.py).
py_test(
    name = "test_maml",
    size = "small",
    srcs = ["agents/maml/tests/test_maml.py"],
    tags = ["agents_dir"],
)
|
|
|
|
|
2020-01-23 02:02:58 +01:00
|
|
|
# PGTrainer
|
|
|
|
# Agent test for PG (agents/pg/tests/test_pg.py).
py_test(
    name = "test_pg",
    size = "small",
    srcs = ["agents/pg/tests/test_pg.py"],
    tags = ["agents_dir"],
)
|
|
|
|
|
|
|
|
# PPOTrainer
|
|
|
|
# Agent test for PPO; also pulls in agents/ppo/tests/test.py as a source.
py_test(
    name = "test_ppo",
    size = "large",
    srcs = [
        "agents/ppo/tests/test_ppo.py",
        # TODO(sven): Move down once PR 6889 merged
        "agents/ppo/tests/test.py",
    ],
    tags = ["agents_dir"],
)
|
|
|
|
|
2020-04-23 09:11:12 +02:00
|
|
|
# DDPPO
|
|
|
|
# Agent test for DDPPO (agents/ppo/tests/test_ddppo.py).
py_test(
    name = "test_ddppo",
    size = "small",
    srcs = ["agents/ppo/tests/test_ddppo.py"],
    tags = ["agents_dir"],
)
|
|
|
|
|
|
|
|
# APPO
|
|
|
|
# Agent test for APPO (agents/ppo/tests/test_appo.py).
py_test(
    name = "test_appo",
    size = "medium",
    srcs = ["agents/ppo/tests/test_appo.py"],
    tags = ["agents_dir"],
)
|
|
|
|
|
2020-03-06 19:37:12 +01:00
|
|
|
# SAC
|
|
|
|
# Agent test for SAC (agents/sac/tests/test_sac.py).
py_test(
    name = "test_sac",
    size = "large",
    srcs = ["agents/sac/tests/test_sac.py"],
    tags = ["agents_dir"],
)
|
|
|
|
|
2020-03-01 20:53:35 +01:00
|
|
|
# TD3Trainer
|
2020-02-15 23:50:44 +01:00
|
|
|
# Agent test for TD3 (agents/ddpg/tests/test_td3.py).
py_test(
    name = "test_td3",
    size = "medium",
    srcs = ["agents/ddpg/tests/test_td3.py"],
    tags = ["agents_dir"],
)
|
2020-01-23 02:02:58 +01:00
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# --------------------------------------------------------------------
|
|
|
|
# contrib Agents
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
|
|
|
|
# Contrib: runs contrib/random_agent/random_agent.py as a test.
py_test(
    name = "random_agent",
    size = "small",
    srcs = ["contrib/random_agent/random_agent.py"],
    main = "contrib/random_agent/random_agent.py",
    tags = ["agents_dir"],
)
|
|
|
|
|
|
|
|
# Contrib: runs the AlphaZero CartPole example for a single training iteration.
py_test(
    name = "alpha_zero_cartpole",
    size = "large",
    srcs = ["contrib/alpha_zero/examples/train_cartpole.py"],
    args = [
        "--training-iteration=1",
        "--num-workers=2",
        "--ray-num-cpus=3",
    ],
    main = "contrib/alpha_zero/examples/train_cartpole.py",
    tags = ["agents_dir"],
)
|
|
|
|
|
|
|
|
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
# Agents (quick training test iterations via `rllib train`)
|
|
|
|
#
|
|
|
|
# Tag: quick_train
|
|
|
|
#
|
|
|
|
# These are not(!) learning tests; here we only test compilation and
|
|
|
|
# support for certain envs, spaces, setups.
|
|
|
|
# Should all be very short tests with label: "quick_train".
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
|
|
|
|
# A2C/A3C
|
|
|
|
|
|
|
|
# Quick-train: A3C (tf) on CartPole-v1 with an LSTM model, one iteration.
py_test(
    name = "test_a3c_tf_cartpole_v1_lstm",
    srcs = ["train.py"],
    args = [
        "--env", "CartPole-v1",
        "--run", "A3C",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"num_workers\": 2, \"model\": {\"use_lstm\": true}}'",
        "--ray-num-cpus", "4",
    ],
    main = "train.py",
    tags = ["quick_train"],
)
|
|
|
|
|
|
|
|
# Quick-train: A3C (torch) on PongDeterministic-v4, one iteration.
py_test(
    name = "test_a3c_torch_pong_deterministic_v4",
    srcs = ["train.py"],
    args = [
        "--env", "PongDeterministic-v4",
        "--run", "A3C",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"torch\", \"num_workers\": 2, \"sample_async\": false, \"model\": {\"use_lstm\": false, \"grayscale\": true, \"zero_mean\": false, \"dim\": 84}, \"preprocessor_pref\": \"rllib\"}'",
        "--ray-num-cpus", "4",
    ],
    main = "train.py",
    tags = ["quick_train"],
)
|
|
|
|
|
|
|
|
# Quick-train: A3C (tf) on Pong-ram-v4, one iteration.
py_test(
    name = "test_a3c_tf_pong_ram_v4",
    srcs = ["train.py"],
    args = [
        "--env", "Pong-ram-v4",
        "--run", "A3C",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"num_workers\": 2}'",
        "--ray-num-cpus", "4",
    ],
    main = "train.py",
    tags = ["quick_train"],
)
|
|
|
|
|
2020-03-01 20:53:35 +01:00
|
|
|
# DDPG/APEX-DDPG/TD3
|
2020-02-15 23:50:44 +01:00
|
|
|
|
|
|
|
# Quick-train: DDPG (tf) on MountainCarContinuous-v0 with num_workers=0.
py_test(
    name = "test_ddpg_mountaincar_continuous_v0_num_workers_0",
    srcs = ["train.py"],
    args = [
        "--env", "MountainCarContinuous-v0",
        "--run", "DDPG",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"num_workers\": 0}'",
    ],
    main = "train.py",
    tags = ["quick_train"],
)
|
|
|
|
|
|
|
|
# Quick-train: DDPG (tf) on MountainCarContinuous-v0 with num_workers=1.
py_test(
    name = "test_ddpg_mountaincar_continuous_v0_num_workers_1",
    srcs = ["train.py"],
    args = [
        "--env", "MountainCarContinuous-v0",
        "--run", "DDPG",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"num_workers\": 1}'",
    ],
    main = "train.py",
    tags = ["quick_train"],
)
|
|
|
|
|
|
|
|
# Quick-train: APEX_DDPG (tf) on Pendulum-v0 using complete_episodes batches.
py_test(
    name = "test_apex_ddpg_pendulum_v0_complete_episode_batches",
    srcs = ["train.py"],
    args = [
        "--env", "Pendulum-v0",
        "--run", "APEX_DDPG",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"num_workers\": 2, \"optimizer\": {\"num_replay_buffer_shards\": 1}, \"learning_starts\": 100, \"min_iter_time_s\": 1, \"batch_mode\": \"complete_episodes\"}'",
        "--ray-num-cpus", "4",
    ],
    main = "train.py",
    tags = ["quick_train"],
)
|
|
|
|
|
2020-03-01 20:53:35 +01:00
|
|
|
# DQN/APEX
|
2020-01-28 20:07:55 +01:00
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# Quick-train: DQN (tf) on FrozenLake-v0, one iteration.
py_test(
    name = "test_dqn_frozenlake_v0",
    size = "small",
    srcs = ["train.py"],
    args = [
        "--env", "FrozenLake-v0",
        "--run", "DQN",
        "--config", "'{\"framework\": \"tf\"}'",
        "--stop", "'{\"training_iteration\": 1}'",
    ],
    main = "train.py",
    tags = ["quick_train"],
)
|
|
|
|
|
|
|
|
# Quick-train: DQN (tf) on CartPole-v0 with dueling disabled, one iteration.
py_test(
    name = "test_dqn_cartpole_v0_no_dueling",
    size = "small",
    srcs = ["train.py"],
    args = [
        "--env", "CartPole-v0",
        "--run", "DQN",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"lr\": 1e-3, \"exploration_config\": {\"epsilon_timesteps\": 10000, \"final_epsilon\": 0.02}, \"dueling\": false, \"hiddens\": [], \"model\": {\"fcnet_hiddens\": [64], \"fcnet_activation\": \"relu\"}}'",
    ],
    main = "train.py",
    tags = ["quick_train"],
)
|
|
|
|
|
|
|
|
# Quick-train: DQN (tf) on CartPole-v0 with two workers, one iteration.
py_test(
    name = "test_dqn_cartpole_v0",
    srcs = ["train.py"],
    args = [
        "--env", "CartPole-v0",
        "--run", "DQN",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"num_workers\": 2}'",
        "--ray-num-cpus", "4",
    ],
    main = "train.py",
    tags = ["quick_train"],
)
|
|
|
|
|
|
|
|
# Quick-train: DQN (tf) on CartPole-v0 reading offline input from
# tests/data/cartpole_small, with SoftQ exploration.
py_test(
    name = "test_dqn_cartpole_v0_with_offline_input_and_softq",
    size = "small",
    srcs = ["train.py"],
    args = [
        "--env", "CartPole-v0",
        "--run", "DQN",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"input\": \"tests/data/cartpole_small\", \"learning_starts\": 0, \"input_evaluation\": [\"wis\", \"is\"], \"exploration_config\": {\"type\": \"SoftQ\"}}'",
    ],
    # Include the json data file.
    data = glob(["tests/data/cartpole_small/**"]),
    main = "train.py",
    tags = ["quick_train", "external_files"],
)
|
|
|
|
|
|
|
|
# Quick-train: DQN (tf) on PongDeterministic-v4 with prioritized replay.
py_test(
    name = "test_dqn_pong_deterministic_v4",
    srcs = ["train.py"],
    args = [
        "--env", "PongDeterministic-v4",
        "--run", "DQN",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"lr\": 1e-4, \"exploration_config\": {\"epsilon_timesteps\": 200000, \"final_epsilon\": 0.01}, \"buffer_size\": 10000, \"rollout_fragment_length\": 4, \"learning_starts\": 10000, \"target_network_update_freq\": 1000, \"gamma\": 0.99, \"prioritized_replay\": true}'",
    ],
    main = "train.py",
    tags = ["quick_train"],
)
|
|
|
|
|
|
|
|
# ES
|
|
|
|
|
|
|
|
# Quick train check: ES on Pendulum-v0 (tf, 2 workers); stops after 1 training iteration.
py_test(
    name = "test_es_pendulum_v0",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "Pendulum-v0",
        "--run", "ES",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"stepsize\": 0.01, \"episodes_per_batch\": 20, \"train_batch_size\": 100, \"num_workers\": 2}'",
        "--ray-num-cpus", "4",
    ],
)
|
|
|
|
|
|
|
|
# Quick train check: ES on Pong-v0 (tf, 2 workers); stops after 1 training iteration.
py_test(
    name = "test_es_pong_v0",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "Pong-v0",
        "--run", "ES",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"stepsize\": 0.01, \"episodes_per_batch\": 20, \"train_batch_size\": 100, \"num_workers\": 2}'",
        "--ray-num-cpus", "4",
    ],
)
|
|
|
|
|
2020-03-01 20:53:35 +01:00
|
|
|
# IMPALA
|
2020-02-15 23:50:44 +01:00
|
|
|
|
|
|
|
# Quick train check: IMPALA on CartPole-v0 (tf, no GPUs, 2 workers,
# 2 data loader buffers, replay enabled); stops after 1 training iteration.
py_test(
    name = "test_impala_buffers_2",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "CartPole-v0",
        "--run", "IMPALA",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"num_gpus\": 0, \"num_workers\": 2, \"min_iter_time_s\": 1, \"num_data_loader_buffers\": 2, \"replay_buffer_num_slots\": 100, \"replay_proportion\": 1.0}'",
        "--ray-num-cpus", "4",
    ],
)
|
|
|
|
|
|
|
|
# Quick train check: same IMPALA/CartPole-v0 setup with 2 data loader buffers,
# plus an LSTM model; stops after 1 training iteration.
py_test(
    name = "test_impala_cartpole_v0_buffers_2_lstm",
    srcs = ["train.py"],
    main = "train.py",
    tags = ["quick_train"],
    args = [
        "--env", "CartPole-v0",
        "--run", "IMPALA",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"num_gpus\": 0, \"num_workers\": 2, \"min_iter_time_s\": 1, \"num_data_loader_buffers\": 2, \"replay_buffer_num_slots\": 100, \"replay_proportion\": 1.0, \"model\": {\"use_lstm\": true}}'",
        "--ray-num-cpus", "4",
    ],
)
|
|
|
|
|
|
|
|
# Quick train check: IMPALA on PongDeterministic-v4 (tf, no GPUs) with the
# object store memory set to 1000000000.
# NOTE: despite "40k_ts" in the target name, the stop criterion below is
# 30000 total timesteps.
py_test(
    name = "test_impala_pong_deterministic_v4_40k_ts_1G_obj_store",
    size = "medium",
    srcs = ["train.py"],
    main = "train.py",
    tags = ["quick_train"],
    args = [
        "--env", "PongDeterministic-v4",
        "--run", "IMPALA",
        "--stop", "'{\"timesteps_total\": 30000}'",
        "--ray-object-store-memory=1000000000",
        "--config", "'{\"framework\": \"tf\", \"num_workers\": 1, \"num_gpus\": 0, \"num_envs_per_worker\": 32, \"rollout_fragment_length\": 50, \"train_batch_size\": 50, \"learner_queue_size\": 1}'",
    ],
)
|
|
|
|
|
|
|
|
# MARWIL
|
|
|
|
|
|
|
|
# Quick train check: MARWIL on CartPole-v0 (tf) reading offline input from
# tests/data/cartpole_small; stops after 1 training iteration.
py_test(
    name = "test_marwil_cartpole_v0_tf",
    size = "small",
    srcs = ["train.py"],
    main = "train.py",
    # The json data files must be shipped with the test.
    data = glob(["tests/data/cartpole_small/**"]),
    tags = ["quick_train", "external_files"],
    args = [
        "--env", "CartPole-v0",
        "--run", "MARWIL",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"input\": \"tests/data/cartpole_small\", \"learning_starts\": 0, \"input_evaluation\": [\"wis\", \"is\"], \"shuffle_buffer_size\": 10}'",
    ],
)
|
|
|
|
|
|
|
|
# Quick train check: MARWIL on CartPole-v0 (torch) reading offline input from
# tests/data/cartpole_small; stops after 1 training iteration.
py_test(
    name = "test_marwil_cartpole_v0_torch",
    size = "small",
    srcs = ["train.py"],
    main = "train.py",
    # The json data files must be shipped with the test.
    data = glob(["tests/data/cartpole_small/**"]),
    tags = ["quick_train", "external_files"],
    args = [
        "--env", "CartPole-v0",
        "--run", "MARWIL",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"torch\", \"input\": \"tests/data/cartpole_small\", \"learning_starts\": 0, \"input_evaluation\": [\"wis\", \"is\"], \"shuffle_buffer_size\": 10}'",
    ],
)
|
|
|
|
|
|
|
|
# PG
|
|
|
|
|
|
|
|
# Quick train check: PG on FrozenLake-v0 (tf, 1 worker); stops after 1 training iteration.
py_test(
    name = "test_pg_tf_frozenlake_v0",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "FrozenLake-v0",
        "--run", "PG",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"rollout_fragment_length\": 500, \"num_workers\": 1}'",
    ],
)
|
|
|
|
|
|
|
|
# Quick train check: PG on FrozenLake-v0 (torch, 1 worker); stops after 1 training iteration.
py_test(
    name = "test_pg_torch_frozenlake_v0",
    size = "small",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "FrozenLake-v0",
        "--run", "PG",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"torch\", \"rollout_fragment_length\": 500, \"num_workers\": 1}'",
    ],
)
|
|
|
|
|
|
|
|
# Quick train check: PG on CartPole-v0 (tf) with an LSTM model; stops after 1 training iteration.
py_test(
    name = "test_pg_tf_cartpole_v0_lstm",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "CartPole-v0",
        "--run", "PG",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"rollout_fragment_length\": 500, \"num_workers\": 1, \"model\": {\"use_lstm\": true, \"max_seq_len\": 100}}'",
    ],
)
|
|
|
|
|
|
|
|
# Quick train check: PG on CartPole-v0 (tf) with 10 envs per worker;
# stops after 1 training iteration.
py_test(
    name = "test_pg_tf_cartpole_v0_multi_envs_per_worker",
    size = "small",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "CartPole-v0",
        "--run", "PG",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"rollout_fragment_length\": 500, \"num_workers\": 1, \"num_envs_per_worker\": 10}'",
    ],
)
|
|
|
|
|
|
|
|
|
|
|
|
# Quick train check: PG on Pong-v0 (tf, 1 worker); stops after 1 training iteration.
py_test(
    name = "test_pg_tf_pong_v0",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "Pong-v0",
        "--run", "PG",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"rollout_fragment_length\": 500, \"num_workers\": 1}'",
    ],
)
|
|
|
|
|
2020-03-01 20:53:35 +01:00
|
|
|
# PPO/APPO
|
2020-02-15 23:50:44 +01:00
|
|
|
|
|
|
|
# Quick train check: PPO on FrozenLake-v0 (tf, 1 worker); stops after 1 training iteration.
py_test(
    name = "test_ppo_tf_frozenlake_v0",
    size = "small",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "FrozenLake-v0",
        "--run", "PPO",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"num_sgd_iter\": 10, \"sgd_minibatch_size\": 64, \"train_batch_size\": 1000, \"num_workers\": 1}'",
    ],
)
|
|
|
|
|
|
|
|
# Quick train check: PPO on FrozenLake-v0 (torch, 1 worker); stops after 1 training iteration.
py_test(
    name = "test_ppo_torch_frozenlake_v0",
    size = "small",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "FrozenLake-v0",
        "--run", "PPO",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"torch\", \"num_sgd_iter\": 10, \"sgd_minibatch_size\": 64, \"train_batch_size\": 1000, \"num_workers\": 1}'",
    ],
)
|
|
|
|
|
|
|
|
# Quick train check: PPO on CartPole-v1 (tf) with simple_optimizer and an LSTM model;
# stops after 1 training iteration.
py_test(
    name = "test_ppo_tf_cartpole_v1_lstm_simple_optimizer",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "CartPole-v1",
        "--run", "PPO",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"simple_optimizer\": true, \"num_sgd_iter\": 2, \"model\": {\"use_lstm\": true}}'",
        "--ray-num-cpus", "4",
    ],
)
|
|
|
|
|
|
|
|
# Quick train check: PPO on CartPole-v1 (tf) with batch_mode "complete_episodes"
# and use_gae disabled; stops after 1 training iteration.
py_test(
    name = "test_ppo_tf_cartpole_v1_complete_episode_batches",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "CartPole-v1",
        "--run", "PPO",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"kl_coeff\": 1.0, \"num_sgd_iter\": 10, \"lr\": 1e-4, \"sgd_minibatch_size\": 64, \"train_batch_size\": 2000, \"num_workers\": 1, \"use_gae\": false, \"batch_mode\": \"complete_episodes\"}'",
    ],
)
|
|
|
|
|
|
|
|
# Quick train check: PPO on CartPole-v1 (tf) with remote worker envs and
# remote_env_batch_wait_ms set to 99999999; stops after 1 training iteration.
py_test(
    name = "test_ppo_tf_cartpole_v1_remote_worker_envs",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "CartPole-v1",
        "--run", "PPO",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"remote_worker_envs\": true, \"remote_env_batch_wait_ms\": 99999999, \"num_envs_per_worker\": 2, \"num_workers\": 1, \"train_batch_size\": 100, \"sgd_minibatch_size\": 50}'",
    ],
)
|
|
|
|
|
|
|
|
# Quick train check: PPO on CartPole-v1 (tf) with remote worker envs and no
# explicit remote_env_batch_wait_ms; stops after 2 training iterations.
py_test(
    name = "test_ppo_tf_cartpole_v1_remote_worker_envs_b",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "CartPole-v1",
        "--run", "PPO",
        "--stop", "'{\"training_iteration\": 2}'",
        "--config", "'{\"framework\": \"tf\", \"remote_worker_envs\": true, \"num_envs_per_worker\": 2, \"num_workers\": 1, \"train_batch_size\": 100, \"sgd_minibatch_size\": 50}'",
    ],
)
|
|
|
|
|
|
|
|
# Quick train check: APPO on Pendulum-v0 (tf, 2 workers, no GPUs);
# stops after 1 training iteration.
py_test(
    name = "test_appo_tf_pendulum_v0_no_gpus",
    main = "train.py",
    srcs = ["train.py"],
    tags = ["quick_train"],
    args = [
        "--env", "Pendulum-v0",
        "--run", "APPO",
        "--stop", "'{\"training_iteration\": 1}'",
        "--config", "'{\"framework\": \"tf\", \"num_workers\": 2, \"num_gpus\": 0}'",
        "--ray-num-cpus", "4",
    ],
)
|
|
|
|
|
2020-05-30 22:48:34 +02:00
|
|
|
# --------------------------------------------------------------------
|
|
|
|
# Env tests
|
|
|
|
# rllib/env/
|
|
|
|
#
|
|
|
|
# Tag: env
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
|
|
|
|
# Shell test env/tests/test_local_inference.sh; ships the examples/serving/*.py scripts as data.
sh_test(
    name = "env/tests/test_local_inference",
    size = "medium",
    srcs = ["env/tests/test_local_inference.sh"],
    data = glob(["examples/serving/*.py"]),
    tags = ["env"],
)
|
|
|
|
|
|
|
|
# Shell test env/tests/test_remote_inference.sh; ships the examples/serving/*.py scripts as data.
sh_test(
    name = "env/tests/test_remote_inference",
    size = "medium",
    srcs = ["env/tests/test_remote_inference.sh"],
    data = glob(["examples/serving/*.py"]),
    tags = ["env"],
)
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# --------------------------------------------------------------------
|
|
|
|
# Models and Distributions
|
|
|
|
# rllib/models/
|
|
|
|
#
|
|
|
|
# Tag: models
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
|
|
|
|
# Runs models/tests/test_distributions.py (tag: models).
py_test(
    name = "test_distributions",
    size = "medium",
    srcs = ["models/tests/test_distributions.py"],
    tags = ["models"],
)
|
|
|
|
|
2020-03-12 04:39:47 +01:00
|
|
|
# --------------------------------------------------------------------
|
|
|
|
# Optimizers and Memories
|
2020-05-21 10:16:18 -07:00
|
|
|
# rllib/execution/
|
2020-03-12 04:39:47 +01:00
|
|
|
#
|
|
|
|
# Tag: optimizers
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
|
2020-03-13 09:03:07 +01:00
|
|
|
# Runs execution/tests/test_segment_tree.py (tag: optimizers).
py_test(
    name = "test_segment_tree",
    size = "small",
    srcs = ["execution/tests/test_segment_tree.py"],
    tags = ["optimizers"],
)
|
2020-03-12 04:39:47 +01:00
|
|
|
|
2020-03-13 09:03:07 +01:00
|
|
|
# Runs execution/tests/test_prioritized_replay_buffer.py (tag: optimizers).
py_test(
    name = "test_prioritized_replay_buffer",
    size = "small",
    srcs = ["execution/tests/test_prioritized_replay_buffer.py"],
    tags = ["optimizers"],
)
|
2020-03-12 04:39:47 +01:00
|
|
|
|
2020-02-22 23:19:49 +01:00
|
|
|
# --------------------------------------------------------------------
|
|
|
|
# Policies
|
|
|
|
# rllib/policy/
|
|
|
|
#
|
|
|
|
# Tag: policy
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
|
|
|
|
# Runs policy/tests/test_compute_log_likelihoods.py (tag: policy).
py_test(
    name = "policy/tests/test_compute_log_likelihoods",
    size = "medium",
    srcs = ["policy/tests/test_compute_log_likelihoods.py"],
    tags = ["policy"],
)
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# --------------------------------------------------------------------
|
|
|
|
# Utils:
|
|
|
|
# rllib/utils/
|
|
|
|
#
|
|
|
|
# Tag: utils
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
|
|
|
|
# Runs utils/exploration/tests/test_explorations.py (tag: utils).
py_test(
    name = "test_explorations",
    size = "large",
    srcs = ["utils/exploration/tests/test_explorations.py"],
    tags = ["utils"],
)
|
|
|
|
|
2020-04-09 23:04:21 +02:00
|
|
|
# Runs utils/exploration/tests/test_parameter_noise.py (tag: utils).
py_test(
    name = "test_parameter_noise",
    size = "small",
    srcs = ["utils/exploration/tests/test_parameter_noise.py"],
    tags = ["utils"],
)
|
|
|
|
|
2020-01-28 20:07:55 +01:00
|
|
|
# Schedules
|
|
|
|
# Runs utils/schedules/tests/test_schedules.py (tag: utils).
py_test(
    name = "test_schedules",
    size = "small",
    srcs = ["utils/schedules/tests/test_schedules.py"],
    tags = ["utils"],
)
|
2020-02-14 06:30:44 +00:00
|
|
|
|
2020-03-12 04:39:47 +01:00
|
|
|
# Runs utils/tests/test_framework_agnostic_components.py (tag: utils);
# everything under utils/tests/ is shipped as data.
py_test(
    name = "test_framework_agnostic_components",
    size = "small",
    srcs = ["utils/tests/test_framework_agnostic_components.py"],
    data = glob(["utils/tests/**"]),
    tags = ["utils"],
)
|
|
|
|
|
2020-02-14 06:30:44 +00:00
|
|
|
# TaskPool
|
|
|
|
# Runs utils/tests/test_taskpool.py (tag: utils).
py_test(
    name = "test_taskpool",
    size = "small",
    srcs = ["utils/tests/test_taskpool.py"],
    tags = ["utils"],
)
|
2020-02-15 23:50:44 +01:00
|
|
|
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
# rllib/tests/ directory
|
|
|
|
#
|
|
|
|
# Tag: tests_dir, tests_dir_[A-Z]
|
|
|
|
#
|
|
|
|
# NOTE: Add tests alphabetically into this list and make sure to tag
|
|
|
|
# it correctly by its starting letter, e.g. tags=["tests_dir", "tests_dir_A"]
|
|
|
|
# for `tests/test_all_stuff.py`.
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
|
2020-05-27 10:19:47 +02:00
|
|
|
# Runs tests/test_attention_net_learning.py (sub-tag: tests_dir_A).
py_test(
    name = "tests/test_attention_net_learning",
    size = "large",
    srcs = ["tests/test_attention_net_learning.py"],
    tags = ["tests_dir", "tests_dir_A"],
)
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# Runs tests/test_avail_actions_qmix.py (sub-tag: tests_dir_A).
py_test(
    name = "tests/test_avail_actions_qmix",
    size = "medium",
    srcs = ["tests/test_avail_actions_qmix.py"],
    tags = ["tests_dir", "tests_dir_A"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_catalog.py (sub-tag: tests_dir_C).
py_test(
    name = "tests/test_catalog",
    size = "small",
    srcs = ["tests/test_catalog.py"],
    tags = ["tests_dir", "tests_dir_C"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_checkpoint_restore.py (sub-tag: tests_dir_C).
py_test(
    name = "tests/test_checkpoint_restore",
    size = "enormous",
    srcs = ["tests/test_checkpoint_restore.py"],
    tags = ["tests_dir", "tests_dir_C"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_dependency.py (sub-tag: tests_dir_D).
py_test(
    name = "tests/test_dependency",
    size = "small",
    srcs = ["tests/test_dependency.py"],
    tags = ["tests_dir", "tests_dir_D"],
)
|
|
|
|
|
2020-04-07 18:07:39 -07:00
|
|
|
# Runs tests/test_dependency_torch.py (sub-tag: tests_dir_D).
py_test(
    name = "tests/test_dependency_torch",
    size = "small",
    srcs = ["tests/test_dependency_torch.py"],
    tags = ["tests_dir", "tests_dir_D"],
)
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# Runs tests/test_eager_support.py (sub-tag: tests_dir_E).
py_test(
    name = "tests/test_eager_support",
    size = "enormous",
    srcs = ["tests/test_eager_support.py"],
    tags = ["tests_dir", "tests_dir_E"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_env_with_subprocess.py (sub-tag: tests_dir_E). The target name
# has no "tests/" prefix, so `main` is given explicitly.
py_test(
    name = "test_env_with_subprocess",
    size = "small",
    srcs = ["tests/test_env_with_subprocess.py"],
    main = "tests/test_env_with_subprocess.py",
    tags = ["tests_dir", "tests_dir_E"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_evaluators.py (sub-tag: tests_dir_E).
py_test(
    name = "tests/test_evaluators",
    size = "medium",
    srcs = ["tests/test_evaluators.py"],
    tags = ["tests_dir", "tests_dir_E"],
)
|
|
|
|
|
2020-06-05 08:34:21 +02:00
|
|
|
# Runs tests/test_exec_api.py (sub-tag: tests_dir_E).
py_test(
    name = "tests/test_exec_api",
    size = "medium",
    srcs = ["tests/test_exec_api.py"],
    tags = ["tests_dir", "tests_dir_E"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_execution.py (sub-tag: tests_dir_E).
py_test(
    name = "tests/test_execution",
    size = "medium",
    srcs = ["tests/test_execution.py"],
    tags = ["tests_dir", "tests_dir_E"],
)
|
|
|
|
|
2020-05-27 16:19:13 +02:00
|
|
|
# Runs tests/test_export.py (sub-tag: tests_dir_E).
py_test(
    name = "tests/test_export",
    size = "medium",
    srcs = ["tests/test_export.py"],
    tags = ["tests_dir", "tests_dir_E"],
)
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# Runs tests/test_external_env.py (sub-tag: tests_dir_E).
py_test(
    name = "tests/test_external_env",
    size = "large",
    srcs = ["tests/test_external_env.py"],
    tags = ["tests_dir", "tests_dir_E"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_external_multi_agent_env.py (sub-tag: tests_dir_E).
py_test(
    name = "tests/test_external_multi_agent_env",
    size = "medium",
    srcs = ["tests/test_external_multi_agent_env.py"],
    tags = ["tests_dir", "tests_dir_E"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_filters.py (sub-tag: tests_dir_F).
py_test(
    name = "tests/test_filters",
    size = "small",
    srcs = ["tests/test_filters.py"],
    tags = ["tests_dir", "tests_dir_F"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_ignore_worker_failure.py (sub-tag: tests_dir_I).
py_test(
    name = "tests/test_ignore_worker_failure",
    size = "large",
    srcs = ["tests/test_ignore_worker_failure.py"],
    tags = ["tests_dir", "tests_dir_I"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_io.py (sub-tag: tests_dir_I).
py_test(
    name = "tests/test_io",
    size = "medium",
    srcs = ["tests/test_io.py"],
    tags = ["tests_dir", "tests_dir_I"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_local.py (sub-tag: tests_dir_L).
py_test(
    name = "tests/test_local",
    size = "medium",
    srcs = ["tests/test_local.py"],
    tags = ["tests_dir", "tests_dir_L"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_lstm.py (sub-tag: tests_dir_L).
py_test(
    name = "tests/test_lstm",
    size = "medium",
    srcs = ["tests/test_lstm.py"],
    tags = ["tests_dir", "tests_dir_L"],
)
|
|
|
|
|
2020-03-23 20:19:30 +01:00
|
|
|
# Runs tests/test_model_imports.py (sub-tag: tests_dir_M, extra tag: model_imports);
# everything under tests/data/model_weights/ is shipped as data.
py_test(
    name = "tests/test_model_imports",
    size = "small",
    srcs = ["tests/test_model_imports.py"],
    data = glob(["tests/data/model_weights/**"]),
    tags = ["tests_dir", "tests_dir_M", "model_imports"],
)
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# Runs tests/test_multi_agent_env.py (sub-tag: tests_dir_M).
py_test(
    name = "tests/test_multi_agent_env",
    size = "medium",
    srcs = ["tests/test_multi_agent_env.py"],
    tags = ["tests_dir", "tests_dir_M"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_multi_agent_pendulum.py (sub-tag: tests_dir_M).
py_test(
    name = "tests/test_multi_agent_pendulum",
    size = "large",
    srcs = ["tests/test_multi_agent_pendulum.py"],
    tags = ["tests_dir", "tests_dir_M"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_nested_observation_spaces.py (sub-tag: tests_dir_N).
py_test(
    name = "tests/test_nested_observation_spaces",
    size = "small",
    srcs = ["tests/test_nested_observation_spaces.py"],
    main = "tests/test_nested_observation_spaces.py",
    tags = ["tests_dir", "tests_dir_N"],
)
|
|
|
|
|
|
|
|
# Runs tests/test_reproducibility.py (sub-tag: tests_dir_R).
py_test(
    name = "tests/test_reproducibility",
    size = "medium",
    srcs = ["tests/test_reproducibility.py"],
    tags = ["tests_dir", "tests_dir_R"],
)
|
|
|
|
|
2020-03-12 19:02:51 +01:00
|
|
|
# Runs tests/test_rollout.py (sub-tag: tests_dir_R); train.py and rollout.py are
# shipped as data. The target name has no "tests/" prefix, so `main` is given explicitly.
py_test(
    name = "test_rollout",
    size = "large",
    srcs = ["tests/test_rollout.py"],
    main = "tests/test_rollout.py",
    data = ["train.py", "rollout.py"],
    tags = ["tests_dir", "tests_dir_R"],
)
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# Runs tests/test_rollout_worker.py (sub-tag: tests_dir_R).
py_test(
    name = "tests/test_rollout_worker",
    size = "medium",
    srcs = ["tests/test_rollout_worker.py"],
    tags = ["tests_dir", "tests_dir_R"],
)
|
|
|
|
|
2020-05-27 16:19:13 +02:00
|
|
|
# Runs tests/test_supported_multi_agent.py (sub-tag: tests_dir_S).
py_test(
    name = "tests/test_supported_multi_agent",
    size = "large",
    srcs = ["tests/test_supported_multi_agent.py"],
    tags = ["tests_dir", "tests_dir_S"],
)
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# Runs tests/test_supported_spaces.py (sub-tag: tests_dir_S).
py_test(
    name = "tests/test_supported_spaces",
    size = "enormous",
    srcs = ["tests/test_supported_spaces.py"],
    tags = ["tests_dir", "tests_dir_S"],
)
|
|
|
|
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
# examples/ directory
|
|
|
|
#
|
|
|
|
# Tag: examples, examples_[A-Z]
|
|
|
|
#
|
|
|
|
# NOTE: Add tests alphabetically into this list and make sure to tag
|
|
|
|
# it correctly by its starting letter, e.g. tags=["examples", "examples_A"]
|
|
|
|
# for `examples/all_stuff.py`.
|
|
|
|
# --------------------------------------------------------------------
|
|
|
|
|
|
|
|
|
2020-05-18 17:26:40 +02:00
|
|
|
# Runs examples/attention_net.py as a test with a stop reward of 80.
py_test(
    name = "examples/attention_net_tf",
    size = "large",
    srcs = ["examples/attention_net.py"],
    main = "examples/attention_net.py",
    tags = ["examples", "examples_A"],
    args = [
        "--as-test",
        "--stop-reward=80",
    ],
)
|
|
|
|
|
|
|
|
# TODO(sven): GTrXL PyTorch.
|
|
|
|
# py_test(
|
|
|
|
# name = "examples/attention_net_torch",
|
|
|
|
# main = "examples/attention_net.py",
|
|
|
|
# tags = ["examples", "examples_A"],
|
|
|
|
# size = "large",
|
|
|
|
# srcs = ["examples/attention_net.py"],
|
|
|
|
# args = ["--as-test", "--torch", "--stop-reward=90"]
|
|
|
|
# )
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# Runs examples/autoregressive_action_dist.py as a test (no --torch flag), stop reward 150.
py_test(
    name = "examples/autoregressive_action_dist_tf",
    size = "medium",
    srcs = ["examples/autoregressive_action_dist.py"],
    main = "examples/autoregressive_action_dist.py",
    tags = ["examples", "examples_A"],
    args = [
        "--as-test",
        "--stop-reward=150",
        "--num-cpus=4",
    ],
)
|
|
|
|
|
|
|
|
# Runs examples/autoregressive_action_dist.py as a test with --torch, stop reward 150.
py_test(
    name = "examples/autoregressive_action_dist_torch",
    size = "medium",
    srcs = ["examples/autoregressive_action_dist.py"],
    main = "examples/autoregressive_action_dist.py",
    tags = ["examples", "examples_A"],
    args = [
        "--as-test",
        "--torch",
        "--stop-reward=150",
        "--num-cpus=4",
    ],
)
|
|
|
|
|
|
|
|
# Runs examples/batch_norm_model.py as a test with PPO (no --torch flag), stop reward 80.
py_test(
    name = "examples/batch_norm_model_ppo_tf",
    size = "medium",
    srcs = ["examples/batch_norm_model.py"],
    main = "examples/batch_norm_model.py",
    tags = ["examples", "examples_B"],
    args = [
        "--as-test",
        "--run=PPO",
        "--stop-reward=80",
    ],
)
|
|
|
|
|
|
|
|
# Runs examples/batch_norm_model.py as a test with PPO and --torch, stop reward 80.
py_test(
    name = "examples/batch_norm_model_ppo_torch",
    size = "medium",
    srcs = ["examples/batch_norm_model.py"],
    main = "examples/batch_norm_model.py",
    tags = ["examples", "examples_B"],
    args = [
        "--as-test",
        "--torch",
        "--run=PPO",
        "--stop-reward=80",
    ],
)
|
|
|
|
|
|
|
|
# Runs examples/batch_norm_model.py as a test with DQN (no --torch flag), stop reward 70.
py_test(
    name = "examples/batch_norm_model_dqn_tf",
    size = "large",  # DQN learns much slower with BatchNorm.
    srcs = ["examples/batch_norm_model.py"],
    main = "examples/batch_norm_model.py",
    tags = ["examples", "examples_B"],
    args = [
        "--as-test",
        "--run=DQN",
        "--stop-reward=70",
    ],
)
|
|
|
|
|
|
|
|
# Runs examples/batch_norm_model.py as a test with DQN and --torch, stop reward 70.
py_test(
    name = "examples/batch_norm_model_dqn_torch",
    size = "large",  # DQN learns much slower with BatchNorm.
    srcs = ["examples/batch_norm_model.py"],
    main = "examples/batch_norm_model.py",
    tags = ["examples", "examples_B"],
    args = [
        "--as-test",
        "--torch",
        "--run=DQN",
        "--stop-reward=70",
    ],
)
|
|
|
|
|
|
|
|
# Runs examples/batch_norm_model.py with DDPG (no --torch flag) for a single iteration;
# no --as-test flag is passed.
py_test(
    name = "examples/batch_norm_model_ddpg_tf",
    size = "small",
    srcs = ["examples/batch_norm_model.py"],
    main = "examples/batch_norm_model.py",
    tags = ["examples", "examples_B"],
    args = [
        "--run=DDPG",
        "--stop-iters=1",
    ],
)
|
|
|
|
|
|
|
|
# Runs examples/batch_norm_model.py with DDPG and --torch for a single iteration;
# no --as-test flag is passed.
py_test(
    name = "examples/batch_norm_model_ddpg_torch",
    size = "small",
    srcs = ["examples/batch_norm_model.py"],
    main = "examples/batch_norm_model.py",
    tags = ["examples", "examples_B"],
    args = [
        "--torch",
        "--run=DDPG",
        "--stop-iters=1",
    ],
)
|
|
|
|
|
|
|
|
# Runs examples/cartpole_lstm.py as a test with IMPALA (no --torch flag), stop reward 40.
py_test(
    name = "examples/cartpole_lstm_impala_tf",
    size = "large",
    srcs = ["examples/cartpole_lstm.py"],
    main = "examples/cartpole_lstm.py",
    tags = ["examples", "examples_C"],
    args = [
        "--as-test",
        "--run=IMPALA",
        "--stop-reward=40",
        "--num-cpus=4",
    ],
)
|
|
|
|
|
|
|
|
# Runs examples/cartpole_lstm.py as a test with IMPALA and --torch, stop reward 40.
py_test(
    name = "examples/cartpole_lstm_impala_torch",
    size = "large",
    srcs = ["examples/cartpole_lstm.py"],
    main = "examples/cartpole_lstm.py",
    tags = ["examples", "examples_C"],
    args = [
        "--as-test",
        "--torch",
        "--run=IMPALA",
        "--stop-reward=40",
        "--num-cpus=4",
    ],
)
|
|
|
|
|
|
|
|
# Runs examples/cartpole_lstm.py as a test with PPO (no --torch flag), stop reward 40.
py_test(
    name = "examples/cartpole_lstm_ppo_tf",
    size = "large",
    srcs = ["examples/cartpole_lstm.py"],
    main = "examples/cartpole_lstm.py",
    tags = ["examples", "examples_C"],
    args = [
        "--as-test",
        "--run=PPO",
        "--stop-reward=40",
        "--num-cpus=4",
    ],
)
|
|
|
|
|
|
|
|
# Runs examples/cartpole_lstm.py as a test with PPO and --torch, stop reward 40.
py_test(
    name = "examples/cartpole_lstm_ppo_torch",
    size = "large",
    srcs = ["examples/cartpole_lstm.py"],
    main = "examples/cartpole_lstm.py",
    tags = ["examples", "examples_C"],
    args = [
        "--as-test",
        "--torch",
        "--run=PPO",
        "--stop-reward=40",
        "--num-cpus=4",
    ],
)
|
|
|
|
|
|
|
|
# Runs examples/cartpole_lstm.py as a test with PPO (no --torch flag) and
# --use-prev-action-reward, stop reward 40.
py_test(
    name = "examples/cartpole_lstm_ppo_tf_with_prev_a_and_r",
    size = "large",
    srcs = ["examples/cartpole_lstm.py"],
    main = "examples/cartpole_lstm.py",
    tags = ["examples", "examples_C"],
    args = [
        "--as-test",
        "--run=PPO",
        "--stop-reward=40",
        "--use-prev-action-reward",
        "--num-cpus=4",
    ],
)
|
|
|
|
|
|
|
|
# Runs examples/centralized_critic.py as a test (no --torch flag), stop reward 7.2.
py_test(
    name = "examples/centralized_critic_tf",
    size = "large",
    srcs = ["examples/centralized_critic.py"],
    main = "examples/centralized_critic.py",
    tags = ["examples", "examples_C"],
    args = [
        "--as-test",
        "--stop-reward=7.2",
    ],
)
|
|
|
|
|
|
|
|
# Runs examples/centralized_critic.py as a test with --torch, stop reward 7.2.
py_test(
    name = "examples/centralized_critic_torch",
    size = "large",
    srcs = ["examples/centralized_critic.py"],
    main = "examples/centralized_critic.py",
    tags = ["examples", "examples_C"],
    args = [
        "--as-test",
        "--torch",
        "--stop-reward=7.2",
    ],
)
|
|
|
|
|
|
|
|
# centralized_critic_2.py example; --torch is not passed.
py_test(
    name = "examples/centralized_critic_2_tf",
    size = "medium",
    main = "examples/centralized_critic_2.py",
    srcs = ["examples/centralized_critic_2.py"],
    args = ["--as-test", "--stop-reward=6.0"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# centralized_critic_2.py example with --torch.
py_test(
    name = "examples/centralized_critic_2_torch",
    size = "medium",
    main = "examples/centralized_critic_2.py",
    srcs = ["examples/centralized_critic_2.py"],
    args = ["--as-test", "--torch", "--stop-reward=6.0"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# custom_env.py example; --torch is not passed.
py_test(
    name = "examples/custom_env_tf",
    size = "medium",
    main = "examples/custom_env.py",
    srcs = ["examples/custom_env.py"],
    args = ["--as-test"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# custom_env.py example with --torch.
py_test(
    name = "examples/custom_env_torch",
    size = "medium",
    main = "examples/custom_env.py",
    srcs = ["examples/custom_env.py"],
    args = ["--as-test", "--torch"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# custom_eval.py example; --torch is not passed.
py_test(
    name = "examples/custom_eval_tf",
    size = "small",
    main = "examples/custom_eval.py",
    srcs = ["examples/custom_eval.py"],
    args = ["--num-cpus=4"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# custom_eval.py example with --torch.
py_test(
    name = "examples/custom_eval_torch",
    size = "small",
    main = "examples/custom_eval.py",
    srcs = ["examples/custom_eval.py"],
    args = ["--torch", "--num-cpus=4"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# custom_fast_model.py example, one iteration; --torch is not passed.
py_test(
    name = "examples/custom_fast_model_tf",
    size = "small",
    main = "examples/custom_fast_model.py",
    srcs = ["examples/custom_fast_model.py"],
    args = ["--stop-iters=1", "--num-cpus=4"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# custom_fast_model.py example, one iteration, with --torch.
py_test(
    name = "examples/custom_fast_model_torch",
    size = "small",
    main = "examples/custom_fast_model.py",
    srcs = ["examples/custom_fast_model.py"],
    args = ["--torch", "--stop-iters=1", "--num-cpus=4"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
2020-06-06 03:22:19 -07:00
|
|
|
# complex_struct_space.py example with --framework=tf.
py_test(
    name = "examples/complex_struct_space_tf",
    size = "medium",
    main = "examples/complex_struct_space.py",
    srcs = ["examples/complex_struct_space.py"],
    args = ["--framework=tf"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# complex_struct_space.py example with --framework=tfe.
py_test(
    name = "examples/complex_struct_space_tf_eager",
    size = "medium",
    main = "examples/complex_struct_space.py",
    srcs = ["examples/complex_struct_space.py"],
    args = ["--framework=tfe"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# complex_struct_space.py example with --framework=torch.
py_test(
    name = "examples/complex_struct_space_torch",
    size = "medium",
    main = "examples/complex_struct_space.py",
    srcs = ["examples/complex_struct_space.py"],
    args = ["--framework=torch"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
2020-05-12 08:23:10 +02:00
|
|
|
# custom_keras_model.py example with --run=A2C.
py_test(
    name = "examples/custom_keras_model_a2c",
    size = "large",
    main = "examples/custom_keras_model.py",
    srcs = ["examples/custom_keras_model.py"],
    args = ["--run=A2C", "--stop=50", "--num-cpus=4"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# custom_keras_model.py example with --run=DQN.
py_test(
    name = "examples/custom_keras_model_dqn",
    size = "medium",
    main = "examples/custom_keras_model.py",
    srcs = ["examples/custom_keras_model.py"],
    args = ["--run=DQN", "--stop=50"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# custom_keras_model.py example with --run=PPO.
py_test(
    name = "examples/custom_keras_model_ppo",
    size = "medium",
    main = "examples/custom_keras_model.py",
    srcs = ["examples/custom_keras_model.py"],
    args = ["--run=PPO", "--stop=50", "--num-cpus=4"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# custom_loss.py example, two iterations; --torch is not passed.
py_test(
    name = "examples/custom_loss_tf",
    size = "small",
    main = "examples/custom_loss.py",
    srcs = ["examples/custom_loss.py"],
    # Bundle the JSON sample data that --input-files points at.
    data = glob(["tests/data/cartpole_small/**"]),
    args = ["--stop-iters=2", "--input-files=tests/data/cartpole_small"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# custom_loss.py example, two iterations, with --torch.
py_test(
    name = "examples/custom_loss_torch",
    size = "small",
    main = "examples/custom_loss.py",
    srcs = ["examples/custom_loss.py"],
    # Bundle the JSON sample data that --input-files points at.
    data = glob(["tests/data/cartpole_small/**"]),
    args = [
        "--torch",
        "--stop-iters=2",
        "--input-files=tests/data/cartpole_small",
    ],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# custom_metrics_and_callbacks.py example, two iterations.
py_test(
    name = "examples/custom_metrics_and_callbacks",
    size = "small",
    main = "examples/custom_metrics_and_callbacks.py",
    srcs = ["examples/custom_metrics_and_callbacks.py"],
    args = ["--stop-iters=2"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
2020-04-17 02:06:42 +03:00
|
|
|
# custom_metrics_and_callbacks_legacy.py example, two iterations.
py_test(
    name = "examples/custom_metrics_and_callbacks_legacy",
    size = "small",
    main = "examples/custom_metrics_and_callbacks_legacy.py",
    srcs = ["examples/custom_metrics_and_callbacks_legacy.py"],
    args = ["--stop-iters=2"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# custom_rnn_model.py example on --env=RepeatAfterMeEnv with PPO;
# --torch is not passed.
py_test(
    name = "examples/custom_rnn_model_repeat_after_me_tf",
    size = "medium",
    main = "examples/custom_rnn_model.py",
    srcs = ["examples/custom_rnn_model.py"],
    args = [
        "--as-test",
        "--run=PPO",
        "--stop-reward=40",
        "--env=RepeatAfterMeEnv",
        "--num-cpus=4",
    ],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# custom_rnn_model.py example on --env=RepeatInitialObsEnv with PPO;
# --torch is not passed.
py_test(
    name = "examples/custom_rnn_model_repeat_initial_obs_tf",
    size = "medium",
    main = "examples/custom_rnn_model.py",
    srcs = ["examples/custom_rnn_model.py"],
    args = [
        "--as-test",
        "--run=PPO",
        "--stop-reward=10",
        "--stop-timesteps=300000",
        "--env=RepeatInitialObsEnv",
        "--num-cpus=4",
    ],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
2020-04-01 07:00:28 +02:00
|
|
|
# custom_rnn_model.py example on --env=RepeatAfterMeEnv with PPO and --torch.
py_test(
    name = "examples/custom_rnn_model_repeat_after_me_torch",
    size = "medium",
    main = "examples/custom_rnn_model.py",
    srcs = ["examples/custom_rnn_model.py"],
    args = [
        "--as-test",
        "--torch",
        "--run=PPO",
        "--stop-reward=40",
        "--env=RepeatAfterMeEnv",
        "--num-cpus=4",
    ],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# custom_rnn_model.py example on --env=RepeatInitialObsEnv with PPO and
# --torch.
py_test(
    name = "examples/custom_rnn_model_repeat_initial_obs_torch",
    size = "medium",
    main = "examples/custom_rnn_model.py",
    srcs = ["examples/custom_rnn_model.py"],
    args = [
        "--as-test",
        "--torch",
        "--run=PPO",
        "--stop-reward=10",
        "--stop-timesteps=300000",
        "--env=RepeatInitialObsEnv",
        "--num-cpus=4",
    ],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# custom_tf_policy.py example, two iterations (no explicit `main`).
py_test(
    name = "examples/custom_tf_policy",
    size = "medium",
    srcs = ["examples/custom_tf_policy.py"],
    args = ["--stop-iters=2", "--num-cpus=4"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# custom_torch_policy.py example, two iterations (no explicit `main`).
py_test(
    name = "examples/custom_torch_policy",
    size = "small",
    srcs = ["examples/custom_torch_policy.py"],
    args = ["--stop-iters=2", "--num-cpus=4"],
    tags = ["examples", "examples_C"],
)
|
|
|
|
|
|
|
|
# eager_execution.py example, two iterations (no explicit `main`).
py_test(
    name = "examples/eager_execution",
    size = "small",
    srcs = ["examples/eager_execution.py"],
    args = ["--stop-iters=2"],
    tags = ["examples", "examples_E"],
)
|
|
|
|
|
2020-05-01 22:59:34 +02:00
|
|
|
# hierarchical_training.py example; --torch is not passed.
py_test(
    name = "examples/hierarchical_training_tf",
    size = "medium",
    main = "examples/hierarchical_training.py",
    srcs = ["examples/hierarchical_training.py"],
    args = ["--stop-reward=0.0"],
    tags = ["examples", "examples_H"],
)
|
|
|
|
|
|
|
|
# hierarchical_training.py example with --torch.
py_test(
    name = "examples/hierarchical_training_torch",
    size = "medium",
    main = "examples/hierarchical_training.py",
    srcs = ["examples/hierarchical_training.py"],
    args = ["--torch", "--stop-reward=0.0"],
    tags = ["examples", "examples_H"],
)
|
|
|
|
|
2020-05-12 08:23:10 +02:00
|
|
|
# Do not run this test: MobileNetV2 is gigantic, and even a single iteration
# takes far too long.
# py_test(
#     name = "examples/mobilenet_v2_with_lstm_tf",
#     main = "examples/mobilenet_v2_with_lstm.py",
#     tags = ["examples", "examples_M"],
#     size = "small",
#     srcs = ["examples/mobilenet_v2_with_lstm.py"]
# )
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# multi_agent_cartpole.py example; --torch is not passed.
py_test(
    name = "examples/multi_agent_cartpole_tf",
    size = "medium",
    main = "examples/multi_agent_cartpole.py",
    srcs = ["examples/multi_agent_cartpole.py"],
    args = ["--as-test", "--stop-reward=70.0", "--num-cpus=4"],
    tags = ["examples", "examples_M"],
)
|
|
|
|
|
|
|
|
# multi_agent_cartpole.py example with --torch.
py_test(
    name = "examples/multi_agent_cartpole_torch",
    size = "medium",
    main = "examples/multi_agent_cartpole.py",
    srcs = ["examples/multi_agent_cartpole.py"],
    args = ["--as-test", "--torch", "--stop-reward=70.0", "--num-cpus=4"],
    tags = ["examples", "examples_M"],
)
|
|
|
|
|
|
|
|
# multi_agent_custom_policy.py example; --torch is not passed.
py_test(
    name = "examples/multi_agent_custom_policy_tf",
    size = "small",
    main = "examples/multi_agent_custom_policy.py",
    srcs = ["examples/multi_agent_custom_policy.py"],
    args = ["--as-test", "--stop-reward=80"],
    tags = ["examples", "examples_M"],
)
|
|
|
|
|
|
|
|
# multi_agent_custom_policy.py example with --torch.
py_test(
    name = "examples/multi_agent_custom_policy_torch",
    size = "small",
    main = "examples/multi_agent_custom_policy.py",
    srcs = ["examples/multi_agent_custom_policy.py"],
    args = ["--as-test", "--torch", "--stop-reward=80"],
    tags = ["examples", "examples_M"],
)
|
|
|
|
|
|
|
|
# multi_agent_two_trainers.py example; neither --torch nor --mixed-torch-tf
# is passed.
py_test(
    name = "examples/multi_agent_two_trainers_tf",
    size = "medium",
    main = "examples/multi_agent_two_trainers.py",
    srcs = ["examples/multi_agent_two_trainers.py"],
    args = ["--as-test", "--stop-reward=70"],
    tags = ["examples", "examples_M"],
)
|
|
|
|
|
2020-05-07 23:40:29 -07:00
|
|
|
# multi_agent_two_trainers.py example with --torch.
py_test(
    name = "examples/multi_agent_two_trainers_torch",
    size = "medium",
    main = "examples/multi_agent_two_trainers.py",
    srcs = ["examples/multi_agent_two_trainers.py"],
    args = ["--as-test", "--torch", "--stop-reward=70"],
    tags = ["examples", "examples_M"],
)
|
|
|
|
|
|
|
|
# multi_agent_two_trainers.py example with --mixed-torch-tf.
py_test(
    name = "examples/multi_agent_two_trainers_mixed_torch_tf",
    size = "medium",
    main = "examples/multi_agent_two_trainers.py",
    srcs = ["examples/multi_agent_two_trainers.py"],
    args = ["--as-test", "--mixed-torch-tf", "--stop-reward=70"],
    tags = ["examples", "examples_M"],
)
|
|
|
|
|
2020-04-28 14:59:16 +02:00
|
|
|
# nested_action_spaces.py example with --run=PPO; --torch is not passed.
py_test(
    name = "examples/nested_action_spaces_ppo_tf",
    size = "medium",
    main = "examples/nested_action_spaces.py",
    srcs = ["examples/nested_action_spaces.py"],
    args = ["--as-test", "--stop-reward=-600", "--run=PPO"],
    tags = ["examples", "examples_N"],
)
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# nested_action_spaces.py example with --run=PPO and --torch.
py_test(
    name = "examples/nested_action_spaces_ppo_torch",
    size = "medium",
    main = "examples/nested_action_spaces.py",
    srcs = ["examples/nested_action_spaces.py"],
    args = ["--as-test", "--torch", "--stop-reward=-600", "--run=PPO"],
    tags = ["examples", "examples_N"],
)
|
|
|
|
|
|
|
|
# parametric_actions_cartpole.py example with --run=PG; --torch is not passed.
py_test(
    name = "examples/parametric_actions_cartpole_pg_tf",
    size = "medium",
    main = "examples/parametric_actions_cartpole.py",
    srcs = ["examples/parametric_actions_cartpole.py"],
    args = ["--as-test", "--stop-reward=60.0", "--run=PG"],
    tags = ["examples", "examples_P"],
)
|
|
|
|
|
|
|
|
# parametric_actions_cartpole.py example with --run=DQN; --torch is not
# passed.
py_test(
    name = "examples/parametric_actions_cartpole_dqn_tf",
    size = "medium",
    main = "examples/parametric_actions_cartpole.py",
    srcs = ["examples/parametric_actions_cartpole.py"],
    args = ["--as-test", "--stop-reward=60.0", "--run=DQN"],
    tags = ["examples", "examples_P"],
)
|
|
|
|
|
|
|
|
# parametric_actions_cartpole.py example with --run=PG and --torch.
py_test(
    name = "examples/parametric_actions_cartpole_pg_torch",
    size = "small",
    main = "examples/parametric_actions_cartpole.py",
    srcs = ["examples/parametric_actions_cartpole.py"],
    args = ["--as-test", "--torch", "--stop-reward=60.0", "--run=PG"],
    tags = ["examples", "examples_P"],
)
|
|
|
|
|
|
|
|
# parametric_actions_cartpole.py example with --run=DQN and --torch.
py_test(
    name = "examples/parametric_actions_cartpole_dqn_torch",
    size = "medium",
    main = "examples/parametric_actions_cartpole.py",
    srcs = ["examples/parametric_actions_cartpole.py"],
    args = ["--as-test", "--torch", "--stop-reward=60.0", "--run=DQN"],
    tags = ["examples", "examples_P"],
)
|
|
|
|
|
|
|
|
# rollout_worker_custom_workflow.py example (no explicit `main`).
py_test(
    name = "examples/rollout_worker_custom_workflow",
    size = "small",
    srcs = ["examples/rollout_worker_custom_workflow.py"],
    args = ["--num-cpus=4"],
    tags = ["examples", "examples_R"],
)
|
|
|
|
|
2020-05-12 08:23:10 +02:00
|
|
|
# rock_paper_scissors_multiagent.py example; --torch is not passed.
py_test(
    name = "examples/rock_paper_scissors_multiagent_tf",
    size = "medium",
    main = "examples/rock_paper_scissors_multiagent.py",
    srcs = ["examples/rock_paper_scissors_multiagent.py"],
    args = ["--as-test"],
    tags = ["examples", "examples_R"],
)
|
|
|
|
|
|
|
|
# rock_paper_scissors_multiagent.py example with --torch.
py_test(
    name = "examples/rock_paper_scissors_multiagent_torch",
    size = "medium",
    main = "examples/rock_paper_scissors_multiagent.py",
    srcs = ["examples/rock_paper_scissors_multiagent.py"],
    args = ["--as-test", "--torch"],
    tags = ["examples", "examples_R"],
)
|
|
|
|
|
2020-02-26 22:54:41 -08:00
|
|
|
# two_trainer_workflow.py example; neither --torch nor --mixed-torch-tf is
# passed.
py_test(
    name = "examples/two_trainer_workflow_tf",
    size = "small",
    main = "examples/two_trainer_workflow.py",
    srcs = ["examples/two_trainer_workflow.py"],
    args = ["--as-test", "--stop-reward=100.0"],
    tags = ["examples", "examples_T"],
)
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# two_trainer_workflow.py example with --torch.
py_test(
    name = "examples/two_trainer_workflow_torch",
    size = "small",
    main = "examples/two_trainer_workflow.py",
    srcs = ["examples/two_trainer_workflow.py"],
    args = ["--as-test", "--torch", "--stop-reward=100.0"],
    tags = ["examples", "examples_T"],
)
|
|
|
|
|
2020-03-26 13:41:16 -07:00
|
|
|
# two_trainer_workflow.py example with --mixed-torch-tf.
py_test(
    name = "examples/two_trainer_workflow_mixed_torch_tf",
    size = "small",
    main = "examples/two_trainer_workflow.py",
    srcs = ["examples/two_trainer_workflow.py"],
    args = ["--as-test", "--mixed-torch-tf", "--stop-reward=100.0"],
    tags = ["examples", "examples_T"],
)
|
|
|
|
|
|
|
|
# twostep_game.py example with --run=contrib/MADDPG.
py_test(
    name = "examples/twostep_game_maddpg",
    size = "large",
    main = "examples/twostep_game.py",
    srcs = ["examples/twostep_game.py"],
    args = ["--stop-timesteps=2000", "--run=contrib/MADDPG"],
    tags = ["examples", "examples_T"],
)
|
|
|
|
|
2020-02-15 23:50:44 +01:00
|
|
|
# twostep_game.py example with --run=PG; --torch is not passed.
py_test(
    name = "examples/twostep_game_pg_tf",
    size = "medium",
    main = "examples/twostep_game.py",
    srcs = ["examples/twostep_game.py"],
    args = ["--as-test", "--stop-reward=7", "--run=PG"],
    tags = ["examples", "examples_T"],
)
|
|
|
|
|
|
|
|
# twostep_game.py example with --run=PG and --torch.
py_test(
    name = "examples/twostep_game_pg_torch",
    size = "medium",
    main = "examples/twostep_game.py",
    srcs = ["examples/twostep_game.py"],
    args = ["--as-test", "--torch", "--stop-reward=7", "--run=PG"],
    tags = ["examples", "examples_T"],
)
|
|
|
|
|
|
|
|
# twostep_game.py example with --run=QMIX.
py_test(
    name = "examples/twostep_game_qmix",
    size = "medium",
    main = "examples/twostep_game.py",
    srcs = ["examples/twostep_game.py"],
    args = ["--stop-timesteps=2000", "--run=QMIX"],
    tags = ["examples", "examples_T"],
)
|
|
|
|
|
|
|
|
# simple_context_bandit.py example with --run=contrib/LinTS.
py_test(
    name = "contrib/bandits/examples/lin_ts",
    size = "small",
    main = "contrib/bandits/examples/simple_context_bandit.py",
    srcs = ["contrib/bandits/examples/simple_context_bandit.py"],
    args = ["--as-test", "--stop-reward=10", "--run=contrib/LinTS"],
    tags = ["examples", "examples_T"],
)
|
|
|
|
|
|
|
|
# simple_context_bandit.py example with --run=contrib/LinUCB.
py_test(
    name = "contrib/bandits/examples/lin_ucb",
    size = "small",
    main = "contrib/bandits/examples/simple_context_bandit.py",
    srcs = ["contrib/bandits/examples/simple_context_bandit.py"],
    args = ["--as-test", "--stop-reward=10", "--run=contrib/LinUCB"],
    tags = ["examples", "examples_U"],
)
|