2022-05-28 10:50:03 +02:00
|
|
|
cartpole-crashing-with-remote-envs-pg:
|
|
|
|
env: ray.rllib.examples.env.cartpole_crashing.CartPoleCrashing
|
|
|
|
run: PG
|
|
|
|
stop:
|
2022-07-27 18:03:51 -07:00
|
|
|
evaluation/episode_reward_mean: 35.0
|
2022-05-28 10:50:03 +02:00
|
|
|
timesteps_total: 25000
|
|
|
|
config:
|
|
|
|
# Works for both torch and tf.
|
|
|
|
framework: tf
|
|
|
|
env_config:
|
|
|
|
config:
|
|
|
|
p_crash: 0.0
|
2022-06-20 19:53:47 +02:00
|
|
|
# Crash all envs always exactly after n steps.
|
2022-05-28 10:50:03 +02:00
|
|
|
crash_after_n_steps: 60
|
|
|
|
# Time for the env to initialize when newly created.
|
|
|
|
# Every time a remote sub-environment crashes, a new env is created
|
2022-07-15 08:55:14 +02:00
|
|
|
# in its place and will take this long (sleep) to "initialize".
|
2022-05-28 10:50:03 +02:00
|
|
|
init_time_s: 2.0
|
|
|
|
num_workers: 4
|
|
|
|
num_envs_per_worker: 3
|
|
|
|
rollout_fragment_length: 50
|
|
|
|
# Use parallel remote envs.
|
|
|
|
remote_worker_envs: true
|
2022-07-15 08:55:14 +02:00
|
|
|
|
2022-07-27 18:03:51 -07:00
|
|
|
# Disable env checking. Env checker doesn't handle Exceptions from
|
|
|
|
# user envs, and will crash rollout worker.
|
|
|
|
disable_env_checking: true
|
|
|
|
|
2022-05-28 10:50:03 +02:00
|
|
|
# Switch on resiliency for failed sub environments (within a vectorized stack).
|
|
|
|
restart_failed_sub_environments: true
|
2022-07-27 18:03:51 -07:00
|
|
|
|
|
|
|
evaluation_num_workers: 2
|
|
|
|
evaluation_interval: 1
|
|
|
|
evaluation_duration: 20
|
|
|
|
evaluation_duration_unit: episodes
|
|
|
|
evaluation_parallel_to_training: true
|
|
|
|
evaluation_config:
|
|
|
|
explore: false
|
|
|
|
env_config:
|
|
|
|
config:
|
|
|
|
# Make eval workers solid.
|
|
|
|
# This test is to prove that we can learn with crashing env,
|
|
|
|
# not eval with crashing env.
|
|
|
|
p_crash: 0.0
|
|
|
|
p_crash_reset: 0.0
|
|
|
|
init_time_s: 0.0
|