# ray/rllib/tuned_examples/ppo/memory-leak-test-ppo.yaml
#
# 17 lines
# 505 B
# YAML

# Experiment definition: runs PPO against a random environment with a large
# observation space.
# NOTE(review): the nesting below was reconstructed after the original
# indentation was lost; confirm that the rollout/SGD keys belong directly
# under the outer `config` and not under `env_config`.
memory-leak-test-ppo:
  # Fully qualified class path of the environment to run.
  env: ray.rllib.examples.env.random_env.RandomLargeObsSpaceEnv
  # Algorithm to run.
  run: PPO
  config:
    # Works for both torch and tf.
    framework: tf
    # Switch off np.random, which is known to have memory leaks.
    env_config:
      config:
        static_samples: true
    # Sampling settings.
    rollout_fragment_length: 20
    num_workers: 4
    num_envs_per_worker: 5
    # Training batch and SGD settings.
    train_batch_size: 1000
    sgd_minibatch_size: 256
    num_sgd_iter: 5