# Source: ray/rllib/tuned_examples/regression_tests/cartpole-appo.yaml
# File viewer metadata: 13 lines, 292 B, YAML

# Regression-test experiment: the APPO algorithm on the CartPole-v0
# environment. The top-level key is the experiment name; everything
# belonging to the experiment is nested beneath it.
cartpole-appo:
  env: CartPole-v0
  run: APPO
  # Stopping criteria.
  # NOTE(review): presumably the run ends as soon as either threshold is
  # reached -- confirm against the Tune `stop` documentation.
  stop:
    episode_reward_mean: 100
    timesteps_total: 100000
  # Algorithm-specific settings handed to the APPO trainer.
  config:
    # Batch sizes are deliberately tiny (10 and 10).
    # NOTE(review): assumed to keep the regression test fast -- confirm.
    sample_batch_size: 10
    train_batch_size: 10
    num_envs_per_worker: 5
    num_workers: 1
    # No GPU is requested.
    num_gpus: 0
    # NOTE(review): presumably disables V-trace off-policy correction in
    # APPO -- verify against the RLlib APPO config reference.
    vtrace: false