# ray/rllib/tuned_examples/ddpg/pendulum-td3-fake-gpus.yaml
# 2022-05-05 09:41:38 +02:00
#
# 20 lines
# 501 B
# YAML

# Tuned example: TD3 on Pendulum-v1 with two simulated ("fake") GPUs.
pendulum-td3-fake-gpus:
  env: Pendulum-v1
  run: TD3
  # Stopping criteria for the run: a reward threshold and a timestep budget.
  stop:
    episode_reward_mean: -900
    timesteps_total: 100000
  # Settings under this key are the algorithm configuration for the run.
  config:
    # Works for both torch and tf.
    framework: tf
    actor_hiddens: [64, 64]
    critic_hiddens: [64, 64]
    # Same value as exploration_config.random_timesteps below; presumably
    # learning is meant to begin once random exploration ends -- confirm.
    learning_starts: 5000
    exploration_config:
      random_timesteps: 5000
    evaluation_interval: 10
    evaluation_num_episodes: 5

    # Fake 2 GPUs.
    num_gpus: 2
    _fake_gpus: true