# Mirror of https://github.com/vale981/ray (synced 2025-03-12 06:06:39 -04:00).
# File size: 29 lines, 696 B. Format: YAML.
# Experiment definition: runs DDPG on the Pendulum-v0 environment with two
# "fake" GPUs (see the last stanza of `config`).
#
# NOTE(review): the nesting below was reconstructed from key order after the
# original indentation was lost; confirm that `final_scale` is the only child
# of `exploration_config` and that both stop criteria belong under `stop`.
pendulum-ddpg-fake-gpus:
  env: Pendulum-v0
  run: DDPG

  # Stopping criteria for the run.
  stop:
    episode_reward_mean: -700
    timesteps_total: 100000

  # Algorithm settings passed to the DDPG run.
  config:
    # Works for both torch and tf.
    framework: tf
    actor_hiddens: [64, 64]
    critic_hiddens: [64, 64]
    n_step: 1
    model: {}
    gamma: 0.99
    exploration_config:
      final_scale: 0.02
    timesteps_per_iteration: 600
    buffer_size: 10000
    clip_rewards: false
    use_huber: true
    learning_starts: 500
    train_batch_size: 64
    num_workers: 0
    # Canonical lowercase boolean, consistent with the other flags here.
    worker_side_prioritization: false

    # Fake 2 GPUs.
    num_gpus: 2
    _fake_gpus: true