2018-04-11 15:08:39 -07:00
|
|
|
pendulum-ddpg:
|
|
|
|
env: Pendulum-v0
|
|
|
|
run: DDPG
|
|
|
|
stop:
|
2018-12-11 17:21:53 -08:00
|
|
|
episode_reward_mean: -900
|
|
|
|
timesteps_total: 100000
|
2018-04-11 15:08:39 -07:00
|
|
|
config:
|
2018-04-30 00:18:15 -07:00
|
|
|
use_huber: True
|
|
|
|
clip_rewards: False
|
|
|
|
exploration_fraction: 0.1
|