# Tuned APEX_DDPG experiment for MountainCarContinuous-v0.
# This can be expected to reach 90 reward within ~1.5-2.5 million timesteps
# (~150-250 seconds) on a K40 GPU.
#
# NOTE(review): the nesting below was reconstructed from a flattened copy of
# this file (indentation lost, blame timestamps interleaved). It assumes the
# usual experiment layout: env/run/stop/config under the experiment name, and
# all hyperparameters under `config` -- confirm against the upstream file.
mountaincarcontinuous-apex-ddpg:
  env: MountainCarContinuous-v0
  run: APEX_DDPG
  # Stop the trial once the mean episode reward reaches the target.
  stop:
    episode_reward_mean: 90
  config:
    clip_rewards: false
    num_workers: 16
    exploration_ou_noise_scale: 1.0
    n_step: 3
    target_network_update_freq: 50000
    tau: 1.0
    # Evaluation settings (added later than the rest of the config).
    evaluation_interval: 5
    evaluation_num_episodes: 10