mirror of
https://github.com/vale981/ray
synced 2025-03-06 10:31:39 -05:00
15 lines
477 B
YAML
15 lines
477 B
YAML
# Tuned example: APEX_DDPG on MountainCarContinuous-v0.
# This can be expected to reach 90 reward within ~1.5-2.5M timesteps
# (~150-250 seconds on a K40 GPU).
mountaincarcontinuous-apex-ddpg:
  env: MountainCarContinuous-v0
  run: APEX_DDPG
  # The reward target named in the header comment above.
  stop:
    episode_reward_mean: 90
  config:
    clip_rewards: false
    num_workers: 16
    exploration_ou_noise_scale: 1.0
    n_step: 3
    # NOTE(review): tau of 1.0 together with a large update interval looks
    # like a periodic hard target-network copy; confirm against the
    # algorithm's config documentation.
    target_network_update_freq: 50000
    tau: 1.0
    evaluation_interval: 5
    evaluation_num_episodes: 10