Mirror of https://github.com/vale981/ray (last synced 2025-03-06 18:41:40 -05:00).

* SAC Performance Fixes
* Small Changes
* Update sac_model.py
* fix normalize wrapper
* Update test_eager_support.py

Co-authored-by: Eric Liang <ekhliang@gmail.com>
12 lines
371 B
YAML
12 lines
371 B
YAML
# Experiment definition: runs the SAC algorithm on the Pendulum-v0 environment.
# NOTE(review): nesting below was reconstructed from a whitespace-mangled copy
# (`stop` and `config` had empty values followed by their presumed children);
# confirm against the upstream file.
pendulum-sac:
  env: Pendulum-v0
  run: SAC
  # Stopping thresholds for the run.
  stop:
    episode_reward_mean: -300  # note that evaluation perf is higher
    timesteps_total: 10000
  # Algorithm settings passed through to the trainer.
  config:
    evaluation_interval: 1  # logged under evaluation/* metric keys
    soft_horizon: true
    clip_actions: false
    normalize_actions: true
    metrics_smoothing_episodes: 5