2018-11-06 17:09:34 -10:00
|
|
|
# Expect the reward to improve to -140 within ~300-500k timesteps.
|
2018-09-26 22:32:26 -07:00
|
|
|
# Experiment `swimmer-ars`: pairs `run: ARS` with `env: Swimmer-v2`; the
# algorithm settings are listed after `config:`.
swimmer-ars:
|
2018-08-24 22:20:02 -07:00
|
|
|
env: Swimmer-v2
|
|
|
|
run: ARS
|
|
|
|
config:
|
2020-05-26 11:10:27 +02:00
|
|
|
# This configuration works for both torch and tf; tf is selected here.
|
2020-05-27 16:19:13 +02:00
|
|
|
framework: tf
|
2018-08-24 22:20:02 -07:00
|
|
|
noise_stdev: 0.01
|
2018-09-26 22:32:26 -07:00
|
|
|
# NOTE(review): rollouts_used is presumably a subset of num_rollouts
# (both are 1 here) — confirm against the ARS documentation.
num_rollouts: 1
|
|
|
|
rollouts_used: 1
|
2018-08-24 22:20:02 -07:00
|
|
|
num_workers: 1
|
2018-09-26 22:32:26 -07:00
|
|
|
sgd_stepsize: 0.02
|
2018-08-24 22:20:02 -07:00
|
|
|
# 2.5e8. NOTE(review): the unit is not stated here — confirm against the
# ARS documentation.
noise_size: 250000000
|
|
|
|
eval_prob: 0.2
|
|
|
|
offset: 0
|
2018-09-26 22:32:26 -07:00
|
|
|
observation_filter: NoFilter
|
|
|
|
report_length: 3
|
2018-10-01 12:49:39 -07:00
|
|
|
model:
|
|
|
|
fcnet_hiddens: []  # empty list of hidden layers, i.e. a linear policy
|