# Experiment definition `cartpole-ars-tf`: runs `ARS` on the `CartPole-v0`
# environment.
# NOTE(review): nesting below was reconstructed from key order after the
# original indentation was lost — confirm against the consumer's schema.
cartpole-ars-tf:
  env: CartPole-v0
  run: ARS
  # Presumably the run ends as soon as either criterion is met — TODO confirm.
  stop:
    episode_reward_mean: 50
    timesteps_total: 500000
  config:
    # The `-tf` suffix in the experiment name suggests this selects the
    # non-PyTorch backend — verify.
    use_pytorch: false
    noise_stdev: 0.02
    num_rollouts: 50
    rollouts_used: 25
    num_workers: 2
    sgd_stepsize: 0.01
    noise_size: 25000000
    eval_prob: 0.5
    model:
      fcnet_hiddens: []  # a linear policy