---
# Experiment "atari-dist-dqn": runs DQN with `num_atoms: 51` over a grid of
# four Atari NoFrameskip-v4 environments.
#
# NOTE(review): this file was recovered from a view that had lost its
# indentation, so the nesting below was reconstructed from the key names.
# Confirm against the consumer's schema -- in particular that `type` and
# `capacity` belong to `replay_buffer_config`, and that `epsilon_timesteps`
# and `final_epsilon` belong to `exploration_config`.
atari-dist-dqn:
  env:
    # One trial is launched per listed environment.
    grid_search:
      - BreakoutNoFrameskip-v4
      - BeamRiderNoFrameskip-v4
      - QbertNoFrameskip-v4
      - SpaceInvadersNoFrameskip-v4
  run: DQN
  config:
    # Double-Q, dueling and noisy layers are all switched off; only the
    # multi-atom setting (`num_atoms`) is enabled.
    double_q: false
    dueling: false
    num_atoms: 51
    noisy: false
    replay_buffer_config:
      type: MultiAgentReplayBuffer
      capacity: 1000000
    num_steps_sampled_before_learning_starts: 20000
    n_step: 1
    target_network_update_freq: 8000
    # Floats are written with a leading zero for readability; the values are
    # the same as the previous `.0000625` / `.00015` spellings.
    lr: 0.0000625
    adam_epsilon: 0.00015
    hiddens: [512]
    rollout_fragment_length: 4
    train_batch_size: 32
    exploration_config:
      epsilon_timesteps: 200000
      final_epsilon: 0.01
    # Fractional GPU request (0.2 of a device per trial).
    num_gpus: 0.2
    min_sample_timesteps_per_iteration: 10000