# Experiment definition: runs the IMPALA algorithm on the
# BreakoutNoFrameskip-v4 environment.
impala-breakoutnoframeskip-v4:
  env: BreakoutNoFrameskip-v4
  run: IMPALA

  # Minimum reward and total timesteps (reached within the given
  # time_total_s) required to pass this test.
  pass_criteria:
    episode_reward_mean: 200.0
    timesteps_total: 6000000

  # Stopping condition for the run.
  # NOTE(review): unit is presumably seconds (1 hour), going by the `_s`
  # suffix -- confirm against the consumer.
  stop:
    time_total_s: 3600

  # Settings handed to the algorithm.
  config:
    rollout_fragment_length: 50
    train_batch_size: 500
    num_workers: 10
    num_envs_per_worker: 5
    clip_rewards: true
    # NOTE(review): entries look like [timestep, learning_rate] pairs,
    # i.e. the rate decays from 0.0005 towards ~0 by timestep 20M --
    # confirm against the consumer's lr_schedule semantics.
    lr_schedule:
      - [0, 0.0005]
      - [20000000, 0.000000000001]
    num_gpus: 1