---
# Test entry: runs TD3 on HalfCheetahBulletEnv-v0.
td3-halfcheetahbulletenv-v0:
  env: HalfCheetahBulletEnv-v0
  run: TD3
  # Minimum mean episode reward and total timesteps that must be reached
  # (within the time_total_s budget given under `stop`) to pass this test.
  pass_criteria:
    episode_reward_mean: 400.0
    timesteps_total: 1000000
  stop:
    # Time budget for the run; presumably seconds (7200 s = 2 h) - confirm.
    time_total_s: 7200
  config:
    num_gpus: 1
    # NOTE(review): learning_starts and random_timesteps are both 10000;
    # presumably kept equal on purpose - confirm before changing either one.
    learning_starts: 10000
    exploration_config:
      random_timesteps: 10000