# Experiment "dynamics-dyna": runs the DYNA algorithm with a grid search
# over the MuJoCo-style environments listed under `env.grid_search`.
dynamics-dyna:
  # Environments to sweep over; each list entry is one grid-search value.
  env:
    grid_search:
      - HalfCheetah-v2
      - Humanoid-v2
      - Ant-v2
      - Hopper-v2
  # Name of the algorithm/trainable to run.
  run: DYNA
  # Directory where results are written (`~` here is part of a path string,
  # not a YAML null).
  local_dir: ~/dyna_results
  # Stopping criterion: end after this many training iterations.
  stop:
    training_iteration: 4000
  # Algorithm-specific settings passed through to the trainer.
  config:
    # Works for both torch and tf.
    framework: torch
    rollout_fragment_length: 200
    train_batch_size: 1000
    num_workers: 1