---
# Experiment definition keyed by its name. The layout (env / run / stop /
# config) looks like a Ray Tune / RLlib experiment spec -- confirm against
# the loader that consumes this file.
cartpole-a2c-torch:
  # Environment identifier and algorithm name handed to the runner.
  env: CartPole-v0
  run: A2C

  # Stopping criteria. Presumably the run ends as soon as either threshold
  # is reached -- verify against the consumer's semantics.
  stop:
    episode_reward_mean: 100
    timesteps_total: 100000

  # Algorithm-specific settings.
  config:
    # NOTE(review): 0 presumably means no separate rollout workers
    # (sampling happens in the driver process) -- confirm.
    num_workers: 0
    # Presumably selects the PyTorch implementation of the algorithm
    # rather than the default framework -- confirm.
    use_pytorch: true