# Experiment definition keyed by its name.
# NOTE(review): the env/run/stop/config layout looks like a Ray Tune / RLlib
# experiment spec; confirm against the tool that loads this file.
pendulum-ddpg-tf:
  # Environment identifier and algorithm name, passed through as strings.
  env: Pendulum-v0
  run: DDPG

  # Stopping thresholds.
  # NOTE(review): presumably the run ends as soon as either threshold is
  # reached; verify against the consumer's stop-criteria semantics.
  stop:
    episode_reward_mean: -700
    timesteps_total: 100000

  # Algorithm-specific settings (real booleans, not strings).
  config:
    # NOTE(review): false presumably selects the non-PyTorch backend,
    # matching the "-tf" suffix of the experiment name; confirm.
    use_pytorch: false
    use_huber: true
    clip_rewards: false