"""Launch a PPO training run on CartPole-v0 through Ray Tune."""

from ray import tune
from ray.rllib.agents.ppo import PPOTrainer

# Hand the PPO trainer class to Tune together with its stopping criterion
# and trainer configuration. The call runs at module level, so executing
# (or importing) this file starts the experiment.
tune.run(
    PPOTrainer,
    # Stopping criterion keyed on the reported "episode_len_mean" metric,
    # with a threshold of 20.
    stop={"episode_len_mean": 20},
    config={
        "env": "CartPole-v0",
        "framework": "torch",
        "log_level": "INFO",
    },
)