from ray import tune
from ray.rllib.agents.ppo import PPOTrainer

# Stopping criteria handed to `tune.run`, keyed by reported metric name.
# NOTE(review): a mean episode length of 20 looks low for CartPole; presumably
# this is meant as a quick smoke run -- confirm the intended threshold.
STOP_CRITERIA = {"episode_len_mean": 20}

# Trainer configuration: environment id, deep-learning framework, log level.
TRAINER_CONFIG = {
    "env": "CartPole-v0",
    "framework": "torch",
    "log_level": "INFO",
}

# Launch the PPO experiment through Tune with the settings defined above.
tune.run(PPOTrainer, stop=STOP_CRITERIA, config=TRAINER_CONFIG)