2020-11-24 16:00:33 -08:00
|
|
|
# This workload tests running many instances of PPO (many actors)
|
|
|
|
# This covers https://github.com/ray-project/ray/pull/12148
|
|
|
|
|
|
|
|
import ray
|
|
|
|
from ray.tune import run_experiments
|
|
|
|
|
|
|
|
num_redis_shards = 5
|
|
|
|
redis_max_memory = 10**8
|
|
|
|
object_store_memory = 10**9
|
|
|
|
num_nodes = 3
|
|
|
|
|
|
|
|
message = ("Make sure there is enough memory on this machine to run this "
|
|
|
|
"workload. We divide the system memory by 2 to provide a buffer.")
|
|
|
|
assert (num_nodes * object_store_memory + num_redis_shards * redis_max_memory <
|
2021-05-04 23:10:04 +02:00
|
|
|
ray._private.utils.get_system_memory() / 2), message
|
2020-11-24 16:00:33 -08:00
|
|
|
|
|
|
|
# Simulate a cluster on one machine.
|
|
|
|
|
2021-05-04 23:10:04 +02:00
|
|
|
ray.init(address="auto")
|
2020-11-24 16:00:33 -08:00
|
|
|
|
|
|
|
# Run the workload.
|
|
|
|
|
|
|
|
run_experiments({
|
|
|
|
"ppo": {
|
|
|
|
"run": "PPO",
|
|
|
|
"env": "CartPole-v0",
|
|
|
|
"num_samples": 10000,
|
|
|
|
"config": {
|
2021-05-04 23:10:04 +02:00
|
|
|
"framework": "torch",
|
|
|
|
"num_workers": 7,
|
2020-11-24 16:00:33 -08:00
|
|
|
"num_gpus": 0,
|
|
|
|
"num_sgd_iter": 1,
|
|
|
|
},
|
|
|
|
"stop": {
|
|
|
|
"timesteps_total": 1,
|
|
|
|
},
|
|
|
|
}
|
|
|
|
})
|