# File: ray/rllib/tuned_examples/pong-impala.yaml

# This can reach 18-19 reward within 10 minutes on a Tesla M60 GPU
# (e.g., a G3 EC2 node) when run with 128 workers. Time by worker count:
#   128 workers -> 8 minutes
#   32 workers -> 17 minutes
#   16 workers -> 40+ minutes
# See also: pong-impala-fast.yaml, pong-impala-vectorized.yaml
# Experiment definition: the top-level key is the experiment name, and
# everything belonging to it must be nested beneath that key.
pong-impala:
  # Environment ID to train on.
  env: PongNoFrameskip-v4
  # Name of the algorithm to run.
  run: IMPALA
  # Algorithm settings; these keys must be nested under `config`, not
  # placed at the top level of the file.
  config:
    rollout_fragment_length: 50
    train_batch_size: 500
    # 128 workers is the fastest setting in the timings listed above.
    num_workers: 128
    num_envs_per_worker: 1