# File: ray/release/rllib_tests/learning_tests/yaml_files/bc-halfcheetahbulletenv-v0.yaml
# (File-viewer metadata captured with this paste: 25 lines, 688 B, YAML.)

# Learning-test experiment: runs the `BC` algorithm against
# HalfCheetahBulletEnv-v0. Training reads pre-recorded experience from a zip
# archive; evaluation overrides `input` with `sampler`.
#
# NOTE(review): the nesting below was reconstructed from a paste whose
# indentation had been flattened (which left `input` duplicated at one level).
# Confirm the hierarchy against the consuming test harness.
bc-halfcheetahbulletenv-v0:
  env: HalfCheetahBulletEnv-v0
  run: BC
  # Presumably the thresholds the run has to reach to count as passing;
  # verify the exact semantics against the harness that reads this file.
  pass_criteria:
    evaluation/episode_reward_mean: 400.0
    timesteps_total: 10000000
  # Stop condition: 3600 s of total run time.
  stop:
    time_total_s: 3600

  config:
    # Use input produced by expert SAC algo.
    input: ["~/halfcheetah_expert_sac.zip"]
    actions_in_input_normalized: true

    num_gpus: 1

    model:
      fcnet_activation: relu
      fcnet_hiddens: [256, 256, 256]

    evaluation_num_workers: 1
    evaluation_parallel_to_training: true
    evaluation_interval: 3
    # Evaluation replaces the offline `input` above with `sampler`
    # (presumably live environment rollouts; see the RLlib offline-data docs).
    evaluation_config:
      input: sampler
    # NOTE(review): placed at the `config` level as a sibling of
    # `evaluation_config`, not inside it; confirm.
    always_attach_evaluation_results: true