2018-12-21 03:44:34 +09:00
|
|
|
"""Registry of algorithm names for `rllib train --run=<alg_name>`"""
|
|
|
|
|
|
|
|
|
|
|
|
def _import_random_agent():
    """Import the contributed RandomAgent and return it with its config.

    The import statement lives inside the function body, so it only runs
    when this function is called.

    Returns:
        A 2-tuple ``(RandomAgent, RandomAgent._default_config)``.
    """
    from ray.rllib.contrib.random_agent.random_agent import RandomAgent

    agent_cls = RandomAgent
    return agent_cls, agent_cls._default_config
|
2018-12-21 03:44:34 +09:00
|
|
|
|
|
|
|
|
2019-08-06 19:22:06 -04:00
|
|
|
def _import_maddpg():
    """Import the contributed MADDPG package and return trainer and config.

    The import statement lives inside the function body, so it only runs
    when this function is called.

    Returns:
        A 2-tuple ``(maddpg.MADDPGTrainer, maddpg.DEFAULT_CONFIG)``.
    """
    from ray.rllib.contrib import maddpg

    trainer_cls = maddpg.MADDPGTrainer
    default_config = maddpg.DEFAULT_CONFIG
    return trainer_cls, default_config
|
2019-08-06 19:22:06 -04:00
|
|
|
|
|
|
|
|
2019-12-07 21:08:40 +01:00
|
|
|
def _import_alphazero():
    """Import the contributed AlphaZero trainer and its default config.

    The import statement lives inside the function body, so it only runs
    when this function is called.

    Returns:
        A 2-tuple ``(AlphaZeroTrainer, DEFAULT_CONFIG)``.
    """
    from ray.rllib.contrib.alpha_zero.core.alpha_zero_trainer import (
        AlphaZeroTrainer,
        DEFAULT_CONFIG,
    )

    return (AlphaZeroTrainer, DEFAULT_CONFIG)
|
2019-12-07 21:08:40 +01:00
|
|
|
|
|
|
|
|
2020-03-26 13:41:16 -07:00
|
|
|
def _import_bandit_lints():
    """Import the contributed LinTS bandit trainer and its config.

    The import statement lives inside the function body, so it only runs
    when this function is called.

    Returns:
        A 2-tuple ``(LinTSTrainer, TS_CONFIG)``.
    """
    from ray.rllib.contrib.bandits.agents.lin_ts import LinTSTrainer, TS_CONFIG

    trainer_and_config = (LinTSTrainer, TS_CONFIG)
    return trainer_and_config
|
2020-03-26 13:41:16 -07:00
|
|
|
|
|
|
|
|
|
|
|
def _import_bandit_linucb():
    """Import the contributed LinUCB bandit trainer and its config.

    The import statement lives inside the function body, so it only runs
    when this function is called.

    Returns:
        A 2-tuple ``(LinUCBTrainer, UCB_CONFIG)``.
    """
    from ray.rllib.contrib.bandits.agents.lin_ucb import (
        LinUCBTrainer,
        UCB_CONFIG,
    )

    return (LinUCBTrainer, UCB_CONFIG)
|
2020-03-26 13:41:16 -07:00
|
|
|
|
|
|
|
|
2018-12-21 03:44:34 +09:00
|
|
|
# Maps each "contrib/<Name>" algorithm name to the module-level function
# that imports it. The functions are stored uncalled, so no import runs
# while this dict is being built.
CONTRIBUTED_ALGORITHMS = {
    "contrib/RandomAgent": _import_random_agent,
    "contrib/MADDPG": _import_maddpg,
    "contrib/AlphaZero": _import_alphazero,
    "contrib/LinTS": _import_bandit_lints,
    "contrib/LinUCB": _import_bandit_linucb,
}
|