ray/rllib/utils/__init__.py

import logging
import os

from ray.rllib.utils.filter_manager import FilterManager
from ray.rllib.utils.filter import Filter
from ray.rllib.utils.policy_client import PolicyClient
from ray.rllib.utils.policy_server import PolicyServer
from ray.tune.util import merge_dicts, deep_update

logger = logging.getLogger(__name__)


def renamed_class(cls, old_name):
    """Return a subclass of ``cls`` that warns about a rename when created.

    Args:
        cls: The class under its new name. The returned wrapper subclasses it.
        old_name (str): The deprecated name; only used in the warning text.

    Returns:
        A subclass of ``cls`` carrying the same ``__name__`` as ``cls``. Its
        constructor logs a warning through the module-level ``logger`` and
        then forwards all arguments to ``cls.__init__``.
    """

    class DeprecationWrapper(cls):
        # note: **kw not supported for ray.remote classes
        def __init__(self, *args, **kw):
            new_name = cls.__module__ + "." + cls.__name__
            # Use Logger.warning(): Logger.warn() is a deprecated alias that
            # itself triggers a DeprecationWarning on every call.
            logger.warning(
                "DeprecationWarning: {} has been renamed to {}. ".format(
                    old_name, new_name) +
                "This will raise an error in the future.")
            cls.__init__(self, *args, **kw)

    # Keep the wrapper indistinguishable by name from the wrapped class.
    DeprecationWrapper.__name__ = cls.__name__

    return DeprecationWrapper


def add_mixins(base, mixins):
    """Build a class deriving from ``base`` with the given mixins layered on.

    Args:
        base: The class to extend.
        mixins: Iterable of mixin classes, or None / empty for no mixins.
            Earlier entries end up earlier in the resulting MRO, so they take
            precedence over later entries and over ``base``.

    Returns:
        ``base`` itself when there are no mixins; otherwise the outermost of
        a chain of generated ``new_base`` subclasses, one per mixin.
    """
    combined = base

    # Wrap from the last mixin to the first, so the first mixin becomes the
    # outermost (highest-priority) parent. Working on a copy leaves the
    # caller's sequence unmodified.
    for mixin in reversed(list(mixins or [])):

        class new_base(mixin, combined):
            pass

        combined = new_base

    return combined


def renamed_agent(cls):
    """Return a subclass of ``cls`` that warns about the Agent => Trainer rename.

    The deprecated name shown in the warning is derived from ``cls.__name__``
    by replacing "Trainer" with "Agent".

    Args:
        cls: The class under its new (Trainer) name. Its ``__init__`` is
            called positionally with ``(config, env, logger_creator)``.

    Returns:
        A subclass of ``cls`` carrying the same ``__name__`` as ``cls``. Its
        constructor logs a warning through the module-level ``logger`` and
        then calls ``cls.__init__``.
    """

    class DeprecationWrapper(cls):
        def __init__(self, config=None, env=None, logger_creator=None):
            old_name = cls.__name__.replace("Trainer", "Agent")
            new_name = cls.__module__ + "." + cls.__name__
            # Use Logger.warning(): Logger.warn() is a deprecated alias that
            # itself triggers a DeprecationWarning on every call.
            logger.warning(
                "DeprecationWarning: {} has been renamed to {}. ".format(
                    old_name, new_name) +
                "This will raise an error in the future.")
            cls.__init__(self, config, env, logger_creator)

    # Keep the wrapper indistinguishable by name from the wrapped class.
    DeprecationWrapper.__name__ = cls.__name__

    return DeprecationWrapper


def try_import_tf():
    """Import TensorFlow if it is available, without making it required.

    If the ``RLLIB_TEST_NO_TF_IMPORT`` environment variable is present, no
    import is attempted and a warning is logged. Otherwise
    ``TF_CPP_MIN_LOG_LEVEL`` is set to "3" unless the environment already
    defines it, and the import is tried.

    Returns:
        ``tensorflow.compat.v1`` (with logging verbosity set to ERROR and v2
        behavior disabled) when that module can be imported; otherwise the
        plain ``tensorflow`` module; otherwise None.
    """
    if "RLLIB_TEST_NO_TF_IMPORT" in os.environ:
        logger.warning("Not importing TensorFlow for test purposes")
        return None

    # Respect a log level already chosen by the user.
    os.environ.setdefault("TF_CPP_MIN_LOG_LEVEL", "3")

    try:
        import tensorflow.compat.v1 as tf_v1
        tf_v1.logging.set_verbosity(tf_v1.logging.ERROR)
        tf_v1.disable_v2_behavior()
        return tf_v1
    except ImportError:
        # No compat.v1 module importable; try the top-level package below.
        pass

    try:
        import tensorflow
    except ImportError:
        return None
    return tensorflow


def try_import_tfp():
    """Import TensorFlow Probability if it is available.

    If the ``RLLIB_TEST_NO_TF_IMPORT`` environment variable is present, no
    import is attempted and a warning is logged.

    Returns:
        The ``tensorflow_probability`` module, or None when the import is
        skipped or raises ImportError.
    """
    if "RLLIB_TEST_NO_TF_IMPORT" in os.environ:
        logger.warning(
            "Not importing TensorFlow Probability for test purposes.")
        return None

    try:
        import tensorflow_probability
    except ImportError:
        return None
    return tensorflow_probability


# Public names exported by a star-import of this module. Lists the imported
# utilities re-exported here plus every public helper defined in this file.
__all__ = [
    "Filter",
    "FilterManager",
    "PolicyClient",
    "PolicyServer",
    "add_mixins",
    "merge_dicts",
    "deep_update",
    "renamed_agent",
    "renamed_class",
    "try_import_tf",
    "try_import_tfp",
]
[rllib] Rename Agent to Trainer (#4556) 2019-04-07 00:36:18 -07:00			`import logging`
[rllib] Remove dependency on TensorFlow (#4764) * remove hard tf dep * add test * comment fix * fix test 2019-05-10 20:36:18 -07:00			`import os`
[rllib] Rename Agent to Trainer (#4556) 2019-04-07 00:36:18 -07:00
[rllib] Evaluators and Optimizers Refactoring (#1339) 2017-12-30 00:24:54 -08:00			`from ray.rllib.utils.filter_manager import FilterManager`
[rllib] Document "v2" APIs (#2316) * re * wip * wip * a3c working * torch support * pg works * lint * rm v2 * consumer id * clean up pg * clean up more * fix python 2.7 * tf session management * docs * dqn wip * fix compile * dqn * apex runs * up * impotrs * ddpg * quotes * fix tests * fix last r * fix tests * lint * pass checkpoint restore * kwar * nits * policy graph * fix yapf * com * class * pyt * vectorization * update * test cpe * unit test * fix ddpg2 * changes * wip * args * faster test * common * fix * add alg option * batch mode and policy serving * multi serving test * todo * wip * serving test * doc async env * num envs * comments * thread * remove init hook * update * fix ppo * comments1 * fix * updates * add jenkins tests * fix * fix pytorch * fix * fixes * fix a3c policy * fix squeeze * fix trunc on apex * fix squeezing for real * update * remove horizon test for now * multiagent wip * update * fix race condition * fix ma * t * doc * st * wip * example * wip * working * cartpole * wip * batch wip * fix bug * make other_batches None default * working * debug * nit * warn * comments * fix ppo * fix obs filter * update * wip * tf * update * fix * cleanup * cleanup * spacing * model * fix * dqn * fix ddpg * doc * keep names * update * fix * com * docs * clarify model outputs * Update torch_policy_graph.py * fix obs filter * pass thru worker index * fix * rename * vlad torch comments * fix log action * debug name * fix lstm * remove unused ddpg net * remove conv net * revert lstm * wip * wip * cast * wip * works * fix a3c * works * lstm util test * doc * clean up * update * fix lstm check * move to end * fix sphinx * fix cmd * remove bad doc * envs * vec * doc prep * models * rl * alg * up * clarify * copy * async sa * fix * comments * fix a3c conf * tune lstm * fix reshape * fix * back to 16 * tuned a3c update * update * tuned * optional * merge * wip * fix up * move pg class * rename env * wip * update * tip * alg * readme * fix catalog * readme * doc * 
context * remove prep * comma * add env * link to paper * paper * update * rnn * update * wip * clean up ev creation * fix * fix * fix * fix lint * up * no comma * ma * Update run_multi_node_tests.sh * fix * sphinx is stupid * sphinx is stupid * clarify torch graph * no horizon * fix config * sb * Update test_optimizers.py 2018-07-01 00:05:08 -07:00			`from ray.rllib.utils.filter import Filter`
			`from ray.rllib.utils.policy_client import PolicyClient`
			`from ray.rllib.utils.policy_server import PolicyServer`
[tune] Support Configuration Merging (#3584) * merge configs * deep merge * lint * add resolve * test 2018-12-26 03:07:11 -08:00			`from ray.tune.util import merge_dicts, deep_update`
[rllib] Evaluators and Optimizers Refactoring (#1339) 2017-12-30 00:24:54 -08:00
[rllib] Rename Agent to Trainer (#4556) 2019-04-07 00:36:18 -07:00			`logger = logging.getLogger(__name__)`


[rllib] Rename PolicyGraph => Policy, move from evaluation/ to policy/ (#4819) This implements some of the renames proposed in #4813 We leave behind backwards-compatibility aliases for *PolicyGraph and SampleBatch. 2019-05-20 16:46:05 -07:00			`def renamed_class(cls, old_name):`
			`"""Helper class for renaming classes with a warning."""`

			`class DeprecationWrapper(cls):`
			`# note: **kw not supported for ray.remote classes`
			`def __init__(self, args, *kw):`
			`new_name = cls.__module__ + "." + cls.__name__`
			`logger.warn("DeprecationWarning: {} has been renamed to {}. ".`
			`format(old_name, new_name) +`
			`"This will raise an error in the future.")`
			`cls.__init__(self, args, *kw)`

			`DeprecationWrapper.__name__ = cls.__name__`

			`return DeprecationWrapper`


[rllib] Port remainder of algorithms to build_trainer() pattern (#4920) 2019-06-07 16:45:36 -07:00			`def add_mixins(base, mixins):`
			`"""Returns a new class with mixins applied in priority order."""`

			`mixins = list(mixins or [])`

			`while mixins:`

			`class new_base(mixins.pop(), base):`
			`pass`

			`base = new_base`

			`return base`


[rllib] Rename PolicyGraph => Policy, move from evaluation/ to policy/ (#4819) This implements some of the renames proposed in #4813 We leave behind backwards-compatibility aliases for *PolicyGraph and SampleBatch. 2019-05-20 16:46:05 -07:00			`def renamed_agent(cls):`
[rllib] Fix tune.run(Agent class) (#4630) * update * Update __init__.py 2019-04-15 09:12:23 -07:00			`"""Helper class for renaming Agent => Trainer with a warning."""`

[rllib] Rename Agent to Trainer (#4556) 2019-04-07 00:36:18 -07:00			`class DeprecationWrapper(cls):`
[rllib] Fix tune.run(Agent class) (#4630) * update * Update __init__.py 2019-04-15 09:12:23 -07:00			`def __init__(self, config=None, env=None, logger_creator=None):`
[rllib] Rename Agent to Trainer (#4556) 2019-04-07 00:36:18 -07:00			`old_name = cls.__name__.replace("Trainer", "Agent")`
[rllib] Rename PolicyGraph => Policy, move from evaluation/ to policy/ (#4819) This implements some of the renames proposed in #4813 We leave behind backwards-compatibility aliases for *PolicyGraph and SampleBatch. 2019-05-20 16:46:05 -07:00			`new_name = cls.__module__ + "." + cls.__name__`
[rllib] Rename Agent to Trainer (#4556) 2019-04-07 00:36:18 -07:00			`logger.warn("DeprecationWarning: {} has been renamed to {}. ".`
			`format(old_name, new_name) +`
			`"This will raise an error in the future.")`
[rllib] Fix tune.run(Agent class) (#4630) * update * Update __init__.py 2019-04-15 09:12:23 -07:00			`cls.__init__(self, config, env, logger_creator)`

			`DeprecationWrapper.__name__ = cls.__name__`
[rllib] Rename Agent to Trainer (#4556) 2019-04-07 00:36:18 -07:00
			`return DeprecationWrapper`


[rllib] Remove dependency on TensorFlow (#4764) * remove hard tf dep * add test * comment fix * fix test 2019-05-10 20:36:18 -07:00			`def try_import_tf():`
			`if "RLLIB_TEST_NO_TF_IMPORT" in os.environ:`
			`logger.warning("Not importing TensorFlow for test purposes")`
			`return None`

			`try:`
Reduce Ray / RLlib startup messages (#5368) 2019-08-05 13:23:54 -07:00			`if "TF_CPP_MIN_LOG_LEVEL" not in os.environ:`
			`os.environ["TF_CPP_MIN_LOG_LEVEL"] = "3"`
[rllib] TensorFlow 2 compatibility (#4802) 2019-05-16 22:12:07 -07:00			`import tensorflow.compat.v1 as tf`
Reduce Ray / RLlib startup messages (#5368) 2019-08-05 13:23:54 -07:00			`tf.logging.set_verbosity(tf.logging.ERROR)`
[rllib] TensorFlow 2 compatibility (#4802) 2019-05-16 22:12:07 -07:00			`tf.disable_v2_behavior()`
[rllib] Remove dependency on TensorFlow (#4764) * remove hard tf dep * add test * comment fix * fix test 2019-05-10 20:36:18 -07:00			`return tf`
			`except ImportError:`
[rllib] TensorFlow 2 compatibility (#4802) 2019-05-16 22:12:07 -07:00			`try:`
			`import tensorflow as tf`
			`return tf`
			`except ImportError:`
			`return None`
[rllib] Remove dependency on TensorFlow (#4764) * remove hard tf dep * add test * comment fix * fix test 2019-05-10 20:36:18 -07:00

[rllib] Feature/soft actor critic v2 (#5328) * Add base for Soft Actor-Critic * Pick changes from old SAC branch * Update sac.py * First implementation of sac model * Remove unnecessary SAC imports * Prune unnecessary noise and exploration code * Implement SAC model and use that in SAC policy * runs but doesn't learn * clear state * fix batch size * Add missing alpha grads and vars * -200 by 2k timesteps * doc * lazy squash * one file * ignore tfp * revert done 2019-08-01 23:37:36 -07:00			`def try_import_tfp():`
			`if "RLLIB_TEST_NO_TF_IMPORT" in os.environ:`
			`logger.warning(`
			`"Not importing TensorFlow Probability for test purposes.")`
			`return None`

			`try:`
			`import tensorflow_probability as tfp`
			`return tfp`
			`except ImportError:`
			`return None`


[tune] Support Configuration Merging (#3584) * merge configs * deep merge * lint * add resolve * test 2018-12-26 03:07:11 -08:00			`__all__ = [`
[rllib] Rename Agent to Trainer (#4556) 2019-04-07 00:36:18 -07:00			`"Filter",`
			`"FilterManager",`
			`"PolicyClient",`
			`"PolicyServer",`
			`"merge_dicts",`
			`"deep_update",`
			`"renamed_class",`
[rllib] Remove dependency on TensorFlow (#4764) * remove hard tf dep * add test * comment fix * fix test 2019-05-10 20:36:18 -07:00			`"try_import_tf",`
[tune] Support Configuration Merging (#3584) * merge configs * deep merge * lint * add resolve * test 2018-12-26 03:07:11 -08:00			`]`