ray/rllib/utils/test_utils.py

import logging
import numpy as np

from ray.rllib.utils.framework import try_import_tf, try_import_torch

# TensorFlow is optional; the code below treats a falsy `tf` as
# "not installed".
tf = try_import_tf()
# Always bind `eager_mode`, so the name exists (as None) even when TensorFlow
# is missing or does not expose the eager context helper.
eager_mode = None
if tf:
    try:
        from tensorflow.python.eager.context import eager_mode
    # ModuleNotFoundError is a subclass of ImportError, so catching
    # ImportError covers both.
    except ImportError:
        pass

# PyTorch is optional as well; only the first returned element is needed here.
torch, _ = try_import_torch()

logger = logging.getLogger(__name__)


def framework_iterator(config=None,
                       frameworks=("tf", "eager", "torch"),
                       session=False):
    """A generator that allows for looping through n frameworks for testing.

    Provides the correct config entries ("use_pytorch" and "eager") as well
    as the correct eager/non-eager contexts for tf.

    Any tf session / eager context entered for an iteration is exited again
    when the iteration ends, including when the consumer raises inside the
    loop body or abandons the generator early.

    Args:
        config (Optional[dict]): An optional config dict to alter in place
            depending on the iteration. Its "eager" and "use_pytorch" keys
            are overwritten on every iteration. If None, a throw-away dict
            is used.
        frameworks (Union[str, Tuple[str]]): A single framework name or a
            list/tuple of the frameworks to be tested.
            Allowed are: "tf", "eager", and "torch".
        session (bool): If True, enter a tf.Session() and yield that as
            well in the tf-case (otherwise, yield (fw, None)).

    Yields:
        str: If `session` is False:
            The current framework ("tf", "eager", "torch") used.
        Tuple(str, Union[None, tf.Session]): If `session` is not False:
            A tuple of the current fw and the tf.Session if fw="tf"
            (None for all other frameworks).
    """
    # Only substitute a fresh dict when no config was passed. Using
    # `config or {}` would also replace a caller-provided empty dict, and the
    # caller would then never see the in-place changes.
    if config is None:
        config = {}
    frameworks = [frameworks] if isinstance(frameworks, str) else frameworks

    for fw in frameworks:
        # Skip non-installed frameworks.
        if fw == "torch" and not torch:
            logger.warning(
                "framework_iterator skipping torch (not installed)!")
            continue
        if fw != "torch" and not tf:
            logger.warning("framework_iterator skipping {} (tf not "
                           "installed)!".format(fw))
            continue
        elif fw == "eager" and not eager_mode:
            logger.warning("framework_iterator skipping eager (could not "
                           "import `eager_mode` from tensorflow.python)!")
            continue
        assert fw in ["tf", "eager", "torch", None]

        # Do we need a test session?
        sess = None
        if fw == "tf" and session is True:
            sess = tf.Session()
            sess.__enter__()

        eager_ctx = None
        try:
            print("framework={}".format(fw))

            config["eager"] = fw == "eager"
            config["use_pytorch"] = fw == "torch"

            if fw == "eager":
                ctx = eager_mode()
                ctx.__enter__()
                # Only remember the context once it has been entered, so
                # that the cleanup below never exits a non-entered context.
                eager_ctx = ctx
                assert tf.executing_eagerly()
            elif fw == "tf":
                assert not tf.executing_eagerly()

            yield fw if session is False else (fw, sess)
        finally:
            # Exit any context we may have entered. This also runs when the
            # consumer raises at the `yield` or the generator gets closed.
            if eager_ctx is not None:
                eager_ctx.__exit__(None, None, None)
            elif sess is not None:
                sess.__exit__(None, None, None)


def _assert_outcome(assertion, x, y, false):
    """Runs `assertion` and interprets its outcome according to `false`.

    Args:
        assertion (callable): Zero-argument callable that raises an
            AssertionError iff x and y do NOT match.
        x (any): The checked value (only used for the error message).
        y (any): The expected value (only used for the error message).
        false (bool): If False, a mismatch is an error (the original
            AssertionError is re-raised). If True, a match is an error.

    Raises:
        AssertionError: If the outcome contradicts `false`.
    """
    try:
        assertion()
    # Both values are not equal.
    except AssertionError:
        # Raise error in normal case.
        if false is False:
            raise
    # Both values are equal.
    else:
        # If false is set -> raise error (not expected to be equal).
        # This must live in the `else` clause: raising it inside the `try`
        # body would get it swallowed by the `except` above.
        if false is True:
            raise AssertionError(
                "ERROR: x ({}) is the same as y ({})!".format(x, y))


def check(x, y, decimals=5, atol=None, rtol=None, false=False):
    """
    Checks two structures (dict, tuple, list,
    np.array, float, int, etc..) for (almost) numeric identity.
    All numbers in the two structures have to match up to `decimals` digits
    after the floating point. Uses assertions.

    Containers are compared recursively: dicts must have exactly the same
    keys, tuples/lists must have the same length. These structural
    requirements are enforced regardless of `false`.

    Args:
        x (any): The value to be compared (to the expectation: `y`). This
            may be a Tensor.
        y (any): The expected value to be compared to `x`. This must not
            be a tf Tensor.
        decimals (int): The number of digits after the floating point up to
            which all numeric values have to match.
        atol (float): Absolute tolerance of the difference between x and y
            (overrides `decimals` if given).
        rtol (float): Relative tolerance of the difference between x and y
            (overrides `decimals` if given).
        false (bool): Whether to check that x and y are NOT the same.

    Raises:
        AssertionError: If the check fails.
        ValueError: If `y` is a tf.Tensor.
    """
    # A dict type.
    if isinstance(x, dict):
        assert isinstance(y, dict), \
            "ERROR: If x is dict, y needs to be a dict as well!"
        # Start from y's keys and tick off every key also found in x;
        # whatever remains afterwards only exists in y.
        y_keys = set(y.keys())
        for key, value in x.items():
            assert key in y, \
                "ERROR: y does not have x's key='{}'! y={}".format(key, y)
            check(
                value,
                y[key],
                decimals=decimals,
                atol=atol,
                rtol=rtol,
                false=false)
            y_keys.remove(key)
        assert not y_keys, \
            "ERROR: y contains keys ({}) that are not in x! y={}".\
            format(list(y_keys), y)
    # A tuple type.
    elif isinstance(x, (tuple, list)):
        assert isinstance(y, (tuple, list)),\
            "ERROR: If x is tuple, y needs to be a tuple as well!"
        assert len(y) == len(x),\
            "ERROR: y does not have the same length as x ({} vs {})!".\
            format(len(y), len(x))
        for i, value in enumerate(x):
            check(
                value,
                y[i],
                decimals=decimals,
                atol=atol,
                rtol=rtol,
                false=false)
    # Boolean comparison (must come before the int case below, as bool is a
    # subclass of int).
    elif isinstance(x, (np.bool_, bool)):
        if false is True:
            assert bool(x) is not bool(y), \
                "ERROR: x ({}) is y ({})!".format(x, y)
        else:
            assert bool(x) is bool(y), \
                "ERROR: x ({}) is not y ({})!".format(x, y)
    # Nones or primitives.
    elif x is None or y is None or isinstance(x, (str, int)):
        if false is True:
            assert x != y, "ERROR: x ({}) is the same as y ({})!".format(x, y)
        else:
            assert x == y, \
                "ERROR: x ({}) is not the same as y ({})!".format(x, y)
    # String comparison (object arrays).
    # `np.object` was only an alias for the builtin `object` and no longer
    # exists in recent NumPy versions; compare against `object` directly.
    elif hasattr(x, "dtype") and x.dtype == object:
        _assert_outcome(lambda: np.testing.assert_array_equal(x, y), x, y,
                        false)
    # Everything else (assume numeric or tf/torch.Tensor).
    else:
        if tf is not None:
            # y should never be a Tensor (y=expected value).
            if isinstance(y, tf.Tensor):
                raise ValueError("`y` (expected value) must not be a Tensor. "
                                 "Use numpy.ndarray instead")
            if isinstance(x, tf.Tensor):
                # In eager mode, numpyize tensors.
                if tf.executing_eagerly():
                    x = x.numpy()
                # Otherwise, use a quick tf-session and re-run the check on
                # the fetched value.
                else:
                    with tf.Session() as sess:
                        x = sess.run(x)
                        return check(
                            x,
                            y,
                            decimals=decimals,
                            atol=atol,
                            rtol=rtol,
                            false=false)
        if torch is not None:
            # `.cpu()` is a no-op for CPU tensors and makes the numpy
            # conversion work for tensors living on other devices as well.
            if isinstance(x, torch.Tensor):
                x = x.detach().cpu().numpy()
            if isinstance(y, torch.Tensor):
                y = y.detach().cpu().numpy()

        # Using decimals.
        if atol is None and rtol is None:
            _assert_outcome(
                lambda: np.testing.assert_almost_equal(
                    x, y, decimal=decimals), x, y, false)
        # Using atol/rtol.
        else:
            # Provide defaults for either one of atol/rtol.
            if atol is None:
                atol = 0
            if rtol is None:
                rtol = 1e-7
            _assert_outcome(
                lambda: np.testing.assert_allclose(
                    x, y, atol=atol, rtol=rtol), x, y, false)
[RLlib] Add testing framework_iterator. (#7852) * Add testing framework_iterator. * LINT. * WIP. * Fix and LINT. * LINT fix. 2020-04-03 21:24:25 +02:00			`import logging`
Get utils ready for better Agent torch support. (#6561) 2019-12-30 15:27:32 -05:00			`import numpy as np`

[RLlib] Exploration API: merge deterministic flag with exploration classes (SoftQ and StochasticSampling). (#7155) 2020-02-19 21:18:45 +01:00			`from ray.rllib.utils.framework import try_import_tf, try_import_torch`
Get utils ready for better Agent torch support. (#6561) 2019-12-30 15:27:32 -05:00
			`tf = try_import_tf()`
[RLlib] Add testing framework_iterator. (#7852) * Add testing framework_iterator. * LINT. * WIP. * Fix and LINT. * LINT fix. 2020-04-03 21:24:25 +02:00			`if tf:`
			`eager_mode = None`
			`try:`
			`from tensorflow.python.eager.context import eager_mode`
			`except (ImportError, ModuleNotFoundError):`
			`pass`

[RLlib] Exploration API: merge deterministic flag with exploration classes (SoftQ and StochasticSampling). (#7155) 2020-02-19 21:18:45 +01:00			`torch, _ = try_import_torch()`
Get utils ready for better Agent torch support. (#6561) 2019-12-30 15:27:32 -05:00
[RLlib] Add testing framework_iterator. (#7852) * Add testing framework_iterator. * LINT. * WIP. * Fix and LINT. * LINT fix. 2020-04-03 21:24:25 +02:00			`logger = logging.getLogger(__name__)`


			`def framework_iterator(config=None,`
			`frameworks=("tf", "eager", "torch"),`
			`session=False):`
			`"""An generator that allows for looping through n frameworks for testing.`

			`Provides the correct config entries ("use_pytorch" and "eager") as well`
			`as the correct eager/non-eager contexts for tf.`

			`Args:`
			`config (Optional[dict]): An optional config dict to alter in place`
			`depending on the iteration.`
			`frameworks (Tuple[str]): A list/tuple of the frameworks to be tested.`
			`Allowed are: "tf", "eager", and "torch".`
			`session (bool): If True, enter a tf.Session() and yield that as`
			`well in the tf-case (otherwise, yield (fw, None)).`

			`Yields:`
			`str: If enter_session is False:`
			`The current framework ("tf", "eager", "torch") used.`
			`Tuple(str, Union[None,tf.Session]: If enter_session is True:`
			`A tuple of the current fw and the tf.Session if fw="tf".`
			`"""`
			`config = config or {}`
			`frameworks = [frameworks] if isinstance(frameworks, str) else frameworks`

			`for fw in frameworks:`
			`# Skip non-installed frameworks.`
			`if fw == "torch" and not torch:`
			`logger.warning(`
			`"framework_iterator skipping torch (not installed)!")`
			`continue`
[RLlib] IMPALA PyTorch (#8287) This PR adds an IMPALA PyTorch implementation. - adds compilation tests for LSTM and w/o LSTM. - adds learning test for CartPole. 2020-05-03 13:44:25 +02:00			`if fw != "torch" and not tf:`
[RLlib] Add testing framework_iterator. (#7852) * Add testing framework_iterator. * LINT. * WIP. * Fix and LINT. * LINT fix. 2020-04-03 21:24:25 +02:00			`logger.warning("framework_iterator skipping {} (tf not "`
			`"installed)!".format(fw))`
			`continue`
			`elif fw == "eager" and not eager_mode:`
			`logger.warning("framework_iterator skipping eager (could not "`
			"import `eager_mode` from tensorflow.python)!")
			`continue`
			`assert fw in ["tf", "eager", "torch", None]`

			`# Do we need a test session?`
			`sess = None`
			`if fw == "tf" and session is True:`
			`sess = tf.Session()`
			`sess.__enter__()`

			`print("framework={}".format(fw))`

			`config["eager"] = fw == "eager"`
			`config["use_pytorch"] = fw == "torch"`

			`eager_ctx = None`
			`if fw == "eager":`
			`eager_ctx = eager_mode()`
			`eager_ctx.__enter__()`
			`assert tf.executing_eagerly()`
			`elif fw == "tf":`
			`assert not tf.executing_eagerly()`

			`yield fw if session is False else (fw, sess)`

			`# Exit any context we may have entered.`
			`if eager_ctx:`
			`eager_ctx.__exit__(None, None, None)`
			`elif sess:`
			`sess.__exit__(None, None, None)`

Get utils ready for better Agent torch support. (#6561) 2019-12-30 15:27:32 -05:00
			`def check(x, y, decimals=5, atol=None, rtol=None, false=False):`
			`"""`
			`Checks two structures (dict, tuple, list,`
			`np.array, float, int, etc..) for (almost) numeric identity.`
			All numbers in the two structures have to match up to `decimal` digits
			`after the floating point. Uses assertions.`

			`Args:`
[RLlib] Experiment with py_func as a means to further unify tf and torch (Schedule classes). (#6951) 2020-01-30 20:27:57 +01:00			x (any): The value to be compared (to the expectation: `y`). This
			`may be a Tensor.`
			y (any): The expected value to be compared to `x`. This must not
			`be a Tensor.`
Get utils ready for better Agent torch support. (#6561) 2019-12-30 15:27:32 -05:00			`decimals (int): The number of digits after the floating point up to`
			`which all numeric values have to match.`
			`atol (float): Absolute tolerance of the difference between x and y`
			(overrides `decimals` if given).
			`rtol (float): Relative tolerance of the difference between x and y`
			(overrides `decimals` if given).
			`false (bool): Whether to check that x and y are NOT the same.`
			`"""`
			`# A dict type.`
			`if isinstance(x, dict):`
			`assert isinstance(y, dict), \`
			`"ERROR: If x is dict, y needs to be a dict as well!"`
			`y_keys = set(x.keys())`
			`for key, value in x.items():`
			`assert key in y, \`
			`"ERROR: y does not have x's key='{}'! y={}".format(key, y)`
[RLlib] from_config util method for framework agnostic components; start moving RLlib tests into Bazel. (#6865) 2020-01-23 02:02:58 +01:00			`check(`
			`value,`
			`y[key],`
			`decimals=decimals,`
			`atol=atol,`
			`rtol=rtol,`
			`false=false)`
Get utils ready for better Agent torch support. (#6561) 2019-12-30 15:27:32 -05:00			`y_keys.remove(key)`
			`assert not y_keys, \`
			`"ERROR: y contains keys ({}) that are not in x! y={}".\`
			`format(list(y_keys), y)`
			`# A tuple type.`
			`elif isinstance(x, (tuple, list)):`
			`assert isinstance(y, (tuple, list)),\`
			`"ERROR: If x is tuple, y needs to be a tuple as well!"`
			`assert len(y) == len(x),\`
			`"ERROR: y does not have the same length as x ({} vs {})!".\`
			`format(len(y), len(x))`
			`for i, value in enumerate(x):`
[RLlib] from_config util method for framework agnostic components; start moving RLlib tests into Bazel. (#6865) 2020-01-23 02:02:58 +01:00			`check(`
			`value,`
			`y[i],`
			`decimals=decimals,`
			`atol=atol,`
			`rtol=rtol,`
			`false=false)`
Get utils ready for better Agent torch support. (#6561) 2019-12-30 15:27:32 -05:00			`# Boolean comparison.`
			`elif isinstance(x, (np.bool_, bool)):`
			`if false is True:`
			`assert bool(x) is not bool(y), \`
			`"ERROR: x ({}) is y ({})!".format(x, y)`
			`else:`
			`assert bool(x) is bool(y), \`
			`"ERROR: x ({}) is not y ({})!".format(x, y)`
[RLlib] from_config util method for framework agnostic components; start moving RLlib tests into Bazel. (#6865) 2020-01-23 02:02:58 +01:00			`# Nones or primitives.`
[RLlib] Schedule-classes multi-framework support. (#6926) 2020-01-28 20:07:55 +01:00			`elif x is None or y is None or isinstance(x, (str, int)):`
Get utils ready for better Agent torch support. (#6561) 2019-12-30 15:27:32 -05:00			`if false is True:`
			`assert x != y, "ERROR: x ({}) is the same as y ({})!".format(x, y)`
			`else:`
			`assert x == y, \`
			`"ERROR: x ({}) is not the same as y ({})!".format(x, y)`
			`# String comparison.`
			`elif hasattr(x, "dtype") and x.dtype == np.object:`
			`try:`
			`np.testing.assert_array_equal(x, y)`
			`if false is True:`
			`assert False, \`
			`"ERROR: x ({}) is the same as y ({})!".format(x, y)`
			`except AssertionError as e:`
			`if false is False:`
			`raise e`
[RLlib] Exploration API: merge deterministic flag with exploration classes (SoftQ and StochasticSampling). (#7155) 2020-02-19 21:18:45 +01:00			`# Everything else (assume numeric or tf/torch.Tensor).`
Get utils ready for better Agent torch support. (#6561) 2019-12-30 15:27:32 -05:00			`else:`
[RLlib] Experiment with py_func as a means to further unify tf and torch (Schedule classes). (#6951) 2020-01-30 20:27:57 +01:00			`if tf is not None:`
			`# y should never be a Tensor (y=expected value).`
			`if isinstance(y, tf.Tensor):`
			raise ValueError("`y` (expected value) must not be a Tensor. "
			`"Use numpy.ndarray instead")`
			`if isinstance(x, tf.Tensor):`
			`# In eager mode, numpyize tensors.`
			`if tf.executing_eagerly():`
			`x = x.numpy()`
[RLlib] Exploration API: merge deterministic flag with exploration classes (SoftQ and StochasticSampling). (#7155) 2020-02-19 21:18:45 +01:00			`# Otherwise, use a quick tf-session.`
[RLlib] Experiment with py_func as a means to further unify tf and torch (Schedule classes). (#6951) 2020-01-30 20:27:57 +01:00			`else:`
			`with tf.Session() as sess:`
			`x = sess.run(x)`
[RLlib] PPO torch memory leak and unnecessary torch.Tensor creation and gc'ing. (#7238) * Take out stats to analyze memory leak in torch PPO. * WIP * WIP * WIP * WIP * WIP * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * LINT. * Fix determine_tests_to_run.py. * minor change to re-test after determine_tests_to_run.py. * LINT. * update comments. * WIP * WIP * WIP * FIX. * Fix sequence_mask being dependent on torch being installed. * Fix strange ray-core tf-error in test_memory_scheduling test case. * Fix strange ray-core tf-error in test_memory_scheduling test case. * Fix strange ray-core tf-error in test_memory_scheduling test case. * Fix strange ray-core tf-error in test_memory_scheduling test case. 2020-02-22 20:02:31 +01:00			`return check(`
[RLlib] Experiment with py_func as a means to further unify tf and torch (Schedule classes). (#6951) 2020-01-30 20:27:57 +01:00			`x,`
			`y,`
			`decimals=decimals,`
			`atol=atol,`
			`rtol=rtol,`
			`false=false)`
[RLlib] Exploration API: merge deterministic flag with exploration classes (SoftQ and StochasticSampling). (#7155) 2020-02-19 21:18:45 +01:00			`if torch is not None:`
			`if isinstance(x, torch.Tensor):`
[RLlib] DQN torch version. (#7597) * Fix. * Rollback. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * WIP. * Fix. * Fix. * Fix. * Fix. * Fix. * WIP. * WIP. * Fix. * Test case fixes. * Test case fixes and LINT. * Test case fixes and LINT. * Rollback. * WIP. * WIP. * Test case fixes. * Fix. * Fix. * Fix. * Add regression test for DQN w/ param noise. * Fixes and LINT. * Fixes and LINT. * Fixes and LINT. * Fixes and LINT. * Fixes and LINT. * Comment * Regression test case. * WIP. * WIP. * LINT. * LINT. * WIP. * Fix. * Fix. * Fix. * LINT. * Fix (SAC does currently not support eager). * Fix. * WIP. * LINT. * Update rllib/evaluation/sampler.py Co-Authored-By: Eric Liang <ekhliang@gmail.com> * Update rllib/evaluation/sampler.py Co-Authored-By: Eric Liang <ekhliang@gmail.com> * Update rllib/utils/exploration/exploration.py Co-Authored-By: Eric Liang <ekhliang@gmail.com> * Update rllib/utils/exploration/exploration.py Co-Authored-By: Eric Liang <ekhliang@gmail.com> * WIP. * WIP. * Fix. * LINT. * LINT. * Fix and LINT. * WIP. * WIP. * WIP. * WIP. * Fix. * LINT. * Fix. * Fix and LINT. * Update rllib/utils/exploration/exploration.py * Update rllib/policy/dynamic_tf_policy.py Co-Authored-By: Eric Liang <ekhliang@gmail.com> * Update rllib/policy/dynamic_tf_policy.py Co-Authored-By: Eric Liang <ekhliang@gmail.com> * Update rllib/policy/dynamic_tf_policy.py Co-Authored-By: Eric Liang <ekhliang@gmail.com> * Fixes. * WIP. * LINT. * Fixes and LINT. * LINT and fixes. * LINT. * Move action_dist back into torch extra_action_out_fn and LINT. * Working SimpleQ learning cartpole on both torch AND tf. * Working Rainbow learning cartpole on tf. * Working Rainbow learning cartpole on tf. * WIP. * LINT. * LINT. * Update docs and add torch to APEX test. * LINT. * Fix. * LINT. * Fix. * Fix. * Fix and docstrings. * Fix broken RLlib tests in master. * Split BAZEL learning tests into cartpole and pendulum (reached the 60min barrier). * Fix error_outputs option in BAZEL for RLlib regression tests. 
* Fix. * Tune param-noise tests. * LINT. * Fix. * Fix. * test * test * test * Fix. * Fix. * WIP. * WIP. * WIP. * WIP. * LINT. * WIP. Co-authored-by: Eric Liang <ekhliang@gmail.com> 2020-04-06 20:56:16 +02:00			`x = x.detach().numpy()`
			`if isinstance(y, torch.Tensor):`
			`y = y.detach().numpy()`
Get utils ready for better Agent torch support. (#6561) 2019-12-30 15:27:32 -05:00
			`# Using decimals.`
			`if atol is None and rtol is None:`
[RLlib] Exploration API: ParamNoise Integration into DQN; working example/test cases. (#7814) 2020-04-03 19:44:25 +02:00			`# Assert equality of both values.`
Get utils ready for better Agent torch support. (#6561) 2019-12-30 15:27:32 -05:00			`try:`
			`np.testing.assert_almost_equal(x, y, decimal=decimals)`
[RLlib] Exploration API: ParamNoise Integration into DQN; working example/test cases. (#7814) 2020-04-03 19:44:25 +02:00			`# Both values are not equal.`
Get utils ready for better Agent torch support. (#6561) 2019-12-30 15:27:32 -05:00			`except AssertionError as e:`
[RLlib] Exploration API: ParamNoise Integration into DQN; working example/test cases. (#7814) 2020-04-03 19:44:25 +02:00			`# Raise error in normal case.`
Get utils ready for better Agent torch support. (#6561) 2019-12-30 15:27:32 -05:00			`if false is False:`
			`raise e`
[RLlib] Exploration API: ParamNoise Integration into DQN; working example/test cases. (#7814) 2020-04-03 19:44:25 +02:00			`# Both values are equal.`
			`else:`
			`# If false is set -> raise error (not expected to be equal).`
			`if false is True:`
			`assert False, \`
			`"ERROR: x ({}) is the same as y ({})!".format(x, y)`
Get utils ready for better Agent torch support. (#6561) 2019-12-30 15:27:32 -05:00
			`# Using atol/rtol.`
			`else:`
			`# Provide defaults for either one of atol/rtol.`
			`if atol is None:`
			`atol = 0`
			`if rtol is None:`
			`rtol = 1e-7`
			`try:`
			`np.testing.assert_allclose(x, y, atol=atol, rtol=rtol)`
			`except AssertionError as e:`
			`if false is False:`
			`raise e`
[RLlib] Exploration API: ParamNoise Integration into DQN; working example/test cases. (#7814) 2020-04-03 19:44:25 +02:00			`else:`
			`if false is True:`
			`assert False, \`
			`"ERROR: x ({}) is the same as y ({})!".format(x, y)`