ray/rllib/models/utils.py

from typing import Optional

from ray.rllib.utils.annotations import DeveloperAPI
from ray.rllib.utils.framework import try_import_jax, try_import_tf, try_import_torch


@DeveloperAPI
def get_activation_fn(name: Optional[str] = None, framework: str = "tf"):
    """Returns a framework specific activation function, given a name string.

    Args:
        name: One of "relu", "tanh", "elu", "swish", or "linear" (same as
            None, which is the default). For the tf frameworks, any attribute
            name of `tf.nn` is accepted. If a callable is passed in, it is
            returned unchanged.
        framework: One of "jax", "tf|tfe|tf2" or "torch".

    Returns:
        A framework-specific activation function, e.g. tf.nn.tanh or
            torch.nn.ReLU. None if name in ["linear", None].

    Raises:
        ValueError: If name is an unknown activation function.
    """
    # Already a callable, return as-is.
    if callable(name):
        return name

    # Infer the correct activation function from the string specifier.
    if framework == "torch":
        if name in ["linear", None]:
            return None
        if name == "swish":
            # Imported lazily so that non-torch users never touch torch_utils.
            from ray.rllib.utils.torch_utils import Swish

            return Swish
        _, nn = try_import_torch()
        if name == "relu":
            return nn.ReLU
        if name == "tanh":
            return nn.Tanh
        if name == "elu":
            return nn.ELU
    elif framework == "jax":
        if name in ["linear", None]:
            return None
        jax, _ = try_import_jax()
        if name == "swish":
            return jax.nn.swish
        if name == "relu":
            return jax.nn.relu
        if name == "tanh":
            # `jax.nn.hard_tanh` is a piecewise-linear clip to [-1, 1] and
            # not the tanh function that the torch and tf branches return
            # for the same name, so use the real tanh here.
            return jax.numpy.tanh
        if name == "elu":
            return jax.nn.elu
    else:
        assert framework in ["tf", "tfe", "tf2"], "Unsupported framework `{}`!".format(
            framework
        )
        if name in ["linear", None]:
            return None
        _, tf, _ = try_import_tf()
        # Any function exposed by `tf.nn` may be requested by name.
        fn = getattr(tf.nn, name, None)
        if fn is not None:
            return fn

    # Known framework, but no activation matched the given name.
    raise ValueError(
        "Unknown activation ({}) for framework={}!".format(name, framework)
    )


@DeveloperAPI
def get_filter_config(shape):
    """Returns a default Conv2D filter config (list) for a given image shape.

    The image size is matched against the first two dimensions of `shape`
    (e.g. (84, 84, 3)) or against the last two (e.g. (3, 84, 84)). Only
    2D and 3D shapes are considered.

    Args:
        shape (Tuple[int]): The input (image) shape, e.g. (84,84,3).

    Returns:
        List[list]: The Conv2D filter configuration usable as `conv_filters`
            inside a model config dict.

    Raises:
        ValueError: If no default configuration exists for `shape`.
    """
    # Keyed by image size. Built on every call so that each caller receives
    # fresh lists and may mutate the result freely.
    default_filters = {
        # VizdoomGym (large 480x640).
        (480, 640): [
            [16, [24, 32], [14, 18]],
            [32, [6, 6], 4],
            [256, [9, 9], 1],
        ],
        # VizdoomGym (small 240x320).
        (240, 320): [
            [16, [12, 16], [7, 9]],
            [32, [6, 6], 4],
            [256, [9, 9], 1],
        ],
        # 96x96x3 (e.g. CarRacing-v0).
        (96, 96): [
            [16, [8, 8], 4],
            [32, [4, 4], 2],
            [256, [11, 11], 2],
        ],
        # Atari.
        (84, 84): [
            [16, [8, 8], 4],
            [32, [4, 4], 2],
            [256, [11, 11], 1],
        ],
        # Small (1/2) Atari.
        (42, 42): [
            [16, [4, 4], 2],
            [32, [4, 4], 2],
            [256, [11, 11], 1],
        ],
        # Test image (10x10).
        (10, 10): [
            [16, [5, 5], 2],
            [32, [5, 5], 2],
        ],
    }

    shape = list(shape)
    if len(shape) in [2, 3]:
        for (height, width), filters in default_filters.items():
            image_dims = [height, width]
            # Match the image size at the front or at the back of the shape.
            if shape[:2] == image_dims or shape[1:] == image_dims:
                return filters

    # Derive the list of supported shapes from the table above, so the
    # message cannot get out of sync with the available defaults.
    supported = ", ".join(
        "[{}, {}, K]".format(height, width) for height, width in default_filters
    )
    raise ValueError(
        "No default configuration for obs shape {}".format(shape)
        + ", you must specify `conv_filters` manually as a model option. "
        "Default configurations are only available for inputs of the following "
        "shapes: {}. You may alternatively want to use a custom model or "
        "preprocessor.".format(supported)
    )


@DeveloperAPI
def get_initializer(name, framework="tf"):
    """Returns a framework specific initializer, given a name string.

    Args:
        name: One of "xavier_uniform" (same as None or "default") or
            "xavier_normal". If a callable is passed in, it is returned
            unchanged.
        framework: One of "jax", "tf|tfe|tf2" or "torch".

    Returns:
        A framework-specific initializer, e.g.
            tf.keras.initializers.GlorotUniform or
            torch.nn.init.xavier_uniform_. For "jax", the result of calling
            the flax factory (e.g. `flax.linen.initializers.xavier_uniform()`)
            is returned.

    Raises:
        ValueError: If name is an unknown initializer.
    """
    # Already a callable, return as-is.
    if callable(name):
        return name

    assert framework in [
        "jax",
        "torch",
        "tf",
        "tfe",
        "tf2",
    ], "Unsupported framework `{}`!".format(framework)

    # Validate the name before importing any framework, so that an unknown
    # name always yields the documented ValueError, whichever framework was
    # requested.
    if name in [None, "default", "xavier_uniform"]:
        uniform = True
    elif name == "xavier_normal":
        uniform = False
    else:
        raise ValueError(
            "Unknown initializer ({}) for framework={}!".format(name, framework)
        )

    if framework == "jax":
        _, flax = try_import_jax()
        assert flax is not None, "`flax` not installed. Try `pip install jax flax`."
        import flax.linen as nn

        factory = (
            nn.initializers.xavier_uniform
            if uniform
            else nn.initializers.xavier_normal
        )
        # The flax entries are factories; call them to get the initializer.
        return factory()

    if framework == "torch":
        _, nn = try_import_torch()
        assert nn is not None, "`torch` not installed. Try `pip install torch`."
        return nn.init.xavier_uniform_ if uniform else nn.init.xavier_normal_

    # Remaining frameworks are the tf variants ("tf", "tfe", "tf2").
    _, tf, _ = try_import_tf()
    assert (
        tf is not None
    ), "`tensorflow` not installed. Try `pip install tensorflow`."
    if uniform:
        return tf.keras.initializers.GlorotUniform
    return tf.keras.initializers.GlorotNormal
[RLlib] JAXPolicy prep PR #2 (move get_activation_fn (backward-compatibly), minor fixes and preparations). (#13091) 2020-12-30 22:30:52 -05:00			`from typing import Optional`

[api] Add API stability annotations for all RLlib symbols and add to LINT (#25060) 2022-05-24 22:14:25 -07:00			`from ray.rllib.utils.annotations import DeveloperAPI`
[RLlib] JAXPolicy prep PR #2 (move get_activation_fn (backward-compatibly), minor fixes and preparations). (#13091) 2020-12-30 22:30:52 -05:00			`from ray.rllib.utils.framework import try_import_jax, try_import_tf, try_import_torch`


[api] Add API stability annotations for all RLlib symbols and add to LINT (#25060) 2022-05-24 22:14:25 -07:00			`@DeveloperAPI`
[RLlib] JAXPolicy prep PR #2 (move get_activation_fn (backward-compatibly), minor fixes and preparations). (#13091) 2020-12-30 22:30:52 -05:00			`def get_activation_fn(name: Optional[str] = None, framework: str = "tf"):`
			`"""Returns a framework specific activation function, given a name string.`

			`Args:`
[RLlib Testing] Add A3C/APPO/BC/DDPPO/MARWIL/CQL/ES/ARS/TD3 to weekly learning tests. (#18381) 2021-09-07 11:48:41 +02:00			`name (Optional[str]): One of "relu" (default), "tanh", "elu",`
			`"swish", or "linear" (same as None).`
Clean up docstyle in python modules and add LINT rule (#25272) 2022-06-01 11:27:54 -07:00			`framework: One of "jax", "tf\|tfe\|tf2" or "torch".`
[RLlib] JAXPolicy prep PR #2 (move get_activation_fn (backward-compatibly), minor fixes and preparations). (#13091) 2020-12-30 22:30:52 -05:00
			`Returns:`
			`A framework-specific activation function. e.g. tf.nn.tanh or`
			`torch.nn.ReLU. None if name in ["linear", None].`

			`Raises:`
			`ValueError: If name is an unknown activation function.`
			`"""`
			`# Already a callable, return as-is.`
			`if callable(name):`
			`return name`

			`# Infer the correct activation function from the string specifier.`
			`if framework == "torch":`
			`if name in ["linear", None]:`
			`return None`
			`if name == "swish":`
[RLlib] Fix deprecated warning for torch_ops.py (soft-replaced by torch_utils.py). (#19982) 2021-11-03 10:00:46 +01:00			`from ray.rllib.utils.torch_utils import Swish`
[CI] Format Python code with Black (#21975) See #21316 and #21311 for the motivation behind these changes. 2022-01-29 18:41:57 -08:00
[RLlib] JAXPolicy prep PR #2 (move get_activation_fn (backward-compatibly), minor fixes and preparations). (#13091) 2020-12-30 22:30:52 -05:00			`return Swish`
			`_, nn = try_import_torch()`
			`if name == "relu":`
			`return nn.ReLU`
			`elif name == "tanh":`
			`return nn.Tanh`
[RLlib Testing] Add A3C/APPO/BC/DDPPO/MARWIL/CQL/ES/ARS/TD3 to weekly learning tests. (#18381) 2021-09-07 11:48:41 +02:00			`elif name == "elu":`
			`return nn.ELU`
[RLlib] JAXPolicy prep PR #2 (move get_activation_fn (backward-compatibly), minor fixes and preparations). (#13091) 2020-12-30 22:30:52 -05:00			`elif framework == "jax":`
			`if name in ["linear", None]:`
			`return None`
			`jax, _ = try_import_jax()`
			`if name == "swish":`
			`return jax.nn.swish`
			`if name == "relu":`
			`return jax.nn.relu`
			`elif name == "tanh":`
			`return jax.nn.hard_tanh`
[RLlib Testing] Add A3C/APPO/BC/DDPPO/MARWIL/CQL/ES/ARS/TD3 to weekly learning tests. (#18381) 2021-09-07 11:48:41 +02:00			`elif name == "elu":`
			`return jax.nn.elu`
[RLlib] JAXPolicy prep PR #2 (move get_activation_fn (backward-compatibly), minor fixes and preparations). (#13091) 2020-12-30 22:30:52 -05:00			`else:`
			assert framework in ["tf", "tfe", "tf2"], "Unsupported framework `{}`!".format(
			`framework`
			`)`
			`if name in ["linear", None]:`
			`return None`
			`tf1, tf, tfv = try_import_tf()`
			`fn = getattr(tf.nn, name, None)`
			`if fn is not None:`
			`return fn`

			`raise ValueError(`
			`"Unknown activation ({}) for framework={}!".format(name, framework)`
			`)`
[RLlib] ConvTranspose2D module (#11231) 2020-10-12 15:00:42 +02:00

[api] Add API stability annotations for all RLlib symbols and add to LINT (#25060) 2022-05-24 22:14:25 -07:00			`@DeveloperAPI`
[RLlib] Deprecate old classes, methods, functions, config keys (in prep for RLlib 1.0). (#10544) 2020-09-06 10:58:00 +02:00			`def get_filter_config(shape):`
			`"""Returns a default Conv2D filter config (list) for a given image shape.`

			`Args:`
			`shape (Tuple[int]): The input (image) shape, e.g. (84,84,3).`

			`Returns:`
			List[list]: The Conv2D filter configuration usable as `conv_filters`
			`inside a model config dict.`
			`"""`
[RLlib] Upgrade RLlib regression test scripts to new testing tool - RLlib release logs for 1.4. (#16080) 2021-06-01 17:39:18 +02:00			`# VizdoomGym (large 480x640).`
			`filters_480x640 = [`
			`[16, [24, 32], [14, 18]],`
			`[32, [6, 6], 4],`
			`[256, [9, 9], 1],`
			`]`
			`# VizdoomGym (small 240x320).`
			`filters_240x320 = [`
[RLlib] Unity3D example broken due to change in ML-Agents API. Attention-net prev-n-a/r. Attention-wrapper works with images. (#14569) 2021-03-12 18:27:25 +01:00			`[16, [12, 16], [7, 9]],`
			`[32, [6, 6], 4],`
			`[256, [9, 9], 1],`
			`]`
[RLlib] Discussion 4351: Conv2d default filter tests and add default setting for 96x96 image obs space. (#21560) 2022-01-13 18:50:42 +01:00			`# 96x96x3 (e.g. CarRacing-v0).`
			`filters_96x96 = [`
			`[16, [8, 8], 4],`
			`[32, [4, 4], 2],`
			`[256, [11, 11], 2],`
			`]`
[RLlib] Unity3D example broken due to change in ML-Agents API. Attention-net prev-n-a/r. Attention-wrapper works with images. (#14569) 2021-03-12 18:27:25 +01:00			`# Atari.`
[RLlib] Deprecate old classes, methods, functions, config keys (in prep for RLlib 1.0). (#10544) 2020-09-06 10:58:00 +02:00			`filters_84x84 = [`
			`[16, [8, 8], 4],`
			`[32, [4, 4], 2],`
			`[256, [11, 11], 1],`
			`]`
[RLlib] Unity3D example broken due to change in ML-Agents API. Attention-net prev-n-a/r. Attention-wrapper works with images. (#14569) 2021-03-12 18:27:25 +01:00			`# Small (1/2) Atari.`
[RLlib] Deprecate old classes, methods, functions, config keys (in prep for RLlib 1.0). (#10544) 2020-09-06 10:58:00 +02:00			`filters_42x42 = [`
			`[16, [4, 4], 2],`
			`[32, [4, 4], 2],`
			`[256, [11, 11], 1],`
			`]`
[RLlib] Switch off preprocessors by default for PGTrainer. (#21008) 2021-12-13 12:04:23 +01:00			`# Test image (10x10).`
			`filters_10x10 = [`
			`[16, [5, 5], 2],`
			`[32, [5, 5], 2],`
			`]`
[RLlib] Discussion 4351: Conv2d default filter tests and add default setting for 96x96 image obs space. (#21560) 2022-01-13 18:50:42 +01:00
			`shape = list(shape)`
[RLlib] Upgrade RLlib regression test scripts to new testing tool - RLlib release logs for 1.4. (#16080) 2021-06-01 17:39:18 +02:00			`if len(shape) in [2, 3] and (shape[:2] == [480, 640] or shape[1:] == [480, 640]):`
			`return filters_480x640`
			`elif len(shape) in [2, 3] and (shape[:2] == [240, 320] or shape[1:] == [240, 320]):`
			`return filters_240x320`
[RLlib] Discussion 4351: Conv2d default filter tests and add default setting for 96x96 image obs space. (#21560) 2022-01-13 18:50:42 +01:00			`elif len(shape) in [2, 3] and (shape[:2] == [96, 96] or shape[1:] == [96, 96]):`
			`return filters_96x96`
[RLlib] Unity3D example broken due to change in ML-Agents API. Attention-net prev-n-a/r. Attention-wrapper works with images. (#14569) 2021-03-12 18:27:25 +01:00			`elif len(shape) in [2, 3] and (shape[:2] == [84, 84] or shape[1:] == [84, 84]):`
[RLlib] Deprecate old classes, methods, functions, config keys (in prep for RLlib 1.0). (#10544) 2020-09-06 10:58:00 +02:00			`return filters_84x84`
[RLlib] Trajectory View API: Atari framestacking. (#13315) 2021-01-13 08:53:34 +01:00			`elif len(shape) in [2, 3] and (shape[:2] == [42, 42] or shape[1:] == [42, 42]):`
[RLlib] Deprecate old classes, methods, functions, config keys (in prep for RLlib 1.0). (#10544) 2020-09-06 10:58:00 +02:00			`return filters_42x42`
[RLlib] Switch off preprocessors by default for PGTrainer. (#21008) 2021-12-13 12:04:23 +01:00			`elif len(shape) in [2, 3] and (shape[:2] == [10, 10] or shape[1:] == [10, 10]):`
			`return filters_10x10`
[RLlib] Deprecate old classes, methods, functions, config keys (in prep for RLlib 1.0). (#10544) 2020-09-06 10:58:00 +02:00			`else:`
			`raise ValueError(`
			`"No default configuration for obs shape {}".format(shape)`
			+ ", you must specify `conv_filters` manually as a model option. "
[RLlib] Issue 25401: Faulty usage of get_filter_config in ComplexInputNetworks (#25493) 2022-06-06 13:04:17 +02:00			`"Default configurations are only available for inputs of the following "`
			`"shapes: [42, 42, K], [84, 84, K], [10, 10, K], [240, 320, K] and "`
			`" [480, 640, K]. You may "`
			`"alternatively "`
			`"want "`
[RLlib] Deprecate old classes, methods, functions, config keys (in prep for RLlib 1.0). (#10544) 2020-09-06 10:58:00 +02:00			`"to use a custom model or preprocessor."`
			`)`
[RLlib] ConvTranspose2D module (#11231) 2020-10-12 15:00:42 +02:00

[api] Add API stability annotations for all RLlib symbols and add to LINT (#25060) 2022-05-24 22:14:25 -07:00			`@DeveloperAPI`
[RLlib] ConvTranspose2D module (#11231) 2020-10-12 15:00:42 +02:00			`def get_initializer(name, framework="tf"):`
			`"""Returns a framework specific initializer, given a name string.`

			`Args:`
Clean up docstyle in python modules and add LINT rule (#25272) 2022-06-01 11:27:54 -07:00			`name: One of "xavier_uniform" (default), "xavier_normal".`
			`framework: One of "jax", "tf\|tfe\|tf2" or "torch".`
[RLlib] ConvTranspose2D module (#11231) 2020-10-12 15:00:42 +02:00
			`Returns:`
			`A framework-specific initializer function, e.g.`
			`tf.keras.initializers.GlorotUniform or`
			`torch.nn.init.xavier_uniform_.`

			`Raises:`
			`ValueError: If name is an unknown initializer.`
			`"""`
[RLlib] JAXPolicy prep PR #2 (move get_activation_fn (backward-compatibly), minor fixes and preparations). (#13091) 2020-12-30 22:30:52 -05:00			`# Already a callable, return as-is.`
			`if callable(name):`
			`return name`

			`if framework == "jax":`
			`_, flax = try_import_jax()`
			assert flax is not None, "`flax` not installed. Try `pip install jax flax`."
			`import flax.linen as nn`
[CI] Format Python code with Black (#21975) See #21316 and #21311 for the motivation behind these changes. 2022-01-29 18:41:57 -08:00
[RLlib] JAXPolicy prep PR #2 (move get_activation_fn (backward-compatibly), minor fixes and preparations). (#13091) 2020-12-30 22:30:52 -05:00			`if name in [None, "default", "xavier_uniform"]:`
			`return nn.initializers.xavier_uniform()`
			`elif name == "xavier_normal":`
			`return nn.initializers.xavier_normal()`
[RLlib] ConvTranspose2D module (#11231) 2020-10-12 15:00:42 +02:00			`if framework == "torch":`
			`_, nn = try_import_torch()`
[RLlib] JAXPolicy prep PR #2 (move get_activation_fn (backward-compatibly), minor fixes and preparations). (#13091) 2020-12-30 22:30:52 -05:00			assert nn is not None, "`torch` not installed. Try `pip install torch`."
[RLlib] ConvTranspose2D module (#11231) 2020-10-12 15:00:42 +02:00			`if name in [None, "default", "xavier_uniform"]:`
			`return nn.init.xavier_uniform_`
			`elif name == "xavier_normal":`
			`return nn.init.xavier_normal_`
			`else:`
[RLlib] JAXPolicy prep PR #2 (move get_activation_fn (backward-compatibly), minor fixes and preparations). (#13091) 2020-12-30 22:30:52 -05:00			assert framework in ["tf", "tfe", "tf2"], "Unsupported framework `{}`!".format(
			`framework`
			`)`
[RLlib] ConvTranspose2D module (#11231) 2020-10-12 15:00:42 +02:00			`tf1, tf, tfv = try_import_tf()`
[RLlib] JAXPolicy prep PR #2 (move get_activation_fn (backward-compatibly), minor fixes and preparations). (#13091) 2020-12-30 22:30:52 -05:00			`assert (`
			`tf is not None`
			), "`tensorflow` not installed. Try `pip install tensorflow`."
[RLlib] ConvTranspose2D module (#11231) 2020-10-12 15:00:42 +02:00			`if name in [None, "default", "xavier_uniform"]:`
			`return tf.keras.initializers.GlorotUniform`
			`elif name == "xavier_normal":`
			`return tf.keras.initializers.GlorotNormal`

			`raise ValueError(`
			`"Unknown activation ({}) for framework={}!".format(name, framework)`
			`)`