Source code for rlgraph.components.neural_networks.neural_network

# Copyright 2018 The RLgraph authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

from rlgraph import get_backend
from rlgraph.components import Component
from rlgraph.components.neural_networks.stack import Stack
from rlgraph.components.layers.nn.lstm_layer import LSTMLayer
from rlgraph.utils import force_tuple, force_list
from rlgraph.utils.decorators import rlgraph_api

if get_backend() == "pytorch":
    import torch


[docs]class NeuralNetwork(Stack):
    """
    A NeuralNetwork is a Stack, in which the apply method is defined either by custom-API-method OR by connecting
    through all sub-Components' `apply` methods.
    In both cases, a dict should be returned with at least the `output` key set. Possible further keys could
    be `last_internal_states` for RNN-based NNs and other keys.
    """

    def __init__(self, *layers, **kwargs):
        """
        Args:
            *layers (Component): Same as `sub_components` argument of Stack. Can be used to add Layer Components
                (or any other Components) to this Network.

        Keyword Args:
            layers (Optional[list]): An optional list of Layer objects or spec-dicts to overwrite(!)
                *layers.
        """
        # Network object for fast-path execution where we do not repeatedely call `call` between layers.
        # self.network_obj = None

        # In case layers come in via a spec dict -> push it into *layers.
        layers_args = kwargs.pop("layers", layers)
        # Add a default scope (if not given) and pass on via kwargs.
        kwargs["scope"] = kwargs.get("scope", "neural-network")

        # Force the only API-method to be `apply`. No matter whether custom-API or auto-generated (via Stack).
        if "api_methods" not in kwargs:
            @rlgraph_api
            def apply(self, *inputs):
                out = self.apply_shadowed_(*inputs)
                if isinstance(out, dict):
                    assert "output" in out
                    return out
                else:
                    return dict(output=out)

            kwargs["api_methods"] = {("apply_shadowed_", "apply")}
        else:
            assert len(kwargs["api_methods"]) == 1, \
                "ERROR: Only 0 or 1 given API-methods are allowed in NeuralNetwork ctor! You provided " \
                "'{}'.".format(kwargs["api_methods"])
            # Make sure the only allowed api_method is `apply`.
            assert next(iter(kwargs["api_methods"]))[0] == "apply", \
                "ERROR: NeuralNetwork's custom API-method must be called `apply`! You named it '{}'.". \
                    format(next(iter(kwargs["api_methods"]))[0])

        super(NeuralNetwork, self).__init__(*layers_args, **kwargs)

    def _build_stack(self, api_methods):
        """
        For each api-method in set `api_methods`, automatically create this Stack's own API-method by connecting
        through all sub-Component's API-methods. This is skipped if this Stack already has a custom API-method
        by that name.

        Args:
           api_methods (Set[Union[str,Tuple[str,str]]]): See ctor kwargs.
           #connection_rule (str): See ctor kwargs.
        """
        # Loop through the API-method set.
        for api_method_spec in api_methods:
            # API-method of sub-Components and this Stack should have different names.
            if isinstance(api_method_spec, tuple):
                # Custom method given, use that instead of creating one automatically.
                if callable(api_method_spec[1]):
                    stack_api_method_name = components_api_method_name = api_method_spec[0]
                else:
                    stack_api_method_name, components_api_method_name = api_method_spec[0], api_method_spec[1]
                # API-method of sub-Components and this Stack should have the same name.
            else:
                stack_api_method_name = components_api_method_name = api_method_spec

            # API-method for this Stack does not exist yet -> Automatically create it.
            if not hasattr(self, stack_api_method_name):
                @rlgraph_api(name=stack_api_method_name, component=self)
                def method(self_, *inputs, **kwargs):
                    if get_backend() == "pytorch" and self.execution_mode == "define_by_run":
                        # Avoid jumping back between layers and calls at runtime.
                        return self.fast_path_exec(inputs, **kwargs)
                    else:
                        args_ = inputs
                        kwargs_ = kwargs
                        for i, sub_component in enumerate(self_.sub_components.values()):  # type: Component
                            # TODO: python-Components: For now, we call each preprocessor's graph_fn
                            #  directly (assuming that inputs are not ContainerSpaces).
                            if self_.backend == "python" or get_backend() == "python":
                                graph_fn = getattr(sub_component, "_graph_fn_" + components_api_method_name)
                                #if sub_component.api_methods[components_api_method_name].add_auto_key_as_first_param:
                                #    results = graph_fn("", *args_)  # TODO: kwargs??
                                #else:
                                results = graph_fn(*args_)
                            elif get_backend() == "pytorch":
                                # Do NOT convert to tuple, has to be in unpacked again immediately.n
                                results = getattr(sub_component, components_api_method_name)(*force_list(args_))
                            else:  #if get_backend() == "tf":
                                results = getattr(sub_component, components_api_method_name)(*args_, **kwargs_)

                            # Recycle args_, kwargs_ for reuse in next sub-Component's API-method call.
                            if isinstance(results, dict):
                                args_ = ()
                                kwargs_ = results
                            else:
                                args_ = force_tuple(results)
                                kwargs_ = {}

                        if args_ == ():
                            return kwargs_
                        elif len(args_) == 1:
                            return args_[0]
                        else:
                            return args_

            # Build fast-path execution method for pytorch / eager.
            if get_backend() == "pytorch":
                def fast_path_exec(*inputs, **kwargs):
                    inputs = inputs[0]
                    forward_inputs = []
                    for v in inputs:
                        if v is not None:
                            if isinstance(v, tuple):
                                # Unitary tuples
                                forward_inputs.append(v[0])
                            else:
                                forward_inputs.append(v)
                    result = self.network_obj.forward(*forward_inputs)
                    # Problem: Not everything in the neural network stack is a true layer.
                    for c in self.non_layer_components:
                        result = getattr(c, "apply")(*force_list(result))
                    return result

                self.fast_path_exec = fast_path_exec

    def _post_define_by_run_build(self):
        # Layer objects only exist after build - define torch neural network.
        layer_objects = []
        self.non_layer_components = []
        for component in self.sub_components.values():
            if hasattr(component, "layer"):
                # Store Layer object itself.
                layer_objects.append(component.layer)

                # Append activation fn if needed.
                # N.b. linear returns None here.
                if component.activation_fn is not None:
                    layer_objects.append(component.activation_fn)
            else:
                self.non_layer_components.append(component)
        self.network_obj = torch.nn.Sequential(*layer_objects)

[docs]    def has_rnn(self):
        # TODO: Maybe it would be better to create a child class (RecurrentNeuralNetwork with has_rrn=True and
        # TODO: other available information for its API-clients such as internal_states_space, etc..)
        # Set a convenience flag if one of our sub-Components is an LSTMLayer.
        return any(isinstance(sc, LSTMLayer) for sc in self.get_all_sub_components())