Module delta.extensions.layers.pretrained
Use a pretrained model inside another network.
Expand source code
# Copyright © 2020, United States Government, as represented by the
# Administrator of the National Aeronautics and Space Administration.
# All rights reserved.
#
# The DELTA (Deep Earth Learning, Tools, and Analysis) platform is
# licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0.
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
Use a pretrained model inside another network.
"""
from typing import List, Optional
import tensorflow
import tensorflow.keras.models #pylint: disable=no-name-in-module
from delta.ml.io import load_model
from delta.config.extensions import register_layer
class InputSelectLayer(tensorflow.keras.layers.Layer):
"""
A layer that takes any number of inputs, and returns a given one.
"""
def __init__(self, arg_number, **kwargs):
"""
Parameters
----------
arg_number: int
The index of the input to select.
"""
super().__init__(**kwargs)
self._arg = arg_number
def call(self, inputs, **kwargs): #pylint: disable=unused-argument
return inputs[self._arg]
def get_config(self):
return {'arg_number' : self._arg}
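# Helper for pretrained() below: walks model.layers in order, applies the requested
# trainable flag (BatchNormalization layers keep their existing setting), recurses into
# nested sub-models, and collects layers until break_point(index, layer) is satisfied.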
def _model_to_output_layers(model, break_point, trainable):
output_layers = []
for idx, l in enumerate(model.layers):
if not isinstance(l, tensorflow.keras.layers.BatchNormalization):
l.trainable = trainable
if isinstance(l, tensorflow.keras.models.Model): # assumes sequential
output_layers.extend(_model_to_output_layers(l, break_point, trainable))
else:
output_layers.append(l)
if break_point(idx, l):
break
return output_layers
def pretrained(filename, encoding_layer, outputs: Optional[List[str]]=None, trainable: bool=True,
training: bool=True, **kwargs):
"""
Creates a pre-trained layer from an existing model file.
Only works with sequential models. This was quite tricky to get right with tensorflow.
Parameters
----------
filename: str
Model file to load.
encoding_layer: int or str
Index or name of the layer to stop at.
outputs: Optional[List[str]]
List of names of output layers that may be used later in the model.
Only layers listed here will be accessible as inputs to other layers, in the form
this_layer_name/internal_name (the internal_name must be listed in outputs for this to work).
trainable: bool
Whether to update weights during training for this layer.
training: bool
Standard tensorflow option, used for batch norm layers.
"""
model = load_model(filename)
if isinstance(encoding_layer, int):
break_point = lambda x, y: x == encoding_layer
elif isinstance(encoding_layer, str):
break_point = lambda x, y: y.name == encoding_layer
output_layers = _model_to_output_layers(model, break_point, trainable)
output_tensors = []
cur = model.inputs[0]
old_to_new = {}
old_to_new[cur.ref()] = cur
for l in output_layers:
if isinstance(l, tensorflow.keras.layers.InputLayer):
old_to_new[l.output.ref()] = cur
output_tensors.append(cur)
continue
if isinstance(l.input, list):
inputs = [old_to_new[t.ref()] for t in l.input]
else:
inputs = old_to_new[l.input.ref()]
cur = l(inputs)
old_to_new[l.output.ref()] = cur
output_tensors.append(cur)
new_model = tensorflow.keras.models.Model(model.inputs, output_tensors, **kwargs)
layers_dict = {}
if outputs:
for (i, l) in enumerate(output_layers):
if l.name not in outputs:
continue
layers_dict[l.name] = InputSelectLayer(i)
def call(*inputs):
result = new_model(inputs, training=training)
output = (InputSelectLayer(len(output_layers)-1)(result), {k : v(result) for k, v in layers_dict.items()})
return output
return call
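# Register the layers so DELTA network configurations can refer to them by name.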
register_layer('InputSelectLayer', InputSelectLayer)
register_layer('Pretrained', pretrained)
Functions
def pretrained(filename, encoding_layer, outputs: Optional[List[str]] = None, trainable: bool = True, training: bool = True, **kwargs)
-
Creates a pre-trained layer from an existing model file. Only works with sequential models. This was quite tricky to get right with tensorflow.
Parameters
filename : str
- Model file to load.
encoding_layer : int or str
- Index or name of the layer to stop at.
outputs : Optional[List[str]]
- List of names of output layers that may be used later in the model. Only layers listed here will be accessible as inputs to other layers, in the form this_layer_name/internal_name (the internal_name must be listed in outputs for this to work).
trainable : bool
- Whether to update weights during training for this layer.
training : bool
- Standard tensorflow option, used for batch norm layers.
Classes
class InputSelectLayer (arg_number, **kwargs)
-
A layer that takes any number of inputs, and returns a given one.
Parameters
arg_number : int
- The index of the input to select.
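For illustration, a minimal sketch of the layer on its own: given a list (or tuple) of inputs it simply passes the selected one through unchanged.
import tensorflow
from delta.extensions.layers.pretrained import InputSelectLayer

a = tensorflow.constant([1.0, 2.0])
b = tensorflow.constant([3.0, 4.0])
select_second = InputSelectLayer(1)
print(select_second([a, b]))   # tf.Tensor([3. 4.], shape=(2,), dtype=float32)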
Ancestors
- keras.engine.base_layer.Layer
- tensorflow.python.module.module.Module
- tensorflow.python.training.tracking.autotrackable.AutoTrackable
- tensorflow.python.training.tracking.base.Trackable
- keras.utils.version_utils.LayerVersionSelector
Methods
def call(self, inputs, **kwargs)
-
This is where the layer's logic lives.
The call() method may not create state (except in its first invocation, wrapping the creation of variables or other resources in tf.init_scope()). It is recommended to create state in __init__(), or in the build() method that is called automatically before call() executes the first time.
Args
inputs
- Input tensor, or dict/list/tuple of input tensors. The first positional inputs argument is subject to special rules:
  - inputs must be explicitly passed. A layer cannot have zero arguments, and inputs cannot be provided via the default value of a keyword argument.
  - NumPy array or Python scalar values in inputs get cast as tensors.
  - Keras mask metadata is only collected from inputs.
  - Layers are built (the build(input_shape) method) using shape info from inputs only.
  - input_spec compatibility is only checked against inputs.
  - Mixed precision input casting is only applied to inputs. If a layer has tensor arguments in *args or **kwargs, their casting behavior in mixed precision should be handled manually.
  - The SavedModel input specification is generated using inputs only.
  - Integration with various ecosystem packages like TFMOT, TFLite, TF.js, etc. is only supported for inputs and not for tensors in positional and keyword arguments.
*args
- Additional positional arguments. May contain tensors, although this is not recommended, for the reasons above.
**kwargs
- Additional keyword arguments. May contain tensors, although this is not recommended, for the reasons above. The following optional keyword arguments are reserved:
  - training: Boolean scalar tensor or Python boolean indicating whether the call is meant for training or inference.
  - mask: Boolean input mask. If the layer's call() method takes a mask argument, its default value will be set to the mask generated for inputs by the previous layer (if inputs did come from a layer that generated a corresponding mask, i.e. if it came from a Keras layer with masking support).
Returns
A tensor or list/tuple of tensors.
def get_config(self)
-
Returns the config of the layer.
A layer config is a Python dictionary (serializable) containing the configuration of a layer. The same layer can be reinstantiated later (without its trained weights) from this configuration.
The config of a layer does not include connectivity information, nor the layer class name. These are handled by Network (one layer of abstraction above).
Note that get_config() does not guarantee to return a fresh copy of dict every time it is called. The callers should make a copy of the returned dict if they want to modify it.
Returns
Python dictionary.
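A small sketch of what this looks like for InputSelectLayer, whose config is just its constructor argument, so the layer can be reinstantiated from it:
from delta.extensions.layers.pretrained import InputSelectLayer

layer = InputSelectLayer(2)
config = layer.get_config()            # {'arg_number': 2}
rebuilt = InputSelectLayer(**config)   # recreate the layer (without weights) from its config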