# layers.py
  1. # Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
  2. #
  3. # Licensed under the Apache License, Version 2.0 (the "License");
  4. # you may not use this file except in compliance with the License.
  5. # You may obtain a copy of the License at
  6. #
  7. # http://www.apache.org/licenses/LICENSE-2.0
  8. #
  9. # Unless required by applicable law or agreed to in writing, software
  10. # distributed under the License is distributed on an "AS IS" BASIS,
  11. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. # See the License for the specific language governing permissions and
  13. # limitations under the License.
  14. """ High level definition of layers for model construction """
  15. import tensorflow as tf
  16. def _normalization(inputs, name, mode):
  17. """ Choose a normalization layer
  18. :param inputs: Input node from the graph
  19. :param name: Name of layer
  20. :param mode: Estimator's execution mode
  21. :return: Normalized output
  22. """
  23. training = mode == tf.estimator.ModeKeys.TRAIN
  24. if name == 'instancenorm':
  25. gamma_initializer = tf.constant_initializer(1.0)
  26. return tf.contrib.layers.instance_norm(
  27. inputs,
  28. center=True,
  29. scale=True,
  30. epsilon=1e-6,
  31. param_initializers={'gamma': gamma_initializer},
  32. reuse=None,
  33. variables_collections=None,
  34. outputs_collections=None,
  35. trainable=True,
  36. data_format='NHWC',
  37. scope=None)
  38. if name == 'groupnorm':
  39. return tf.contrib.layers.group_norm(inputs=inputs,
  40. groups=16,
  41. channels_axis=-1,
  42. reduction_axes=(-4, -3, -2),
  43. activation_fn=None,
  44. trainable=True)
  45. if name == 'batchnorm':
  46. return tf.keras.layers.BatchNormalization(axis=-1,
  47. trainable=True,
  48. virtual_batch_size=None)(inputs, training=training)
  49. if name == 'none':
  50. return inputs
  51. raise ValueError('Invalid normalization layer')
  52. def _activation(out, activation):
  53. """ Choose an activation layer
  54. :param out: Input node from the graph
  55. :param activation: Name of layer
  56. :return: Activation output
  57. """
  58. if activation == 'relu':
  59. return tf.nn.relu(out)
  60. if activation == 'leaky_relu':
  61. return tf.nn.leaky_relu(out, alpha=0.01)
  62. if activation == 'sigmoid':
  63. return tf.nn.sigmoid(out)
  64. if activation == 'softmax':
  65. return tf.nn.softmax(out, axis=-1)
  66. if activation == 'none':
  67. return out
  68. raise ValueError("Unknown activation {}".format(activation))
  69. def convolution(inputs, # pylint: disable=R0913
  70. out_channels,
  71. kernel_size=3,
  72. stride=1,
  73. mode=tf.estimator.ModeKeys.TRAIN,
  74. normalization='batchnorm',
  75. activation='leaky_relu',
  76. transpose=False):
  77. """ Create a convolution layer
  78. :param inputs: Input node from graph
  79. :param out_channels: Output number of channels
  80. :param kernel_size: Size of the kernel
  81. :param stride: Stride of the kernel
  82. :param mode: Estimator's execution mode
  83. :param normalization: Name of the normalization layer
  84. :param activation: Name of the activation layer
  85. :param transpose: Select between regular and transposed convolution
  86. :return: Convolution output
  87. """
  88. if transpose:
  89. conv = tf.keras.layers.Conv3DTranspose
  90. else:
  91. conv = tf.keras.layers.Conv3D
  92. regularizer = None # tf.keras.regularizers.l2(1e-5)
  93. use_bias = normalization == "none"
  94. inputs = conv(filters=out_channels,
  95. kernel_size=kernel_size,
  96. strides=stride,
  97. activation=None,
  98. padding='same',
  99. data_format='channels_last',
  100. kernel_initializer=tf.compat.v1.glorot_uniform_initializer(),
  101. kernel_regularizer=regularizer,
  102. bias_initializer=tf.zeros_initializer(),
  103. bias_regularizer=regularizer,
  104. use_bias=use_bias)(inputs)
  105. inputs = _normalization(inputs, normalization, mode)
  106. return _activation(inputs, activation)
  107. def upsample_block(inputs, skip_connection, out_channels, normalization, mode):
  108. """ Create a block for upsampling
  109. :param inputs: Input node from the graph
  110. :param skip_connection: Choose whether or not to use skip connection
  111. :param out_channels: Number of output channels
  112. :param normalization: Name of the normalizaiton layer
  113. :param mode: Estimator's execution mode
  114. :return: Output from the upsample block
  115. """
  116. inputs = convolution(inputs, kernel_size=2, out_channels=out_channels, stride=2,
  117. normalization='none', activation='none', transpose=True)
  118. inputs = tf.keras.layers.Concatenate(axis=-1)([inputs, skip_connection])
  119. inputs = convolution(inputs, out_channels=out_channels, normalization=normalization, mode=mode)
  120. inputs = convolution(inputs, out_channels=out_channels, normalization=normalization, mode=mode)
  121. return inputs
  122. def input_block(inputs, out_channels, normalization, mode):
  123. """ Create the input block
  124. :param inputs: Input node from the graph
  125. :param out_channels: Number of output channels
  126. :param normalization: Name of the normalization layer
  127. :param mode: Estimator's execution mode
  128. :return: Output from the input block
  129. """
  130. inputs = convolution(inputs, out_channels=out_channels, normalization=normalization, mode=mode)
  131. inputs = convolution(inputs, out_channels=out_channels, normalization=normalization, mode=mode)
  132. return inputs
  133. def downsample_block(inputs, out_channels, normalization, mode):
  134. """ Create a downsample block
  135. :param inputs: Input node from the graph
  136. :param out_channels: Number of output channels
  137. :param normalization: Name of the normalization layer
  138. :param mode: Estimator's execution mode
  139. :return: Output from the downsample block
  140. """
  141. inputs = convolution(inputs, out_channels=out_channels, normalization=normalization, mode=mode, stride=2)
  142. return convolution(inputs, out_channels=out_channels, normalization=normalization, mode=mode)
  143. def output_layer(inputs, out_channels, activation):
  144. """ Create the output layer
  145. :param inputs: Input node from the graph
  146. :param out_channels: Number of output channels
  147. :param activation: Name of the activation layer
  148. :return: Output from the output block
  149. """
  150. return convolution(inputs, out_channels=out_channels, kernel_size=3, normalization='none', activation=activation)