# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Tests add_loss API correctness."""

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import numpy as np

from tensorflow.python.eager import backprop
from tensorflow.python.eager import context
from tensorflow.python.eager import def_function
from tensorflow.python.keras import Input
from tensorflow.python.keras import keras_parameterized
from tensorflow.python.keras import layers
from tensorflow.python.keras import losses
from tensorflow.python.keras import Model
from tensorflow.python.keras import optimizer_v2
from tensorflow.python.keras import Sequential
from tensorflow.python.keras import testing_utils
from tensorflow.python.ops import array_ops
from tensorflow.python.ops import math_ops
from tensorflow.python.platform import test
from tensorflow.python.platform import tf_logging as logging
from tensorflow.python.training.rmsprop import RMSPropOptimizer

MAE = losses.MeanAbsoluteError
mae = losses.mean_absolute_error


def get_ctl_train_step(model):
  optimizer = optimizer_v2.gradient_descent.SGD(0.05)

  def train_step(x, y, w=None):
    with backprop.GradientTape() as tape:
      if w is not None:
        model([x, y, w])
      else:
        model([x, y])
      loss = math_ops.reduce_sum(model.losses)
    gradients = tape.gradient(loss, model.trainable_weights)
    optimizer.apply_gradients(zip(gradients, model.trainable_weights))
    return loss

  return train_step


# TODO(psv): Add test cases where a model is used in loss function but is
# not part of the training model.
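
# Note on the expected values asserted below: testing_utils.Bias() is a small
# layer that adds a single trainable, zero-initialized bias to its input, so
# with the x/y data defined in setUp() the initial mean absolute error is 1.0.
# Tests that register two such loss terms therefore start from a total loss of
# 2.0, and plain SGD moves the bias by a fixed amount per epoch, which yields
# linearly decreasing sequences such as [2., 1.8, 1.6, 1.4, 1.2] at learning
# rate 0.05.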


class TestAddLossCorrectness(keras_parameterized.TestCase):

  def setUp(self):
    super(TestAddLossCorrectness, self).setUp()
    self.x = np.array([[0.], [1.], [2.]], dtype='float32')
    self.y = np.array([[0.5], [2.], [3.5]], dtype='float32')
    self.w = np.array([[1.25], [0.5], [1.25]], dtype='float32')

  @keras_parameterized.run_all_keras_modes
  def test_loss_on_model_fit(self):
    inputs = Input(shape=(1,))
    targets = Input(shape=(1,))
    outputs = testing_utils.Bias()(inputs)
    model = Model([inputs, targets], outputs)
    model.add_loss(MAE()(targets, outputs))
    model.add_loss(math_ops.reduce_mean(mae(targets, outputs)))
    model.compile(
        optimizer_v2.gradient_descent.SGD(0.05),
        run_eagerly=testing_utils.should_run_eagerly())

    history = model.fit([self.x, self.y], batch_size=3, epochs=5)
    self.assertAllClose(history.history['loss'], [2., 1.8, 1.6, 1.4, 1.2], 1e-3)

  @keras_parameterized.run_with_all_model_types(exclude_models=['sequential'])
  @keras_parameterized.run_all_keras_modes(always_skip_v1=True)
  def test_loss_callable_on_model_fit(self):
    model = testing_utils.get_model_from_layers([testing_utils.Bias()],
                                                input_shape=(1,))

    def callable_loss():
      return math_ops.reduce_sum(model.weights)

    model.add_loss(callable_loss)
    model.compile(
        optimizer_v2.gradient_descent.SGD(0.1),
        run_eagerly=testing_utils.should_run_eagerly())

    history = model.fit(self.x, batch_size=3, epochs=5)
    self.assertAllClose(history.history['loss'], [0., -.1, -.2, -.3, -.4], 1e-3)

  @keras_parameterized.run_all_keras_modes(always_skip_v1=True)
  def test_loss_on_model_ctl(self):
    def get_model_and_train_step():
      inputs = Input(shape=(1,))
      targets = Input(shape=(1,))
      outputs = testing_utils.Bias()(inputs)
      model = Model([inputs, targets], outputs)
      model.add_loss(MAE()(targets, outputs))
      model.add_loss(math_ops.reduce_mean(mae(targets, outputs)))
      return get_ctl_train_step(model)

    train_step = get_model_and_train_step()
    loss = [train_step(self.x, self.y) for _ in range(5)]
    self.assertAllClose(loss, [2., 1.8, 1.6, 1.4, 1.2], 1e-3)

    train_step = def_function.function(get_model_and_train_step())
    loss = [train_step(self.x, self.y) for _ in range(5)]
    self.assertAllClose(loss, [2., 1.8, 1.6, 1.4, 1.2], 1e-3)

  @keras_parameterized.run_all_keras_modes(always_skip_v1=True)
  def test_loss_callable_on_model_ctl(self):
    def get_model_and_train_step():
      inputs = Input(shape=(1,))
      targets = Input(shape=(1,))
      outputs = testing_utils.Bias()(inputs)
      model = Model([inputs, targets], outputs)

      def callable_loss():
        return math_ops.reduce_sum(model.weights)

      model.add_loss(callable_loss)
      return get_ctl_train_step(model)

    train_step = get_model_and_train_step()
    loss = [train_step(self.x, self.y) for _ in range(5)]
    self.assertAllClose(loss, [0., -0.05, -0.1, -0.15, -0.2], 1e-3)

    train_step = def_function.function(get_model_and_train_step())
    loss = [train_step(self.x, self.y) for _ in range(5)]
    self.assertAllClose(loss, [0., -0.05, -0.1, -0.15, -0.2], 1e-3)

  @keras_parameterized.run_all_keras_modes
  def test_loss_with_sample_weight_on_model_fit(self):
    inputs = Input(shape=(1,))
    targets = Input(shape=(1,))
    sw = Input(shape=(1,))
    outputs = testing_utils.Bias()(inputs)
    model = Model([inputs, targets, sw], outputs)
    model.add_loss(MAE()(targets, outputs, sw))
    model.add_loss(3 * math_ops.reduce_mean(sw * mae(targets, outputs)))
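    # With the bias at zero, the weighted MAE term above evaluates to 1.0 and
    # the 3x-scaled term to 3.0, so the first epoch's loss should be 4.0.
    # SGD(0.025) on the resulting gradient of -4 then moves the bias by 0.1
    # per epoch, reducing the total loss by 0.4 each epoch.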
    model.compile(
        optimizer_v2.gradient_descent.SGD(0.025),
        run_eagerly=testing_utils.should_run_eagerly())

    history = model.fit([self.x, self.y, self.w], batch_size=3, epochs=5)
    self.assertAllClose(history.history['loss'], [4., 3.6, 3.2, 2.8, 2.4], 1e-3)

  @keras_parameterized.run_all_keras_modes(always_skip_v1=True)
  def test_loss_with_sample_weight_on_model_ctl(self):
    def get_model_and_train_step():
      inputs = Input(shape=(1,))
      targets = Input(shape=(1,))
      sw = Input(shape=(1,))
      outputs = testing_utils.Bias()(inputs)
      model = Model([inputs, targets, sw], outputs)
      model.add_loss(MAE()(targets, outputs, sw))
      model.add_loss(math_ops.reduce_mean(sw * mae(targets, outputs)))
      return get_ctl_train_step(model)

    train_step = get_model_and_train_step()
    loss = [train_step(self.x, self.y, self.w) for _ in range(5)]
    self.assertAllClose(loss, [2., 1.8, 1.6, 1.4, 1.2], 1e-3)

    train_step = def_function.function(get_model_and_train_step())
    loss = [train_step(self.x, self.y, self.w) for _ in range(5)]
    self.assertAllClose(loss, [2., 1.8, 1.6, 1.4, 1.2], 1e-3)

  @keras_parameterized.run_all_keras_modes
  def test_loss_with_sample_weight_in_model_call(self):

    class MyModel(Model):

      def __init__(self):
        super(MyModel, self).__init__()
        self.bias = testing_utils.Bias()

      def call(self, inputs):
        outputs = self.bias(inputs[0])
        self.add_loss(MAE()(inputs[1], outputs, inputs[2]))
        self.add_loss(math_ops.reduce_mean(inputs[2] * mae(inputs[1], outputs)))
        return outputs

    model = MyModel()
    model.predict([self.x, self.y, self.w])
    model.compile(
        optimizer_v2.gradient_descent.SGD(0.05),
        run_eagerly=testing_utils.should_run_eagerly())

    history = model.fit([self.x, self.y, self.w], batch_size=3, epochs=5)
    self.assertEqual(len(model.losses), 2)
    self.assertAllClose(history.history['loss'], [2., 1.8, 1.6, 1.4, 1.2], 1e-3)

    eval_out = model.evaluate([self.x, self.y, self.w])
    self.assertAlmostEqual(eval_out, 1.0, 3)

  @keras_parameterized.run_all_keras_modes
  def test_loss_with_sample_weight_in_layer_call(self):

    class MyLayer(layers.Layer):

      def __init__(self):
        super(MyLayer, self).__init__()
        self.bias = testing_utils.Bias()

      def call(self, inputs):
        out = self.bias(inputs[0])
        self.add_loss(MAE()(inputs[1], out, inputs[2]))
        self.add_loss(math_ops.reduce_mean(inputs[2] * mae(inputs[1], out)))
        return out

    inputs = Input(shape=(1,))
    targets = Input(shape=(1,))
    sw = Input(shape=(1,))

    outputs = MyLayer()([inputs, targets, sw])
    model = Model([inputs, targets, sw], outputs)
    model.predict([self.x, self.y, self.w])
    model.compile(
        optimizer_v2.gradient_descent.SGD(0.05),
        run_eagerly=testing_utils.should_run_eagerly())

    history = model.fit([self.x, self.y, self.w], batch_size=3, epochs=5)
    self.assertAllClose(history.history['loss'], [2., 1.8, 1.6, 1.4, 1.2], 1e-3)

    output = model.evaluate([self.x, self.y, self.w])
    self.assertAlmostEqual(output, 1.0, 3)

    output = model.test_on_batch([self.x, self.y, self.w])
    self.assertAlmostEqual(output, 1.0, 3)

  @keras_parameterized.run_all_keras_modes
  def test_loss_on_layer(self):

    class MyLayer(layers.Layer):

      def call(self, inputs):
        self.add_loss(math_ops.reduce_sum(inputs))
        return inputs
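
    # MyLayer registers reduce_sum(inputs) as an input-conditional loss. With
    # an all-ones (2, 3) batch and identical inputs and targets, the compiled
    # MSE is zero, so train_on_batch should report only the added loss,
    # 2 * 3 = 6.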
    inputs = Input((3,))
    layer = MyLayer()
    outputs = layer(inputs)
    model = Model(inputs, outputs)
    self.assertEqual(len(model.losses), 1)
    model.compile(
        'sgd',
        'mse',
        run_eagerly=testing_utils.should_run_eagerly())
    loss = model.train_on_batch(np.ones((2, 3)), np.ones((2, 3)))
    self.assertEqual(loss, 2 * 3)

  @keras_parameterized.run_all_keras_modes
  @keras_parameterized.run_with_all_model_types
  def test_activity_regularizer(self):
    loss = {}
    for reg in [None, 'l2']:
      model_layers = [
          layers.Dense(
              10,
              activation='relu',
              activity_regularizer=reg,
              kernel_initializer='ones',
              use_bias=False),
          layers.Dense(
              1,
              activation='sigmoid',
              kernel_initializer='ones',
              use_bias=False),
      ]

      model = testing_utils.get_model_from_layers(
          model_layers, input_shape=(10,))

      x = np.ones((10, 10), 'float32')
      y = np.zeros((10, 1), 'float32')

      optimizer = RMSPropOptimizer(learning_rate=0.001)
      model.compile(
          optimizer,
          'binary_crossentropy',
          run_eagerly=testing_utils.should_run_eagerly())
      model.fit(x, y, batch_size=2, epochs=5)
      loss[reg] = model.evaluate(x, y)
    self.assertLess(loss[None], loss['l2'])

  @keras_parameterized.run_all_keras_modes
  @keras_parameterized.run_with_all_model_types
  def test_activity_regularizer_loss_value(self):
    layer = layers.Dense(
        1,
        kernel_initializer='zeros',
        bias_initializer='ones',
        activity_regularizer='l2')

    model = testing_utils.get_model_from_layers([layer], input_shape=(10,))

    x = np.ones((10, 10), 'float32')
    optimizer = RMSPropOptimizer(learning_rate=0.001)
    model.compile(
        optimizer,
        run_eagerly=testing_utils.should_run_eagerly())
    loss = model.test_on_batch(x)
    self.assertAlmostEqual(0.01, loss, places=4)

  @keras_parameterized.run_all_keras_modes
  def test_activity_regularizer_batch_independent(self):
    inputs = layers.Input(shape=(10,))
    x = layers.Dense(10, activation='relu', activity_regularizer='l2')(inputs)
    outputs = layers.Dense(1, activation='sigmoid')(x)
    model = Model(inputs, outputs)

    optimizer = RMSPropOptimizer(learning_rate=0.001)
    model.compile(
        optimizer,
        run_eagerly=testing_utils.should_run_eagerly())

    loss_small_batch = model.test_on_batch(np.ones((10, 10), 'float32'))
    loss_big_batch = model.test_on_batch(np.ones((20, 10), 'float32'))
    self.assertAlmostEqual(loss_small_batch, loss_big_batch, places=4)

  @keras_parameterized.run_all_keras_modes
  def test_with_shared_layer(self):

    class LayerWithLoss(layers.Layer):

      def call(self, inputs):
        self.add_loss(math_ops.reduce_sum(inputs), inputs=inputs)
        return inputs * 2

    shared_layer = LayerWithLoss()

    m = Sequential([shared_layer])
    m2 = Sequential([shared_layer, m])
    m2(array_ops.constant([1, 2, 3]))
    self.assertEqual(len(m2.losses), 2)
    self.assertAllClose(m2.losses, [6, 12])

  @keras_parameterized.run_all_keras_modes
  def test_with_shared_nested_layer(self):

    class LayerWithLoss(layers.Layer):

      def call(self, inputs):
        self.add_loss(math_ops.reduce_sum(inputs), inputs=inputs)
        return inputs * 2

    class LayerWithNestedLayerWithLoss(layers.Layer):

      def __init__(self):
        super(LayerWithNestedLayerWithLoss, self).__init__()
        self.loss_layer = LayerWithLoss()

      def call(self, inputs):
        return self.loss_layer(inputs)

    shared_layer = LayerWithNestedLayerWithLoss()
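
    # The loss-bearing layer is shared between m and m2, so calling m2 invokes
    # it twice: once on the raw input (loss 1 + 2 + 3 = 6) and once, through
    # the nested model m, on the doubled output (loss 2 + 4 + 6 = 12). Both
    # loss tensors should therefore be tracked on m2.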
    m = Sequential([shared_layer])
    m2 = Sequential([shared_layer, m])
    m2(array_ops.constant([1, 2, 3]))
    self.assertEqual(len(m2.losses), 2)
    self.assertAllClose(m2.losses, [6, 12])

  @keras_parameterized.run_all_keras_modes
  def test_clear_losses(self):

    class LayerWithSharedNestedLossLayer(layers.Layer):

      def __init__(self):
        super(LayerWithSharedNestedLossLayer, self).__init__()
        self.loss_layer = layers.ActivityRegularization(l2=0.001)
        self.add_weight(shape=(1,), regularizer='l2')

      def call(self, x):
        x = self.loss_layer(x)
        return self.loss_layer(x)

    inputs = Input(shape=(1,))
    l = LayerWithSharedNestedLossLayer()  # Weight loss + 2 activity losses.

    x1 = array_ops.ones((1, 1))
    _ = l(x1)
    if not context.executing_eagerly():
      self.assertEqual(len(l.get_losses_for(x1)), 2)
      self.assertEqual(len(l.get_losses_for(None)), 1)

    x2 = array_ops.ones((1, 1))
    _ = l(x2)
    if not context.executing_eagerly():
      self.assertEqual(len(l.get_losses_for(x1)), 2)
      self.assertEqual(len(l.get_losses_for(x2)), 2)
      self.assertEqual(len(l.get_losses_for(None)), 1)

    outputs = l(inputs)
    model = Model(inputs, outputs)
    if not context.executing_eagerly():
      self.assertEqual(len(model.losses), 7)
      self.assertEqual(len(l.get_losses_for(x1)), 2)
      self.assertEqual(len(l.get_losses_for(x2)), 2)
      self.assertEqual(len(l.get_losses_for(None)), 1)

    x3 = array_ops.ones((1, 1))
    model(x3)
    x4 = array_ops.ones((1, 1))
    model(x4)
    if context.executing_eagerly():
      # Eager losses are cleared every `__call__`.
      self.assertEqual(len(model.losses), 3)
    else:
      self.assertEqual(len(model.losses), 11)
      self.assertEqual(len(model.get_losses_for(x3)), 2)
      self.assertEqual(len(model.get_losses_for(x4)), 2)
      self.assertEqual(len(model.get_losses_for(None)), 1)

  @keras_parameterized.run_all_keras_modes(always_skip_v1=True)
  def test_invalid_constant_input(self):
    inputs = Input(shape=(1,))
    outputs = testing_utils.Bias()(inputs)
    model = Model(inputs, outputs)
    with self.assertRaisesRegex(
        ValueError,
        'Expected a symbolic Tensors or a callable for the loss value'):
      model.add_loss(1.)

  @keras_parameterized.run_all_keras_modes(always_skip_v1=True)
  def test_invalid_variable_input(self):
    inputs = Input(shape=(1,))
    outputs = testing_utils.Bias()(inputs)
    model = Model(inputs, outputs)
    with self.assertRaisesRegex(
        ValueError,
        'Expected a symbolic Tensors or a callable for the loss value'):
      model.add_loss(model.weights[0])

  @keras_parameterized.run_all_keras_modes
  def test_add_entropy_loss_on_functional_model(self):
    inputs = Input(shape=(1,))
    targets = Input(shape=(1,))
    outputs = testing_utils.Bias()(inputs)
    model = Model([inputs, targets], outputs)
    model.add_loss(losses.binary_crossentropy(targets, outputs))
    model.compile('sgd', run_eagerly=testing_utils.should_run_eagerly())
    with test.mock.patch.object(logging, 'warning') as mock_log:
      model.fit([self.x, self.y], batch_size=3, epochs=5)
      self.assertNotIn('Gradients do not exist for variables',
                       str(mock_log.call_args))


if __name__ == '__main__':
  test.main()