Implement lifted_struct_loss (#30)

supercontracts · seanpmorgan · commit 1d6b2455f328 · 2019-02-23T18:43:54.000-05:00
* lifted_struct_loss function added
diff --git a/tensorflow_addons/losses/BUILD b/tensorflow_addons/losses/BUILD
@@ -7,8 +7,9 @@ py_library(
     srcs = [
         "__init__.py",
         "python/__init__.py",
-        "python/triplet.py",
+        "python/lifted.py",
         "python/metric_learning.py",
+        "python/triplet.py",
     ],
     srcs_version = "PY2AND3",
     deps = [
@@ -28,3 +29,16 @@ py_test(
     ],
     srcs_version = "PY2AND3",
 )
+
+py_test(
+    name = "lifted_py_test",
+    size = "small",
+    srcs = [
+        "python/lifted_test.py",
+    ],
+    main = "python/lifted_test.py",  # Set explicitly: differs from "<name>.py".
+    deps = [
+        ":losses_py",
+    ],
+    srcs_version = "PY2AND3",
+)
diff --git a/tensorflow_addons/losses/python/lifted.py b/tensorflow_addons/losses/python/lifted.py
@@ -0,0 +1,132 @@
+# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Implements lifted_struct_loss."""
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import tensorflow as tf
+from tensorflow.python.framework import dtypes
+from tensorflow.python.keras import losses
+from tensorflow.python.keras.utils import losses_utils
+from tensorflow.python.ops import array_ops
+from tensorflow.python.ops import math_ops
+from tensorflow_addons.losses.python import metric_learning
+from tensorflow_addons.utils.python import keras_utils
+
+
+@keras_utils.register_keras_custom_object
+@tf.function
+def lifted_struct_loss(labels, embeddings, margin=1.0):
+    """Computes the lifted structured loss.
+
+    Args:
+      labels: 1-D tf.int32 `Tensor` [batch_size] of multiclass integer labels.
+      embeddings: 2-D float `Tensor` of embedding vectors. Embeddings should
+        not be l2 normalized.
+      margin: Float, margin term in the loss definition.
+
+    Returns:
+      lifted_loss: tf.float32 scalar. The final division has a zero
+        denominator when no two distinct samples share a label.
+    """
+    # Reshape [batch_size] label tensor to a [batch_size, 1] label tensor.
+    # NOTE(review): the assert is presumably a rank-1 check on `labels`.
+    lshape = array_ops.shape(labels)
+    assert lshape.shape == 1
+    labels = array_ops.reshape(labels, [lshape[0], 1])
+
+    # NOTE(review): the helper is called with its defaults; confirm whether
+    #   it yields squared or plain distances (the NumPy test uses plain).
+    pairwise_distances = metric_learning.pairwise_distance(embeddings)
+
+    # Build pairwise binary adjacency matrix.
+    adjacency = math_ops.equal(labels, array_ops.transpose(labels))
+    # Invert so we can select negatives only.
+    adjacency_not = math_ops.logical_not(adjacency)
+
+    batch_size = array_ops.size(labels)
+
+    diff = margin - pairwise_distances
+    mask = math_ops.cast(adjacency_not, dtype=dtypes.float32)
+    # Masked row maximum: shift each row of `diff` to be non-negative, zero
+    #   out the same-label entries via `mask`, take the max, then shift back.
+    row_minimums = math_ops.reduce_min(diff, 1, keepdims=True)
+    row_negative_maximums = math_ops.reduce_max(
+        math_ops.multiply(diff - row_minimums, mask), 1,
+        keepdims=True) + row_minimums
+
+    # max_elements[i, j] = max(m_i, m_j), where m_i is the largest
+    #   `margin - distance` among the negatives of sample i.
+    # This matches the Caffe loss layer implementation at:
+    #   https://github.com/rksltnl/Caffe-Deep-Metric-Learning-CVPR16/blob/0efd7544a9846f58df923c8b992198ba5c355454/src/caffe/layers/lifted_struct_similarity_softmax_layer.cpp  # pylint: disable=line-too-long
+    max_elements = math_ops.maximum(row_negative_maximums,
+                                    array_ops.transpose(row_negative_maximums))
+    # Log-sum-exp over negatives, with max_elements factored out of the exp.
+    diff_tiled = array_ops.tile(diff, [batch_size, 1])
+    mask_tiled = array_ops.tile(mask, [batch_size, 1])
+    max_elements_vect = array_ops.reshape(
+        array_ops.transpose(max_elements), [-1, 1])
+
+    loss_exp_left = array_ops.reshape(
+        math_ops.reduce_sum(
+            math_ops.multiply(
+                math_ops.exp(diff_tiled - max_elements_vect), mask_tiled),
+            1,
+            keepdims=True), [batch_size, batch_size])
+
+    loss_mat = max_elements + math_ops.log(loss_exp_left +
+                                           array_ops.transpose(loss_exp_left))
+    # Add the positive distance.
+    loss_mat += pairwise_distances
+
+    mask_positives = math_ops.cast(
+        adjacency, dtype=dtypes.float32) - array_ops.diag(
+            array_ops.ones([batch_size]))
+
+    # *0.5 for upper triangular, and another *0.5 for 1/2 factor for loss^2.
+    num_positives = math_ops.reduce_sum(mask_positives) / 2.0
+
+    lifted_loss = math_ops.truediv(
+        0.25 * math_ops.reduce_sum(
+            math_ops.square(
+                math_ops.maximum(
+                    math_ops.multiply(loss_mat, mask_positives), 0.0))),
+        num_positives)
+    return lifted_loss
+
+
+@keras_utils.register_keras_custom_object
+class LiftedStructLoss(losses.LossFunctionWrapper):
+    """Computes the lifted structured loss.
+
+    The loss encourages the positive distances (between a pair of embeddings
+    with the same labels) to be smaller than any negative distances (between
+    a pair of embeddings with different labels) in the mini-batch in a way
+    that is differentiable with respect to the embedding vectors.
+    See: https://arxiv.org/abs/1511.06452.
+
+    Args:
+      margin: Float, margin term in the loss definition.
+      name: Optional name for the op.
+    """
+
+    def __init__(self, margin=1.0, name=None):
+        super(LiftedStructLoss, self).__init__(
+            lifted_struct_loss,
+            name=name,
+            reduction=losses_utils.ReductionV2.NONE,
+            margin=margin)
diff --git a/tensorflow_addons/losses/python/lifted_test.py b/tensorflow_addons/losses/python/lifted_test.py
@@ -0,0 +1,109 @@
+# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Tests for lifted loss."""
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import numpy as np
+
+from tensorflow.python.framework import constant_op
+from tensorflow.python.framework import test_util
+from tensorflow.python.platform import test
+from tensorflow_addons.losses.python import lifted
+
+
+def pairwise_distance_np(feature, squared=False):
+    """Computes the pairwise distance matrix in numpy.
+
+    Args:
+      feature: 2-D numpy array of size [number of data, feature dimension]
+      squared: Boolean. If true, output is the pairwise squared euclidean
+        distance matrix; else, output is the pairwise euclidean distance
+        matrix.
+
+    Returns:
+      pairwise_distances: 2-D numpy array of size
+        [number of data, number of data].
+    """
+    triu = np.triu_indices(feature.shape[0], 1)
+    upper_tri_pdists = np.linalg.norm(
+        feature[triu[1]] - feature[triu[0]], axis=1)
+    if squared:
+        upper_tri_pdists **= 2.
+    num_data = feature.shape[0]
+    pairwise_distances = np.zeros((num_data, num_data))
+    pairwise_distances[np.triu_indices(num_data, 1)] = upper_tri_pdists
+    # Make symmetrical.
+    pairwise_distances = pairwise_distances + pairwise_distances.T - np.diag(
+        pairwise_distances.diagonal())
+    return pairwise_distances
+
+
+class LiftedStructLossTest(test.TestCase):
+
+    @test_util.run_all_in_graph_and_eager_modes
+    def testLiftedStruct(self):
+        num_data = 10
+        feat_dim = 6
+        margin = 1.0
+        num_classes = 4
+
+        embedding = np.random.rand(num_data, feat_dim).astype(np.float32)
+        labels = np.random.randint(
+            0, num_classes, size=(num_data)).astype(np.float32)
+        # Reshape labels to compute adjacency matrix.
+        labels_reshaped = np.reshape(labels, (labels.shape[0], 1))
+
+        # Compute the loss in NP
+        adjacency = np.equal(labels_reshaped, labels_reshaped.T)
+        pdist_matrix = pairwise_distance_np(embedding)
+        loss_np = 0.0
+        num_constraints = 0.0
+        for i in range(num_data):
+            for j in range(num_data):
+                if adjacency[i][j] > 0.0 and i != j:
+                    d_pos = pdist_matrix[i][j]
+                    negs = []
+                    for k in range(num_data):
+                        if not adjacency[i][k]:
+                            negs.append(margin - pdist_matrix[i][k])
+                    for l in range(num_data):
+                        if not adjacency[j][l]:
+                            negs.append(margin - pdist_matrix[j][l])
+
+                    negs = np.array(negs)
+                    max_elem = np.max(negs)
+                    negs -= max_elem
+                    negs = np.exp(negs)
+                    soft_maximum = np.log(np.sum(negs)) + max_elem
+
+                    num_constraints += 1.0
+                    this_loss = max(soft_maximum + d_pos, 0)
+                    loss_np += this_loss * this_loss
+
+        loss_np = loss_np / num_constraints / 2.0
+
+        # Compute the loss in TF.
+        y_true = constant_op.constant(labels)
+        y_pred = constant_op.constant(embedding)
+        cce_obj = lifted.LiftedStructLoss()
+        loss = cce_obj(y_true, y_pred)
+        self.assertAlmostEqual(self.evaluate(loss), loss_np, 3)
+
+
+if __name__ == '__main__':
+    test.main()
diff --git a/tensorflow_addons/losses/python/triplet.py b/tensorflow_addons/losses/python/triplet.py
@@ -34,6 +34,7 @@ def _masked_maximum(data, mask, dim=1):
       data: 2-D float `Tensor` of size [n, m].
       mask: 2-D Boolean `Tensor` of size [n, m].
       dim: The dimension over which to compute the maximum.
+
     Returns:
       masked_maximums: N-D `Tensor`.
         The maximized dimension is of size 1 after the operation.
@@ -53,6 +54,7 @@ def _masked_minimum(data, mask, dim=1):
       data: 2-D float `Tensor` of size [n, m].
       mask: 2-D Boolean `Tensor` of size [n, m].
       dim: The dimension over which to compute the minimum.
+
     Returns:
       masked_minimums: N-D `Tensor`.
         The minimized dimension is of size 1 after the operation.