[Triplet Margin Loss] Issue 1118 #1120
base: main
File: optax/losses/_self_supervised.py
```diff
@@ -115,6 +115,72 @@ def ntxent(
   denom = jnp.sum(jnp.exp(xcs_shift_diffs), axis=1, keepdims=True)
   denom += numer_exp
   log_softm = numer - jnp.log(denom)
-  loss = -jnp.where(matches == 1, log_softm, 0.0).sum() / matches.sum()
+  loss = -jnp.where(matches == 1, log_softm, 0.0).sum()/matches.sum()

   return loss


+def triplet_loss(
+    anchors: chex.Array,
+    positives: chex.Array,
+    negatives: chex.Array,
+    axis: chex.Numeric = -1,
+    p: chex.Numeric = 2,
```
> **Review comment** (on `p: chex.Numeric = 2`): You may want to include the case …
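The comment above is truncated, but it attaches to the `p` argument, and the implementation below applies `jnp.sqrt` to the summed powers regardless of `p`, so only `p = 2` yields a true Minkowski distance. A hedged sketch of a distance helper that would honor arbitrary `p` (hypothetical naming, not code from this PR):

```python
import jax.numpy as jnp

def minkowski_distance(x, y, p=2, axis=-1, eps=1e-6):
  # General p-norm distance: (sum |x - y|^p)^(1/p).
  # For p = 2 this matches the Euclidean distance the PR computes.
  return jnp.power(jnp.power(jnp.abs(x - y), p).sum(axis) + eps, 1.0 / p)
```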
```diff
+    margin: chex.Numeric = 1.0,
+    eps: chex.Numeric = 1e-6,
+    reduction: str = 'none',
```
> **Review comment** (on `reduction: str = 'none'`): Remove the `reduction` option. No losses in optax reduce the losses after computation.
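To illustrate the convention the reviewer is invoking: optax losses return one value per example, and any reduction is applied at the call site. A minimal sketch, using the PR's function as written (with its default `reduction='none'`):

```python
import jax.numpy as jnp
from optax.losses import _self_supervised

anchors = jnp.array([[0.0, 0.0], [1.0, 1.0]])
positives = jnp.array([[0.1, 0.1], [1.1, 1.1]])
negatives = jnp.array([[1.0, 0.0], [0.0, 1.0]])

# Per-triplet losses, shape [batch]; the caller reduces explicitly.
per_example = _self_supervised.triplet_loss(anchors, positives, negatives)
mean_loss = per_example.mean()  # what reduction='mean' would have done
sum_loss = per_example.sum()    # what reduction='sum' would have done
```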
```diff
+) -> chex.Array:
+  """Computes the triplet loss for a batch of embeddings.
+
+  Examples:
+    >>> import jax.numpy as jnp
+    >>> import optax
+    >>> anchors = jnp.array([[0.0, 0.0], [1.0, 1.0]])
+    >>> positives = jnp.array([[0.1, 0.1], [1.1, 1.1]])
+    >>> negatives = jnp.array([[1.0, 0.0], [0.0, 1.0]])
+    >>> output = optax.triplet_loss(anchors, positives, negatives, margin=1.0)
+    >>> print(output)
+    [0.14142442 0.14142442]
+
+  Args:
+    anchors: An array of anchor embeddings, with shape [batch, feature_dim].
```
> **Review comment** (on the `Args:` section): Add indents appropriately, like that: …
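The reviewer's example is cut off; presumably it shows Google-style continuation indentation, where wrapped lines of an argument description are indented two spaces past the argument name. A reconstruction of what that looks like:

```python
def example(positives):
  """Short summary line.

  Args:
    positives: An array of positive embeddings (similar to anchors),
      with shape [batch, feature_dim].
  """
```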
```diff
+    positives: An array of positive embeddings
+      (similar to anchors), with shape [batch, feature_dim].
+    negatives: An array of negative embeddings
+      (dissimilar to anchors), with shape [batch, feature_dim].
+    axis: The axis along which to compute the distances
+      (default is -1).
+    p: The norm degree for distance calculation
+      (default is 2, for Euclidean distance).
+    margin: The minimum margin by which the positive distance
+      should be smaller than the negative distance.
+    eps: A small epsilon value to ensure numerical stability
+      in the distance calculation.
+    reduction: Specifies the reduction to apply to the
+      output: 'none' | 'mean' | 'sum'.
+
+  Returns:
+    The computed triplet loss as an array or scalar,
+    depending on the reduction parameter.
+    If reduction is 'mean' or 'sum', returns a scalar.
+
+  References:
+    Learning shallow convolutional feature descriptors with triplet losses
```
> **Review comment** (on the `References:` section): Use the following formatting for references: …
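The reviewer's template is also cut off. Elsewhere in optax, references follow an author, linked-title, year pattern, so the intended form is presumably something like the following (reusing the PR's own title and URL):

```python
"""
References:
  V. Balntas et al., `Learning shallow convolutional feature descriptors
  with triplet losses
  <https://bmva-archive.org.uk/bmvc/2016/papers/paper119/abstract119.pdf>`_, 2016
"""
```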
```diff
+    by V. Balntas, E. Riba et al.
+    <https://bmva-archive.org.uk/bmvc/2016/papers/paper119/abstract119.pdf>
+  """
+  chex.assert_type([anchors], float)
```
> **Review comment** (on the `chex.assert_type` lines): Remove the three …
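If some type checking were kept at all, `chex.assert_type` also accepts a list of inputs, so the three calls could collapse into one. A hedged sketch (my reading of the truncated comment, not necessarily the reviewer's intent):

```python
import chex
import jax.numpy as jnp

anchors = jnp.zeros((2, 2))
positives = jnp.ones((2, 2))
negatives = jnp.ones((2, 2)) * 2

# One call checks all three arrays at once.
chex.assert_type([anchors, positives, negatives], float)
```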
```diff
+  chex.assert_type([positives], float)
+  chex.assert_type([negatives], float)
+  positive_distance = jnp.sqrt(
+      jnp.power(anchors - positives, p).sum(axis) + eps
+  )
+  negative_distance = jnp.sqrt(
+      jnp.power(anchors - negatives, p).sum(axis) + eps
+  )
+  loss = jnp.maximum(positive_distance - negative_distance + margin, 0)
+  if reduction == 'mean':
```
> **Review comment** (on the `reduction` branches): As said above, remove the reduction options.
```diff
+    return loss.mean()
+  elif reduction == 'sum':
+    return loss.sum()
+  else:
+    return loss
```
File: optax/losses/_self_supervised_test.py
```diff
@@ -14,12 +14,13 @@
 # ==============================================================================
 """Tests for self-supervised losses in `optax.losses._self_supervised.py`."""

-from absl.testing import absltest
+from absl.testing import absltest, parameterized
 import chex
 import jax
 import jax.numpy as jnp
 import numpy as np
-from optax.losses import _self_supervised
+
+from optax.losses import _self_supervised


 class NtxentTest(chex.TestCase):
```
```diff
@@ -46,7 +47,6 @@ def setUp(self):

   @chex.all_variants
   def test_batched(self):
-    """Tests for a full batch."""
     np.testing.assert_allclose(
         self.variant(_self_supervised.ntxent)(self.ys, self.ts_1),
         self.exp_1,
```
```diff
@@ -65,6 +65,67 @@ def test_batched(self):
         atol=1e-4,
     )

+
+class TripletMarginLossTest(chex.TestCase, parameterized.TestCase):
+
+  def setUp(self):
```
> **Review comment** (on `TripletMarginLossTest`): Avoid using numerical values as expected returns. You may also add a test for some specific behaviors (like using `swap` here). Also, you should test this function under jit/vmap etc. (see the `chex.all_variants` utility in some other tests).
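For context on the `swap` behavior the reviewer mentions: in the distance-swap trick from Balntas et al. (2016), the negative distance is taken as the minimum of d(anchor, negative) and d(positive, negative), i.e. the harder negative. A hedged sketch of how the PR's loss might support it (hypothetical extension, not code from this PR):

```python
import jax.numpy as jnp

def triplet_loss_with_swap(anchors, positives, negatives,
                           margin=1.0, eps=1e-6, swap=False):
  # Euclidean distance along the feature axis, as in the PR.
  d = lambda x, y: jnp.sqrt(jnp.power(x - y, 2).sum(-1) + eps)
  positive_distance = d(anchors, positives)
  negative_distance = d(anchors, negatives)
  if swap:
    # Distance swap: use whichever of the two negatives is harder.
    negative_distance = jnp.minimum(negative_distance, d(positives, negatives))
  return jnp.maximum(positive_distance - negative_distance + margin, 0)
```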
```diff
+    super().setUp()
+    self.a1 = jnp.ones((2, 2))
+    self.p1 = jnp.zeros((2, 2))
+    self.n1 = jnp.ones((2, 2)) * 2
+    self.a2 = jnp.zeros((2, 2))
+    self.p2 = jnp.ones((2, 2))
+    self.n2 = jnp.ones((2, 2)) * 2
+
+  @chex.all_variants
+  @parameterized.parameters([
+      {
+          'anchor': jnp.ones((2, 2)),
+          'positive': jnp.zeros((2, 2)),
+          'negative': jnp.ones((2, 2)) * 2,
+          'margin': 1.0,
+      },
+      {
+          'anchor': jnp.zeros((2, 2)),
+          'positive': jnp.ones((2, 2)),
+          'negative': jnp.ones((2, 2)) * 2,
+          'margin': 1.0,
+      },
+  ])
```
```diff
+  def test_batched(self, anchor, positive, negative, margin):
+    def testing_triplet_loss(a, p, n, margin=1.0, p_norm=2, eps=1e-6):
+      ap_distance = jnp.sqrt(jnp.sum(jnp.power(a - p, p_norm)) + eps)
+      an_distance = jnp.sqrt(jnp.sum(jnp.power(a - n, p_norm)) + eps)
+      return jnp.maximum(ap_distance - an_distance + margin, 0)
+
+    handmade_result = testing_triplet_loss(
+        a=anchor, p=positive, n=negative, margin=margin
+    )
+    result = self.variant(_self_supervised.triplet_loss)(
+        anchor, positive, negative
+    )
+    np.testing.assert_allclose(result, handmade_result, atol=1e-4)
+
+  @chex.all_variants
+  @parameterized.parameters([
+      {
+          'anchor': jnp.ones((2, 2)),
+          'positive': jnp.zeros((2, 2)),
+          'negative': jnp.ones((2, 2)) * 2,
+      },
+  ])
+  def test_vmap(self, anchor, positive, negative):
+    original_loss = _self_supervised.triplet_loss(
+        anchor, positive, negative, reduction='none'
+    )
+    anchor_batched = anchor.reshape(1, *anchor.shape)
+    positive_batched = positive.reshape(1, *positive.shape)
+    negative_batched = negative.reshape(1, *negative.shape)
+    vmap_loss = self.variant(
+        jax.vmap(_self_supervised.triplet_loss, in_axes=(0, 0, 0))
+    )(anchor_batched, positive_batched, negative_batched)
+    np.testing.assert_allclose(
+        vmap_loss.flatten(), original_loss.flatten(), atol=1e-4
+    )
+
+
 if __name__ == '__main__':
   absltest.main()
```
> **Review comment** (suggested change): `axis: int = -1`
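Putting the review threads together, a hedged sketch of what the function might look like once the comments are addressed: `reduction` removed so callers reduce, and `axis` typed as a plain `int`. This is my synthesis, not the merged code:

```python
import chex
import jax.numpy as jnp

def triplet_loss_revised(
    anchors: chex.Array,
    positives: chex.Array,
    negatives: chex.Array,
    axis: int = -1,
    p: chex.Numeric = 2,
    margin: chex.Numeric = 1.0,
    eps: chex.Numeric = 1e-6,
) -> chex.Array:
  # Returns one loss per triplet; the caller applies mean/sum as needed.
  positive_distance = jnp.sqrt(jnp.power(anchors - positives, p).sum(axis) + eps)
  negative_distance = jnp.sqrt(jnp.power(anchors - negatives, p).sum(axis) + eps)
  return jnp.maximum(positive_distance - negative_distance + margin, 0)
```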