Sparsity Preserving DP-SGD in TF Privacy [3 of 5]

Adds sparse noise utilities that privately select sparse indices from gradients and add sparse noise to the selected entries. See https://research.google/blog/sparsity-preserving-differentially-private-training/ for more details on the algorithm. PiperOrigin-RevId: 654902527
2024-07-22 14:46:20 -07:00 · 2024-07-22 14:46:20 -07:00 · a56f33c4c5
commit a56f33c4c5
parent 8747858b5b
2 changed files with 342 additions and 1 deletions
--- a/tensorflow_privacy/privacy/sparsity_preserving_noise/sparse_noise_utils.py
+++ b/tensorflow_privacy/privacy/sparsity_preserving_noise/sparse_noise_utils.py
@ -16,8 +16,9 @@
 For more details on the algorithm, refer to https://arxiv.org/abs/2311.08357.
 """

-from typing import Optional, Sequence
+from typing import Callable, Mapping, Optional, Sequence

+from scipy import stats
 import tensorflow as tf
 import tensorflow_probability as tfp

@ -169,3 +170,191 @@ def sample_true_positive_indices(
      noised_contribution_count_values >= threshold
  ][:, 0]
  return tf.reshape(noised_contribution_counts_indices, (-1,))
+
+
+@tf.function
+def _remap_indices(
+    indices: tf.Tensor,
+    skip_indices: tf.Tensor,
+) -> tf.Tensor:
+  """Remaps the indices while skipping the skip indices.
+
+  Each index is shifted upwards by the number of skip indices that have to be
+  jumped over, so that no remapped index lands on a skip index.
+
+  As an example, if skip_indices = [1, 3], then the indices will be remapped as
+  follows:
+  0 -> 0
+  1 -> 2
+  2 -> 4
+  3 -> 5
+  4 -> 6
+  5 -> 7
+  ...
+
+  This is useful for merging the true positive and false positive indices.
+
+  Args:
+    indices: The indices to remap. Presumably int64, since the offsets added to
+      it below are built as int64 -- TODO confirm against callers.
+    skip_indices: The indices to skip while remapping. Assumed to be sorted.
+      NOTE(review): the gap computation below also appears to rely on the
+      entries being unique and non-negative -- confirm.
+
+  Returns:
+    The remapped indices.
+  """
+
+  def piecewise_map(skip_indices):
+    # map_counts[k] == k: the number of skip indices that precede the k-th skip
+    # index. The extra last entry is the total number of skip indices.
+    map_counts = tf.range(tf.size(skip_indices) + 1, dtype=tf.int64)
+    # Breakpoint for the k-th skip index: its value minus the k skip indices
+    # that come before it.
+    map_idx = skip_indices - map_counts[:-1]
+    # Prepend -1 so the gap in front of the first skip index is measured from
+    # index 0.
+    skip_indices = tf.concat([[-1], skip_indices], axis=0)
+    # Number of integers strictly between consecutive skip indices.
+    gaps = skip_indices[1:] - skip_indices[:-1] - 1
+
+    # Sentinel breakpoint; it is paired with a gap of 1 so that it survives the
+    # `gaps > 0` filter below.
+    map_idx = tf.concat([map_idx, [tf.int64.max]], axis=0)
+    gaps = tf.concat([gaps, [1]], axis=0)
+
+    # Only breakpoints preceded by a non-empty gap are kept.
+    return map_idx[gaps > 0], map_counts[gaps > 0]
+
+  map_idx, map_count = piecewise_map(skip_indices)
+  # side='right': position of the first breakpoint strictly greater than each
+  # index.
+  idx = tf.searchsorted(map_idx, indices, side='right')
+  # Offset stored for that breakpoint, i.e. how far the index is shifted.
+  offset = tf.gather(map_count, idx)
+  return indices + offset
+
+
+def sparse_private_partition_selection(
+    contribution_counts: tf.SparseTensor,
+    noise_multiplier: float,
+    threshold: int,
+) -> tf.Tensor:
+  """Differentially private partition selection.
+
+  Uses the sparse sampling algorithm to sample false positive indices. Also
+  assumes that the contribution counts are clipped to a per example contribution
+  of 1.
+
+  Args:
+    contribution_counts: The contribution counts for each index.
+    noise_multiplier: The noise multiplier to use for the gaussian noise. If it
+      is not positive, only the true positive indices are returned.
+    threshold: The threshold to use for the selection. Must be non-negative.
+
+  Returns:
+    A tensor of selected indices. When false positive indices are sampled, the
+    merged result is sorted.
+
+  Raises:
+    ValueError: If `threshold` is negative.
+  """
+  # The check accepts 0, so the message says "non-negative" rather than
+  # "positive".
+  if threshold < 0:
+    raise ValueError(f'Threshold must be non-negative, got {threshold}.')
+
+  true_positive_indices = sample_true_positive_indices(
+      contribution_counts, noise_multiplier, threshold
+  )
+
+  # No false positives are sampled when noise is disabled; returning here also
+  # keeps the division by `noise_multiplier` below well defined.
+  if noise_multiplier <= 0.0:
+    return true_positive_indices
+
+  # probability of selecting an index with zero contribution count.
+  prob = stats.norm.sf(threshold / noise_multiplier).item()
+
+  # False positives are sampled among the positions that have no stored entry
+  # in `contribution_counts`; `max_index` is the largest such position.
+  num_total_indices = tf.cast(contribution_counts.dense_shape[0], tf.int32)
+  num_non_zero_indices = tf.shape(contribution_counts.values)[0]
+  max_index = tf.cast(num_total_indices - num_non_zero_indices - 1, tf.int32)
+  false_positive_indices = sample_false_positive_indices(max_index, prob)
+  # Shift the sampled positions past the indices that do have stored entries.
+  # NOTE(review): flattening `indices` presumably assumes a rank-1 sparse
+  # tensor -- confirm against callers.
+  remapped_false_positive_indices = _remap_indices(
+      false_positive_indices, tf.reshape(contribution_counts.indices, (-1,))
+  )
+  merged_indices = tf.sort(
+      tf.concat(
+          [remapped_false_positive_indices, true_positive_indices], axis=0
+      )
+  )
+  return merged_indices
+
+
+def add_sparse_gradient_noise(
+    grad: tf.IndexedSlices, indices: tf.Tensor, noise_stddev: float
+) -> tf.IndexedSlices:
+  """Adds sparse gradient noise.
+
+  Gathers the rows of `grad` at `indices` and adds zero-mean gaussian noise to
+  them.
+
+  Args:
+    grad: A sparse gradient of type `tf.IndexedSlices`.
+    indices: The selected indices to keep.
+    noise_stddev: The standard deviation of the noise to add.
+
+  Returns:
+    A sparse gradient of type `tf.IndexedSlices` with the noise added. Its
+    indices are `indices` and its dense shape is that of `grad`.
+  """
+  # NOTE(review): `grad` is handed to tf.gather as-is, which presumably
+  # converts the IndexedSlices to a dense tensor first -- confirm the memory
+  # cost is acceptable for large embedding tables.
+  filtered_grad_values = tf.gather(grad, indices)
+  # Use the dynamic shape: the number of selected indices is data dependent, so
+  # the static shape may be only partially known when traced in a tf.function.
+  # The noise dtype follows the gradient so the addition below cannot hit a
+  # dtype mismatch.
+  sparse_noise_values = tf.random.normal(
+      tf.shape(filtered_grad_values),
+      mean=0.0,
+      stddev=noise_stddev,
+      dtype=filtered_grad_values.dtype,
+  )
+  filtered_noised_grad_values = filtered_grad_values + sparse_noise_values
+  return tf.IndexedSlices(
+      indices=indices,
+      values=filtered_noised_grad_values,
+      dense_shape=grad.dense_shape,
+  )
+
+
+def get_contribution_counts(
+    trainable_vars: list[tf.Variable],
+    grads: list[tf.Tensor],
+    varname_to_contribution_counts_fns: Mapping[
+        str, Optional[Sequence[Optional[Callable[[tf.Tensor], tf.Tensor]]]]
+    ],
+) -> list[tf.Tensor | None]:
+  """Gets the contribution counts for each variable in the Model.
+
+  Args:
+    trainable_vars: A list of the trainable variables in the Model.
+    grads: A corresponding list of gradients for each trainable variable.
+    varname_to_contribution_counts_fns: A mapping from variable name to a list
+      of functions to get the contribution counts for that variable. Each
+      function is called with the gradient of the variable. A variable that is
+      missing from the mapping, is mapped to `None` or an empty list, or whose
+      first function is falsy is treated as having no contribution counts
+      function.
+
+  Returns:
+    A list of contribution counts for each variable and None for variables that
+    do not have contribution counts function.
+
+  Raises:
+    NotImplementedError: If there are more than one contribution counts function
+      for a variable.
+  """
+  contribution_counts_list = []
+  for var, grad in zip(trainable_vars, grads):
+    # A single lookup covers both the "missing key" and the "None value" case.
+    contribution_counts_fns = varname_to_contribution_counts_fns.get(var.name)
+    if not contribution_counts_fns or not contribution_counts_fns[0]:
+      contribution_counts_list.append(None)
+      continue
+    # Several functions for one variable means the variable is shared.
+    if len(contribution_counts_fns) > 1:
+      raise NotImplementedError(
+          'Sparse noise is not supported for shared weight variables.'
+      )
+    contribution_counts_list.append(contribution_counts_fns[0](grad))
+
+  return contribution_counts_list
+
+
+def add_sparse_noise(
+    grad: tf.IndexedSlices,
+    contribution_counts: tf.SparseTensor,
+    noise_multiplier: float,
+    noise_multiplier_sparse: float,
+    l2_norm_clip: float,
+    threshold: int,
+) -> tf.IndexedSlices:
+  """Privately selects indices of a gradient and adds noise to them.
+
+  Args:
+    grad: A sparse gradient of type `tf.IndexedSlices`.
+    contribution_counts: The contribution counts for each index of grad.
+    noise_multiplier: The noise multiplier for the gradient noise; the noise
+      standard deviation is `noise_multiplier * l2_norm_clip`.
+    noise_multiplier_sparse: The noise multiplier passed to the partition
+      selection.
+    l2_norm_clip: The l2 norm clip at which the gradient is clipped.
+    threshold: The threshold passed to the partition selection.
+
+  Returns:
+    A sparse gradient of type `tf.IndexedSlices` with the noise added.
+  """
+  # Step 1: choose which indices are kept.
+  selected_indices = sparse_private_partition_selection(
+      contribution_counts, noise_multiplier_sparse, threshold
+  )
+  # Step 2: add gaussian noise to the kept entries.
+  gradient_noise_stddev = noise_multiplier * l2_norm_clip
+  return add_sparse_gradient_noise(
+      grad, selected_indices, gradient_noise_stddev
+  )
--- a/tensorflow_privacy/privacy/sparsity_preserving_noise/sparse_noise_utils_test.py
+++ b/tensorflow_privacy/privacy/sparsity_preserving_noise/sparse_noise_utils_test.py
@ -284,6 +284,158 @@ class SparseNoiseUtilsTest(tf.test.TestCase, parameterized.TestCase):
    self.assertGreater(batch_size, 0)
    self.assertLess(batch_size, max_index + 1)

+  def test_sparse_private_partition_selection_without_noise(self):
+    # With a zero noise multiplier, only index 0 (count 2.0) reaches the
+    # threshold of 2, so it is the only index expected back.
+    counts = tf.SparseTensor(
+        indices=[[0], [3], [5]],
+        values=[2.0, 1.0, 1.0],
+        dense_shape=[8],
+    )
+    selected = sparse_noise_utils.sparse_private_partition_selection(
+        counts, 0.0, 2
+    )
+    self.assertEqual(selected.numpy().tolist(), [0])
+
+  def test_sparse_private_partition_selection_with_noise(self):
+    # Index 0 has a count far above the threshold and is expected to be
+    # selected; with noise enabled the test also expects at least one more
+    # index in the result.
+    counts = tf.SparseTensor(
+        indices=[[0], [3], [5]],
+        values=[50.0, 1.0, 1.0],
+        dense_shape=[1000],
+    )
+    selected = sparse_noise_utils.sparse_private_partition_selection(
+        counts, 1.0, 1
+    )
+    selected_list = selected.numpy().tolist()
+    self.assertContainsSubset([0], selected_list)
+    self.assertGreater(len(selected_list), 1)
+
+  def test_remap_indices(self):
+    # Skipping 0, 1, 2 and 5 leaves 3, 4, 6, 7, 8, 9, ..., so positions 1, 5
+    # and 10 are expected to land on 4, 9 and 14.
+    positions = tf.constant([1, 5, 10], tf.int64)
+    skipped = tf.constant([0, 1, 2, 5], tf.int64)
+    remapped = sparse_noise_utils._remap_indices(positions, skipped)
+    self.assertEqual(remapped.numpy().tolist(), [4, 9, 14])
+
+  def test_remap_indices_no_skip(self):
+    # With nothing to skip, the indices are expected to come back unchanged.
+    positions = tf.constant([1, 5, 10], tf.int64)
+    nothing_skipped = tf.constant([], tf.int64)
+    remapped = sparse_noise_utils._remap_indices(positions, nothing_skipped)
+    self.assertEqual(remapped.numpy().tolist(), [1, 5, 10])
+
+  def test_add_sparse_gradient_noise(self):
+    # The gradient only has an entry for row 0, but row 1 is selected: the
+    # result should be indexed by the selection and carry non-zero values.
+    grad = tf.IndexedSlices(
+        values=tf.ones((1, 2)),
+        indices=tf.constant([0]),
+        dense_shape=tf.constant([2, 2]),
+    )
+    selected = tf.constant([1], dtype=tf.int64)
+    noised = sparse_noise_utils.add_sparse_gradient_noise(grad, selected, 1.0)
+    self.assertListEqual(
+        noised.indices.numpy().tolist(), selected.numpy().tolist()
+    )
+    first_row = noised.values[0].numpy().tolist()
+    self.assertNotEqual(first_row, [0.0, 0.0])
+
+  def test_get_contribution_counts(self):
+    # 'var1:0' has one counting function, 'var2:0' maps to None and 'var3:0' is
+    # absent from the mapping; the latter two are expected to yield None.
+    variables = [
+        tf.Variable(tf.ones((1, 2)), name=var_name)
+        for var_name in ('var1', 'var2', 'var3')
+    ]
+    sparse_grad = tf.IndexedSlices(
+        values=tf.ones((1, 2)),
+        indices=tf.constant([0]),
+        dense_shape=tf.constant([2, 2]),
+    )
+    gradients = [sparse_grad, tf.ones((1, 2)), tf.ones((1, 2))]
+    counts_fns_by_varname = {
+        'var1:0': [lambda grad: 1.0],
+        'var2:0': None,
+    }
+    actual = sparse_noise_utils.get_contribution_counts(
+        variables, gradients, counts_fns_by_varname
+    )
+    self.assertEqual(actual, [1.0, None, None])
+
+  def test_add_sparse_noise_without_noise(self):
+    # Both noise multipliers are zero and every count reaches the threshold, so
+    # the gradient is expected to come back with the same indices and values.
+    grad = tf.IndexedSlices(
+        values=tf.ones((3, 4)),
+        indices=tf.constant([0, 3, 5]),
+        dense_shape=tf.constant([8, 4]),
+    )
+    counts = tf.SparseTensor(
+        indices=[[0], [3], [5]],
+        values=[3.0, 1.0, 2.0],
+        dense_shape=[8],
+    )
+    result = sparse_noise_utils.add_sparse_noise(
+        grad,
+        counts,
+        noise_multiplier=0.0,
+        noise_multiplier_sparse=0.0,
+        l2_norm_clip=1.0,
+        threshold=1,
+    )
+    actual_indices = result.indices.numpy().tolist()
+    self.assertEqual(actual_indices, grad.indices.numpy().tolist())
+    actual_values = result.values.numpy().tolist()
+    self.assertEqual(actual_values, grad.values.numpy().tolist())
+
+  def test_add_sparse_noise_with_noise(self):
+    # All counts are well above the threshold, so the original indices are
+    # expected to be kept, and every kept value is expected to differ from the
+    # un-noised gradient.
+    grad = tf.IndexedSlices(
+        values=tf.ones((3, 4)),
+        indices=tf.constant([0, 3, 5]),
+        dense_shape=tf.constant([8, 4]),
+    )
+    counts = tf.SparseTensor(
+        indices=[[0], [3], [5]],
+        values=[10.0, 10.0, 20.0],
+        dense_shape=[8],
+    )
+    result = sparse_noise_utils.add_sparse_noise(
+        grad,
+        counts,
+        noise_multiplier=1.0,
+        noise_multiplier_sparse=1.0,
+        l2_norm_clip=1.0,
+        threshold=5,
+    )
+    self.assertContainsSubset(
+        grad.indices.numpy().tolist(),
+        result.indices.numpy().tolist(),
+    )
+    # Densify the result so the rows of the original indices can be looked up.
+    scatter_positions = tf.reshape(result.indices, (-1, 1))
+    dense_result = tf.scatter_nd(
+        scatter_positions, result.values, shape=(8, 4)
+    ).numpy()
+    rows_at_original_indices = dense_result[grad.indices.numpy()]
+    all_values_changed = np.all(
+        np.not_equal(rows_at_original_indices, grad.values.numpy())
+    )
+    self.assertTrue(all_values_changed)
+

 if __name__ == '__main__':
  tf.test.main()