PiperOrigin-RevId: 224061027

This commit is contained in:
Steve Chien 2018-12-04 15:50:21 -08:00
parent c0a43b2178
commit afb8189dba
8 changed files with 590 additions and 37 deletions

README.md

@@ -4,10 +4,5 @@ This repository will contain implementations of TensorFlow optimizers that
support training machine learning models with (differential) privacy, as well
as tutorials and analysis tools for computing the privacy guarantees provided.
-The content of this repository will superseed the following existing repository:
+The content of this repository will supersede the following existing repository:
https://github.com/tensorflow/models/tree/master/research/differential_privacy
# Contact
* Steve Chien (schien@google.com)
* Nicolas Papernot (@npapernot)

privacy/optimizers/BUILD (new file)

@@ -0,0 +1,55 @@
licenses(["notice"]) # Apache 2.0
py_library(
name = "gaussian_average_query",
srcs = ["gaussian_average_query.py"],
deps = [
":private_queries",
"//third_party/py/tensorflow",
],
)
py_library(
name = "dp_optimizers",
deps = [
":dp_adam",
":dp_gradient_descent",
],
)
py_library(
name = "dp_adam",
srcs = [
"dp_adam.py",
],
deps = [
":gaussian_average_query",
"//third_party/py/tensorflow",
],
)
py_library(
name = "dp_gradient_descent",
srcs = [
"dp_gradient_descent.py",
],
deps = [
":gaussian_average_query",
"//third_party/py/tensorflow",
],
)
py_test(
name = "dp_optimizer_test",
srcs = ["dp_optimizer_test.py"],
deps = [
":dp_optimizers",
"//third_party/py/absl/testing:parameterized",
"//third_party/py/tensorflow",
],
)
py_library(
name = "private_queries",
srcs = ["private_queries.py"],
)

privacy/optimizers/dp_adam.py (new file)

@@ -0,0 +1,122 @@
# Copyright 2018, The TensorFlow Authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""DPAdamOptimizer for TensorFlow."""
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
import tensorflow as tf
import tensorflow_privacy.privacy.optimizers.gaussian_average_query as ph
class DPAdamOptimizer(tf.train.AdamOptimizer):
"""Optimizer that implements the DP Adam algorithm.
"""
def __init__(self,
learning_rate,
beta1=0.9,
beta2=0.999,
epsilon=1e-8,
use_locking=False,
l2_norm_clip=1e9,
noise_multiplier=0.0,
nb_microbatches=1,
name='DPAdam'):
"""Construct a new DP Adam optimizer.
Args:
learning_rate: A Tensor or a floating point value. The learning rate to
use.
beta1: A float value or a constant float tensor.
The exponential decay rate for the 1st moment estimates.
beta2: A float value or a constant float tensor.
The exponential decay rate for the 2nd moment estimates.
epsilon: A small constant for numerical stability. This epsilon is
"epsilon hat" in the Kingma and Ba paper (in the formula just before
Section 2.1), not the epsilon in Algorithm 1 of the paper.
use_locking: If True use locks for update operations.
l2_norm_clip: Clipping parameter for DP-SGD.
noise_multiplier: Noise multiplier for DP-SGD.
nb_microbatches: Number of microbatches in which to split the input.
name: Optional name prefix for the operations created when applying
gradients. Defaults to "DPAdam". @compatibility(eager) When eager
execution is enabled, `learning_rate` can be a callable that takes no
arguments and returns the actual value to use. This can be useful for
changing these values across different invocations of optimizer
functions. @end_compatibility
"""
super(DPAdamOptimizer, self).__init__(
learning_rate,
beta1,
beta2,
epsilon,
use_locking,
name)
stddev = l2_norm_clip * noise_multiplier
self._nb_microbatches = nb_microbatches
self._privacy_helper = ph.GaussianAverageQuery(l2_norm_clip, stddev,
nb_microbatches)
self._ph_global_state = self._privacy_helper.initial_global_state()
def compute_gradients(self,
loss,
var_list,
gate_gradients=tf.train.Optimizer.GATE_OP,
aggregation_method=None,
colocate_gradients_with_ops=False,
grad_loss=None):
# Note: it would be closer to the correct i.i.d. sampling of records if
# we sampled each microbatch from the appropriate binomial distribution,
# although that still wouldn't be quite correct because it would be sampling
# from the dataset without replacement.
microbatches_losses = tf.reshape(loss, [self._nb_microbatches, -1])
sample_params = (
self._privacy_helper.derive_sample_params(self._ph_global_state))
def process_microbatch(i, sample_state):
"""Process one microbatch (record) with privacy helper."""
grads, _ = zip(*super(DPAdamOptimizer, self).compute_gradients(
tf.gather(microbatches_losses, [i]), var_list, gate_gradients,
aggregation_method, colocate_gradients_with_ops, grad_loss))
sample_state = self._privacy_helper.accumulate_record(
sample_params, sample_state, grads)
return [tf.add(i, 1), sample_state]
i = tf.constant(0)
if var_list is None:
var_list = (
tf.trainable_variables() +
tf.get_collection(tf.GraphKeys.TRAINABLE_RESOURCE_VARIABLES))
sample_state = self._privacy_helper.initial_sample_state(
self._ph_global_state, var_list)
# Use of while_loop here requires that sample_state be a nested structure of
# tensors. In general, we would prefer to allow it to be an arbitrary
# opaque type.
_, final_state = tf.while_loop(
lambda i, _: tf.less(i, self._nb_microbatches), process_microbatch,
[i, sample_state])
final_grads, self._ph_global_state = (
self._privacy_helper.get_noised_average(final_state,
self._ph_global_state))
return zip(final_grads, var_list)
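
As a rough aid (not part of this commit), the constructor arguments of the optimizers above map onto the Gaussian average query as follows: each microbatch gradient is clipped to l2_norm_clip, Gaussian noise with stddev = l2_norm_clip * noise_multiplier is added to the clipped sum, and the result is divided by nb_microbatches. The numbers below are illustrative, not defaults from this commit.

# Illustrative arithmetic only; values are assumptions.
l2_norm_clip = 1.0
noise_multiplier = 1.1
nb_microbatches = 256

stddev_on_sum = l2_norm_clip * noise_multiplier       # noise added to the summed gradients: 1.1
stddev_on_average = stddev_on_sum / nb_microbatches   # per-coordinate noise on the returned average: ~0.0043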

privacy/optimizers/dp_gradient_descent.py (new file)

@@ -0,0 +1,106 @@
# Copyright 2018, The TensorFlow Authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""DPGradientDescentOptimizer for TensorFlow."""
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
import tensorflow as tf
import tensorflow_privacy.privacy.optimizers.gaussian_average_query as ph
class DPGradientDescentOptimizer(tf.train.GradientDescentOptimizer):
"""Optimizer that implements the DP gradient descent algorithm.
"""
def __init__(self,
learning_rate,
use_locking=False,
l2_norm_clip=1e9,
noise_multiplier=0.0,
nb_microbatches=1,
name='DPGradientDescent'):
"""Construct a new DP gradient descent optimizer.
Args:
learning_rate: A Tensor or a floating point value. The learning rate to
use.
use_locking: If True use locks for update operations.
l2_norm_clip: Clipping parameter for DP-SGD.
noise_multiplier: Noise multiplier for DP-SGD.
nb_microbatches: Number of microbatches in which to split the input.
name: Optional name prefix for the operations created when applying
gradients. Defaults to "DPGradientDescent". @compatibility(eager) When
eager execution is enabled, `learning_rate` can be a callable that takes
no arguments and returns the actual value to use. This can be useful for
changing these values across different invocations of optimizer
functions. @end_compatibility
"""
super(DPGradientDescentOptimizer, self).__init__(learning_rate, use_locking,
name)
stddev = l2_norm_clip * noise_multiplier
self._nb_microbatches = nb_microbatches
self._privacy_helper = ph.GaussianAverageQuery(l2_norm_clip, stddev,
nb_microbatches)
self._ph_global_state = self._privacy_helper.initial_global_state()
def compute_gradients(self,
loss,
var_list,
gate_gradients=tf.train.Optimizer.GATE_OP,
aggregation_method=None,
colocate_gradients_with_ops=False,
grad_loss=None):
# Note: it would be closer to the correct i.i.d. sampling of records if
# we sampled each microbatch from the appropriate binomial distribution,
# although that still wouldn't be quite correct because it would be sampling
# from the dataset without replacement.
microbatches_losses = tf.reshape(loss, [self._nb_microbatches, -1])
sample_params = (
self._privacy_helper.derive_sample_params(self._ph_global_state))
def process_microbatch(i, sample_state):
"""Process one microbatch (record) with privacy helper."""
grads, _ = zip(*super(DPGradientDescentOptimizer, self).compute_gradients(
tf.gather(microbatches_losses, [i]), var_list, gate_gradients,
aggregation_method, colocate_gradients_with_ops, grad_loss))
sample_state = self._privacy_helper.accumulate_record(
sample_params, sample_state, grads)
return [tf.add(i, 1), sample_state]
i = tf.constant(0)
if var_list is None:
var_list = (
tf.trainable_variables() +
tf.get_collection(tf.GraphKeys.TRAINABLE_RESOURCE_VARIABLES))
sample_state = self._privacy_helper.initial_sample_state(
self._ph_global_state, var_list)
# Use of while_loop here requires that sample_state be a nested structure of
# tensors. In general, we would prefer to allow it to be an arbitrary
# opaque type.
_, final_state = tf.while_loop(
lambda i, _: tf.less(i, self._nb_microbatches), process_microbatch,
[i, sample_state])
final_grads, self._ph_global_state = (
self._privacy_helper.get_noised_average(final_state,
self._ph_global_state))
return zip(final_grads, var_list)
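
A minimal end-to-end sketch (assumed usage, not part of this commit) of the optimizer above. Note that, unlike a standard optimizer, compute_gradients expects an unreduced vector of per-example losses whose length is divisible by nb_microbatches, since it is reshaped to [nb_microbatches, -1] internally. Parameter values below are illustrative.

import tensorflow as tf
from tensorflow_privacy.privacy.optimizers import dp_gradient_descent

var0 = tf.Variable([0.0, 0.0])
data0 = tf.constant([[3.0, 4.0], [5.0, 6.0], [7.0, 8.0], [-1.0, 0.0]])
# Per-example loss vector (length 4), split into 4 microbatches below.
vector_loss = 0.5 * tf.reduce_sum(tf.squared_difference(data0, var0), axis=1)

opt = dp_gradient_descent.DPGradientDescentOptimizer(
    learning_rate=0.1,
    l2_norm_clip=1.0,
    noise_multiplier=1.1,
    nb_microbatches=4)
grads_and_vars = opt.compute_gradients(vector_loss, [var0])
train_op = opt.apply_gradients(grads_and_vars)

with tf.Session() as sess:
  sess.run(tf.global_variables_initializer())
  for _ in range(100):
    sess.run(train_op)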

privacy/optimizers/dp_optimizer_test.py (new file)

@@ -0,0 +1,108 @@
# Copyright 2018, The TensorFlow Authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Tests for differentially private optimizers."""
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
from absl.testing import parameterized
import numpy as np
import tensorflow as tf
from tensorflow_privacy.privacy.optimizers import dp_adam
from tensorflow_privacy.privacy.optimizers import dp_gradient_descent
def loss(val0, val1):
"""Loss function that is minimized at the mean of the input points."""
return 0.5 * tf.reduce_sum(tf.squared_difference(val0, val1), axis=1)
class DPOptimizerTest(tf.test.TestCase, parameterized.TestCase):
# Parameters for testing: optimizer, nb_microbatches, expected answer.
@parameterized.named_parameters(
('DPGradientDescent 1', dp_gradient_descent.DPGradientDescentOptimizer, 1,
[-10.0, -10.0]),
('DPGradientDescent 2', dp_gradient_descent.DPGradientDescentOptimizer, 2,
[-5.0, -5.0]),
('DPGradientDescent 4', dp_gradient_descent.DPGradientDescentOptimizer, 4,
[-2.5, -2.5]), ('DPAdam 1', dp_adam.DPAdamOptimizer, 1, [-10.0, -10.0]),
('DPAdam 2', dp_adam.DPAdamOptimizer, 2, [-5.0, -5.0]),
('DPAdam 4', dp_adam.DPAdamOptimizer, 4, [-2.5, -2.5]))
def testBaseline(self, cls, nb_microbatches, expected_answer):
with self.cached_session() as sess:
var0 = tf.Variable([1.0, 2.0])
data0 = tf.Variable([[3.0, 4.0], [5.0, 6.0], [7.0, 8.0], [-1.0, 0.0]])
opt = cls(learning_rate=2.0, nb_microbatches=nb_microbatches)
self.evaluate(tf.global_variables_initializer())
# Fetch params to validate initial values
self.assertAllClose([1.0, 2.0], self.evaluate(var0))
# Expected gradient is sum of differences divided by number of
# microbatches.
gradient_op = opt.compute_gradients(loss(data0, var0), [var0])
grads_and_vars = sess.run(gradient_op)
self.assertAllCloseAccordingToType(expected_answer, grads_and_vars[0][0])
@parameterized.named_parameters(
('DPGradientDescent', dp_gradient_descent.DPGradientDescentOptimizer),
('DPAdam', dp_adam.DPAdamOptimizer))
def testClippingNorm(self, cls):
with self.cached_session() as sess:
var0 = tf.Variable([0.0, 0.0])
data0 = tf.Variable([[3.0, 4.0], [6.0, 8.0]])
opt = cls(learning_rate=2.0, l2_norm_clip=1.0, nb_microbatches=1)
self.evaluate(tf.global_variables_initializer())
# Fetch params to validate initial values
self.assertAllClose([0.0, 0.0], self.evaluate(var0))
# Expected gradient is sum of differences.
gradient_op = opt.compute_gradients(loss(data0, var0), [var0])
grads_and_vars = sess.run(gradient_op)
self.assertAllCloseAccordingToType([-0.6, -0.8], grads_and_vars[0][0])
@parameterized.named_parameters(
('DPGradientDescent', dp_gradient_descent.DPGradientDescentOptimizer),
('DPAdam', dp_adam.DPAdamOptimizer))
def testNoiseMultiplier(self, cls):
with self.cached_session() as sess:
var0 = tf.Variable([0.0])
data0 = tf.Variable([[0.0]])
opt = cls(
learning_rate=2.0,
l2_norm_clip=4.0,
noise_multiplier=2.0,
nb_microbatches=1)
self.evaluate(tf.global_variables_initializer())
# Fetch params to validate initial values
self.assertAllClose([0.0], self.evaluate(var0))
gradient_op = opt.compute_gradients(loss(data0, var0), [var0])
grads = []
for _ in range(1000):
grads_and_vars = sess.run(gradient_op)
grads.append(grads_and_vars[0][0])
# Test standard deviation is close to l2_norm_clip * noise_multiplier.
self.assertNear(np.std(grads), 2.0 * 4.0, 0.5)
if __name__ == '__main__':
tf.test.main()
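
For reference (a hand check, not part of the commit): in testClippingNorm the single microbatch's summed gradient at var0 = [0, 0] is [-(3 + 6), -(4 + 8)] = [-9, -12], whose l2 norm is 15; clipping to l2_norm_clip = 1.0 rescales it by 1/15, giving the expected [-0.6, -0.8]. In testNoiseMultiplier the true gradient is zero, so each sampled gradient is pure Gaussian noise with stddev = l2_norm_clip * noise_multiplier = 4.0 * 2.0 = 8.0 (the denominator is 1 because nb_microbatches = 1), which is the value np.std(grads) is compared against.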

privacy/optimizers/gaussian_average_query.py (new file)

@@ -0,0 +1,108 @@
# Copyright 2018, The TensorFlow Authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Implements PrivateQuery interface for Gaussian average queries.
"""
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
import collections
import tensorflow as tf
from tensorflow_privacy.privacy.optimizers import private_queries
class GaussianAverageQuery(private_queries.PrivateAverageQuery):
"""Implements PrivateQuery interface for Gaussian average queries.
Accumulates clipped vectors, then adds Gaussian noise to the average.
"""
# pylint: disable=invalid-name
_GlobalState = collections.namedtuple(
'_GlobalState', ['l2_norm_clip', 'stddev', 'denominator'])
def __init__(self, l2_norm_clip, stddev, denominator):
"""Initializes the GaussianAverageQuery."""
self._l2_norm_clip = l2_norm_clip
self._stddev = stddev
self._denominator = denominator
def initial_global_state(self):
"""Returns the initial global state for the PrivacyHelper."""
return self._GlobalState(
float(self._l2_norm_clip), float(self._stddev),
float(self._denominator))
def derive_sample_params(self, global_state):
"""Given the global state, derives parameters to use for the next sample.
Args:
global_state: The current global state.
Returns:
Parameters to use to process records in the next sample.
"""
return global_state.l2_norm_clip
def initial_sample_state(self, global_state, tensors):
"""Returns an initial state to use for the next sample.
Args:
global_state: The current global state.
tensors: A structure of tensors used as a template to create the initial
sample state.
Returns: An initial sample state.
"""
del global_state # unused.
return tf.contrib.framework.nest.map_structure(tf.zeros_like, tensors)
def accumulate_record(self, params, sample_state, record):
"""Accumulates a single record into the sample state.
Args:
params: The parameters for the sample.
sample_state: The current sample state.
record: The record to accumulate.
Returns:
The updated sample state.
"""
l2_norm_clip = params
clipped, _ = tf.clip_by_global_norm(record, l2_norm_clip)
return tf.contrib.framework.nest.map_structure(tf.add, sample_state,
clipped)
def get_noised_average(self, sample_state, global_state):
"""Gets noised average after all records of sample have been accumulated.
Args:
sample_state: The sample state after all records have been accumulated.
global_state: The global state.
Returns:
A tuple (estimate, new_global_state) where "estimate" is the estimated
average of the records and "new_global_state" is the updated global state.
"""
def noised_average(v):
return tf.truediv(
v + tf.random_normal(tf.shape(v), stddev=self._stddev),
global_state.denominator)
return (tf.contrib.framework.nest.map_structure(noised_average,
sample_state), global_state)
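
To make the query lifecycle concrete, here is a standalone sketch (illustrative values, not part of this commit). Records are lists of tensors, matching what tf.clip_by_global_norm expects; stddev is set to 0 so the result is deterministic.

import tensorflow as tf
from tensorflow_privacy.privacy.optimizers import gaussian_average_query

query = gaussian_average_query.GaussianAverageQuery(
    l2_norm_clip=1.0, stddev=0.0, denominator=2.0)
global_state = query.initial_global_state()
params = query.derive_sample_params(global_state)

# Two records, each a list with one tensor; the second exceeds the clip norm.
records = [[tf.constant([0.6, 0.8])], [tf.constant([3.0, 4.0])]]
sample_state = query.initial_sample_state(global_state, records[0])
for record in records:
  sample_state = query.accumulate_record(params, sample_state, record)
average, global_state = query.get_noised_average(sample_state, global_state)

with tf.Session() as sess:
  # [3.0, 4.0] is clipped down to [0.6, 0.8]; with stddev=0 the noiseless
  # average of the two accumulated records is again [0.6, 0.8].
  print(sess.run(average))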

privacy/optimizers/private_queries.py (new file)

@@ -0,0 +1,90 @@
# Copyright 2018, The TensorFlow Authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""An interface for differentially private query mechanisms.
"""
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
import abc
class PrivateQuery(object):
"""Interface for differentially private query mechanisms."""
__metaclass__ = abc.ABCMeta
@abc.abstractmethod
def initial_global_state(self):
"""Returns the initial global state for the PrivateQuery."""
pass
@abc.abstractmethod
def derive_sample_params(self, global_state):
"""Given the global state, derives parameters to use for the next sample.
Args:
global_state: The current global state.
Returns:
Parameters to use to process records in the next sample.
"""
pass
@abc.abstractmethod
def initial_sample_state(self, global_state, tensors):
"""Returns an initial state to use for the next sample.
Args:
global_state: The current global state.
tensors: A structure of tensors used as a template to create the initial
sample state.
Returns: An initial sample state.
"""
pass
@abc.abstractmethod
def accumulate_record(self, params, sample_state, record):
"""Accumulates a single record into the sample state.
Args:
params: The parameters for the sample.
sample_state: The current sample state.
record: The record to accumulate.
Returns:
The updated sample state.
"""
pass
class PrivateAverageQuery(PrivateQuery):
"""Interface for differentially private mechanisms to compute an average."""
@abc.abstractmethod
def get_noised_average(self, sample_state, global_state):
"""Gets average estimate after all records of sample have been accumulated.
Args:
sample_state: The sample state after all records have been accumulated.
global_state: The global state.
Returns:
A tuple (estimate, new_global_state) where "estimate" is the estimated
average of the records and "new_global_state" is the updated global state.
"""
pass
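
For illustration only (hypothetical, not part of this commit, and not differentially private), a minimal concrete implementation of the interface above, showing the contract each method is expected to satisfy:

import tensorflow as tf
from tensorflow_privacy.privacy.optimizers import private_queries

class PlainAverageQuery(private_queries.PrivateAverageQuery):
  """Toy query: averages records with no clipping and no noise."""

  def __init__(self, denominator):
    self._denominator = float(denominator)

  def initial_global_state(self):
    return self._denominator

  def derive_sample_params(self, global_state):
    del global_state  # No per-sample parameters are needed.
    return None

  def initial_sample_state(self, global_state, tensors):
    del global_state  # Unused.
    return tf.contrib.framework.nest.map_structure(tf.zeros_like, tensors)

  def accumulate_record(self, params, sample_state, record):
    del params  # Unused.
    return tf.contrib.framework.nest.map_structure(tf.add, sample_state, record)

  def get_noised_average(self, sample_state, global_state):
    average = tf.contrib.framework.nest.map_structure(
        lambda v: v / global_state, sample_state)
    return average, global_state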

Deleted file

@@ -1,31 +0,0 @@
# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
from absl import app
from absl import flags
FLAGS = flags.FLAGS
def main(argv):
if len(argv) > 1:
raise app.UsageError('Too many command-line arguments.')
if __name__ == '__main__':
app.run(main)