Test DPModel in distributed training.

PiperOrigin-RevId: 528039164
2023-04-28 18:56:53 -07:00 · 2023-04-28 18:56:53 -07:00 · 8fdac5f833
commit 8fdac5f833
parent e65e14b2d6
2 changed files with 188 additions and 0 deletions
--- a/tensorflow_privacy/privacy/keras_models/BUILD
+++ b/tensorflow_privacy/privacy/keras_models/BUILD
@ -32,3 +32,12 @@ py_test(
        "//tensorflow_privacy/privacy/keras_models:dp_keras_model",
    ],
 )
+
+py_test(
+    name = "dp_keras_model_distributed_test",
+    srcs = ["dp_keras_model_distributed_test.py"],
+    deps = [
+        ":dp_keras_model",
+        "//tensorflow_privacy/privacy/fast_gradient_clipping:layer_registry",
+    ],
+)
--- a/tensorflow_privacy/privacy/keras_models/dp_keras_model_distributed_test.py
+++ b/tensorflow_privacy/privacy/keras_models/dp_keras_model_distributed_test.py
@ -0,0 +1,179 @@
+# Copyright 2023, The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""Tests DPModel in distributed training."""
+import contextlib
+import multiprocessing
+import os
+import sys
+from absl.testing import parameterized
+import numpy as np
+import tensorflow as tf
+
+from tensorflow_privacy.privacy.fast_gradient_clipping import layer_registry
+from tensorflow_privacy.privacy.keras_models import dp_keras_model
+
+
+ds_combinations = tf.__internal__.distribute.combinations
+
+
+STRATEGIES = [
+    ds_combinations.one_device_strategy,
+    ds_combinations.parameter_server_strategy_1worker_2ps_cpu,
+]
+
+
+def get_data(n, clip_norm):
+  # Data is for hidden weights of w* = [3, 1] and bias of b* = 2.
+  # For mean-squared loss, we have:
+  # loss = (data * w + b - label)^2 = (data * (w - w*) + (b - b*))^2
+  # Let T = (data * (w - w*) + (b - b*)), we have:
+  #   grad_w = 2 * T * data
+  #   grad_b = 2 * T
+  # For w = [0, 0], b = 0:
+  #   For data = [3, 4],  T = -15, grad_w = [-90, -120],  grad_b = -30
+  #   For data = [1, -1], T = -4,  grad_w = [-8, 8],      grad_b = -8
+  data = np.array([[3., 4.], [1., -1.]])
+  labels = np.matmul(data, [[3], [1]]) + 2
+  data, labels = np.tile(data, (n, 1)), np.tile(labels, (n, 1))
+
+  def clip_grad(grad):
+    norm = np.linalg.norm(grad)
+    if norm <= clip_norm:
+      return grad
+    return grad / norm * clip_norm
+
+  grad1 = clip_grad(np.array([-90., -120., -30.]))
+  grad2 = clip_grad(np.array([-8., 8., -8.]))
+  grad = np.mean(np.vstack([grad1, grad2]), axis=0)
+  return data, labels, grad
+
+
+class DPKerasModelDistributedTest(parameterized.TestCase, tf.test.TestCase):
+
+  @ds_combinations.generate(
+      tf.__internal__.test.combinations.combine(
+          strategy=STRATEGIES,
+          mode="eager",
+          # Clip norm corresponding to no-clipping, clipping one gradient, and
+          # clipping both gradients.
+          clip_norm=[1e5, 200., 1.],
+          model_or_sequential=["model", "sequential"],
+          fast_clipping=[False, True],
+      )
+  )
+  def test_training_works(
+      self, strategy, clip_norm, model_or_sequential, fast_clipping
+  ):
+    if model_or_sequential == "sequential" and fast_clipping:
+      self.skipTest("Fast clipping does not work for DPSequential.")
+
+    if isinstance(strategy, tf.distribute.OneDeviceStrategy):
+      strategy_scope = contextlib.nullcontext()
+    else:
+      strategy_scope = strategy.scope()
+
+    n = 10
+    x, y, expected_grad = get_data(n, clip_norm)
+
+    def make_model():
+      dense_layer = tf.keras.layers.Dense(
+          1, kernel_initializer="zeros", bias_initializer="zeros"
+      )
+      dp_kwargs = dict(
+          l2_norm_clip=clip_norm,
+          noise_multiplier=0.0,
+          num_microbatches=None,
+          use_xla=False,
+          layer_registry=layer_registry.make_default_layer_registry()
+          if fast_clipping
+          else None,
+      )
+      if model_or_sequential == "sequential":
+        model = dp_keras_model.DPSequential(
+            layers=[dense_layer],
+            **dp_kwargs,
+        )
+      else:
+        inputs = tf.keras.layers.Input((2,))
+        outputs = dense_layer(inputs)
+        model = dp_keras_model.DPModel(
+            inputs=inputs, outputs=outputs, **dp_kwargs
+        )
+      return model
+
+    with strategy_scope:
+      model = make_model()
+      self.assertEqual(model._enable_fast_peg_computation, fast_clipping)
+      lr = 0.01
+      opt = tf.keras.optimizers.SGD(learning_rate=lr)
+      loss = tf.keras.losses.MeanSquaredError(
+          reduction=tf.keras.losses.Reduction.SUM_OVER_BATCH_SIZE
+      )
+      model.compile(loss=loss, optimizer=opt)
+      history = model.fit(
+          x=x,
+          y=y,
+          epochs=1,
+          batch_size=x.shape[0],
+          steps_per_epoch=1,
+      )
+      self.assertIn("loss", history.history)
+      self.assertEqual(opt.iterations.numpy(), 1)
+      model_weights = model.get_weights()
+
+      expected_val = -expected_grad * lr
+      self.assertAllClose(model_weights[0], expected_val[:2].reshape(-1, 1))
+      self.assertAllClose(model_weights[1], [expected_val[2]])
+
+
+def _set_spawn_exe_path():
+  """Set the path to the executable for spawned processes.
+
+  This utility searches for the binary the parent process is using, and sets
+  the executable of multiprocessing's context accordingly.
+  It is branched from tensorflow/python/distribute/multi_process_lib.py, the
+  only change being that it additionally looks under "org_tensorflow_privacy".
+  """
+  if sys.argv[0].endswith(".py"):
+
+    def guess_path(package_root):
+      # If all we have is a python module path, we'll need to make a guess for
+      # the actual executable path.
+      if "bazel-out" in sys.argv[0] and package_root in sys.argv[0]:
+        # Guess the binary path under bazel. For target
+        # //tensorflow/python/distribute:input_lib_test_multiworker_gpu, the
+        # argv[0] is in the form of
+        # /.../tensorflow/python/distribute/input_lib_test.py
+        # and the binary is
+        # /.../tensorflow/python/distribute/input_lib_test_multiworker_gpu
+        package_root_base = sys.argv[0][: sys.argv[0].rfind(package_root)]
+        binary = os.environ["TEST_TARGET"][2:].replace(":", "/", 1)
+        possible_path = os.path.join(package_root_base, package_root, binary)
+        if os.access(possible_path, os.X_OK):
+          return possible_path
+      return None
+
+    path = (
+        guess_path("org_tensorflow")
+        or guess_path("org_keras")
+        or guess_path("org_tensorflow_privacy")
+    )
+    if path is not None:
+      sys.argv[0] = path
+      multiprocessing.get_context().set_executable(sys.argv[0])
+
+
+if __name__ == "__main__":
+  _set_spawn_exe_path()
+  tf.__internal__.distribute.multi_process_runner.test_main()