Handle the case when the data comes from a multilabel classification problem but the provided samples happen to have just one positive label per sample.

PiperOrigin-RevId: 445468067
2022-04-29 11:36:21 -07:00 · 2022-04-29 11:36:21 -07:00 · 930c4d13e8
commit 930c4d13e8
parent e0ab480e3d
3 changed files with 54 additions and 0 deletions
--- a/tensorflow_privacy/privacy/privacy_tests/membership_inference_attack/data_structures.py
+++ b/tensorflow_privacy/privacy/privacy_tests/membership_inference_attack/data_structures.py
@ -235,6 +235,13 @@ class AttackInputData:
  # corresponding class is absent from the example, and 1s where the
  # corresponding class is present.
  multilabel_data: Optional[bool] = None
+  # In some corner cases, the provided data comes from a multi-label
+  # classification model, but every sample happens to have exactly one
+  # positive label. In that case, the `is_multilabel_data()` test returns
+  # `False`, so `validate()` expects 1D input and raises a `ValueError`.
+  # Handle this case by letting the user set a flag that forces the input
+  # data to be treated as multilabel data.
+  force_multilabel_data: bool = False

  @property
  def num_classes(self):
@ -450,6 +457,10 @@ class AttackInputData:
    Raises:
      ValueError if the dimensionality of the train and test data are not equal.
    """
+    # If 'force_multilabel_data' is set, then assume multilabel data going
+    # forward.
+    if self.force_multilabel_data:
+      self.multilabel_data = True
    # If the data has already been checked for multihot encoded labels, then
    # return the result of the evaluation.
    if self.multilabel_data is not None:
--- a/tensorflow_privacy/privacy/privacy_tests/membership_inference_attack/data_structures_test.py
+++ b/tensorflow_privacy/privacy/privacy_tests/membership_inference_attack/data_structures_test.py
@ -358,6 +358,41 @@ class AttackInputDataTest(parameterized.TestCase):
    np.testing.assert_equal(attack_input.get_loss_test().tolist(),
                            np.array([[1.0, 4.0, 6.0], [1.0, 2.0, 3.0]]))

+  def test_validate_with_force_multilabel_false(self):
+    """Checks validate() raises ValueError for 2D labels without the flag."""
+    unforced_input = AttackInputData(
+        probs_train=np.array([[0.2, 0.3, 0.7], [0.8, 0.6, 0.9]]),
+        probs_test=np.array([[0.8, 0.7, 0.9]]),
+        labels_train=np.array([[0, 0, 1], [0, 1, 0]]),
+        labels_test=np.array([[1, 0, 0]]))
+    # 'force_multilabel_data' is left at its default, so validation is
+    # expected to reject the two dimensional inputs.
+    with self.assertRaisesRegex(ValueError,
+                                r'should be a one dimensional numpy array.'):
+      unforced_input.validate()
+
+  def test_validate_with_force_multilabel_true(self):
+    """Checks validate() raises no ValueError when multilabel is forced."""
+    attack_input = AttackInputData(
+        probs_train=np.array([[0.2, 0.3, 0.7], [0.8, 0.6, 0.9]]),
+        probs_test=np.array([[0.8, 0.7, 0.9]]),
+        labels_train=np.array([[0, 0, 1], [0, 1, 0]]),
+        labels_test=np.array([[1, 0, 0]]),
+        force_multilabel_data=True)
+    try:
+      attack_input.validate()
+    except ValueError as e:
+      # For a 'ValueError' exception the test should record a failure. All
+      # other exceptions are errors. The message reports that the exception
+      # was raised (the failure condition) and carries its text.
+      self.fail('Unexpected ValueError raised by validate(): %s' % e)
+
+  def test_multilabel_data_true_with_force_multilabel_true(self):
+    """Checks `multilabel_data` is truthy once `force_multilabel_data` is set."""
+    forced_input = AttackInputData(
+        probs_train=np.array([[0.2, 0.3, 0.7], [0.8, 0.6, 0.9]]),
+        probs_test=np.array([[0.8, 0.7, 0.9]]),
+        labels_train=np.array([[0, 0, 1], [0, 1, 0]]),
+        labels_test=np.array([[1, 0, 0]]),
+        force_multilabel_data=True)
+    # Message reported when the attribute is falsy after construction.
+    failure_msg = (
+        '"force_multilabel_data" is True but "multilabel_data" is False.')
+    self.assertTrue(forced_input.multilabel_data, failure_msg)
+

 class RocCurveTest(absltest.TestCase):

--- a/tensorflow_privacy/privacy/privacy_tests/membership_inference_attack/membership_inference_attack.py
+++ b/tensorflow_privacy/privacy/privacy_tests/membership_inference_attack/membership_inference_attack.py
@ -217,6 +217,7 @@ def run_attacks(attack_input: AttackInputData,
  """
  attack_input.validate()
  attack_results = []
+  attack_types = list(attack_types)

  if slicing_spec is None:
    slicing_spec = SlicingSpec(entire_dataset=True)
@ -224,6 +225,10 @@ def run_attacks(attack_input: AttackInputData,
  if slicing_spec.by_class:
    num_classes = attack_input.num_classes
  input_slice_specs = get_single_slice_specs(slicing_spec, num_classes)
+  num_slice_specs = len(input_slice_specs)
+  num_attacks = len(attack_types)
+  logging.info('Will run %s attacks on each of %s slice specifications.',
+               num_attacks, num_slice_specs)
  for single_slice_spec in input_slice_specs:
    attack_input_slice = get_slice(attack_input, single_slice_spec)
    for attack_type in attack_types:
@ -231,6 +236,9 @@ def run_attacks(attack_input: AttackInputData,
      attack_result = _run_attack(attack_input_slice, attack_type,
                                  balance_attacker_training, min_num_samples)
      if attack_result is not None:
+        logging.info('%s attack had an AUC=%s and attacker advantage=%s',
+                     attack_type.name, attack_result.get_auc(),
+                     attack_result.get_attacker_advantage())
        attack_results.append(attack_result)

  privacy_report_metadata = _compute_missing_privacy_report_metadata(