From a4d108f270830ddacb24a7caf339898564ca9d78 Mon Sep 17 00:00:00 2001
From: Liwei Song
Date: Wed, 16 Dec 2020 15:47:15 -0500
Subject: [PATCH] Refactor privacy risk score computation and reporting

---
 .../data_structures.py             | 30 +++++++------
 .../data_structures_test.py        |  4 +-
 .../membership_inference_attack.py | 42 +++++++++++--------
 3 files changed, 44 insertions(+), 32 deletions(-)

diff --git a/tensorflow_privacy/privacy/membership_inference_attack/data_structures.py b/tensorflow_privacy/privacy/membership_inference_attack/data_structures.py
index 06670a6..cc1557f 100644
--- a/tensorflow_privacy/privacy/membership_inference_attack/data_structures.py
+++ b/tensorflow_privacy/privacy/membership_inference_attack/data_structures.py
@@ -462,21 +462,28 @@ class SingleRiskScoreResult:
     and further compute precision and recall values. We skip the threshold value if it is larger than every sample's privacy risk score.
     """
+    fpr, tpr, thresholds = metrics.roc_curve(
+        np.concatenate((np.ones(len(self.train_risk_scores)),
+                        np.zeros(len(self.test_risk_scores)))),
+        np.concatenate((self.train_risk_scores, self.test_risk_scores)),
+        drop_intermediate=False)
+
     precision_list = []
     recall_list = []
     meaningful_threshold_list = []
+    max_risk_score = max(self.train_risk_scores.max(), self.test_risk_scores.max())
     for threshold in threshold_list:
-      true_positive_normalized = np.sum(self.train_risk_scores>=threshold)/(len(self.train_risk_scores)+0.0)
-      false_positive_normalized = np.sum(self.test_risk_scores>=threshold)/(len(self.test_risk_scores)+0.0)
-      if true_positive_normalized+false_positive_normalized>0:
-        meaningful_threshold_list.append(threshold)
-        precision_list.append(true_positive_normalized/(true_positive_normalized+false_positive_normalized+0.0))
-        recall_list.append(true_positive_normalized)
+      if threshold <= max_risk_score:
+        idx = np.argwhere(thresholds>=threshold)[-1][0]
+        meaningful_threshold_list.append(threshold)
+        precision_list.append(tpr[idx]/(tpr[idx]+fpr[idx]))
+        recall_list.append(tpr[idx])
+
     return np.array(meaningful_threshold_list), np.array(precision_list), np.array(recall_list)

-  def collect_results(self, threshold_list=np.array([1,0.9,0.8,0.7,0.6,0.5])):
+  def collect_results(self, threshold_list):
     """
     The privacy risk score (from 0 to 1) represents each sample's probability of being in the training set.
-    Here, we choose a list of threshold values from 0.5 (uncertain of training or test) to 1 (100% certain of training)
+    Usually, we choose a list of threshold values from 0.5 (uncertain of training or test) to 1 (100% certain of training)
     to compute corresponding attack precision and recall.
""" meaningful_threshold_list, precision_list, recall_list = self.attack_with_varied_thresholds(threshold_list) @@ -496,14 +503,13 @@ class RiskScoreResults: risk_score_results: Iterable[SingleRiskScoreResult] - def summary(self): + def summary(self, threshold_list): """ return the summary of privacy risk score analysis on all given data slices """ summary = [] for single_result in self.risk_score_results: - single_summary = single_result.collect_results() - for line in single_summary: - summary.append(line) + single_summary = single_result.collect_results(threshold_list) + summary.extend(single_summary) return '\n'.join(summary) diff --git a/tensorflow_privacy/privacy/membership_inference_attack/data_structures_test.py b/tensorflow_privacy/privacy/membership_inference_attack/data_structures_test.py index 67c959d..d61c5ca 100644 --- a/tensorflow_privacy/privacy/membership_inference_attack/data_structures_test.py +++ b/tensorflow_privacy/privacy/membership_inference_attack/data_structures_test.py @@ -229,8 +229,8 @@ class SingleRiskScoreResultTest(absltest.TestCase): train_risk_scores=np.array([0.91,1,0.92,0.82,0.75]), test_risk_scores=np.array([0.81,0.7,0.75,0.25,0.3])) - self.assertEqual(result.attack_with_varied_thresholds(np.array([0.8,0.7]))[1].tolist(), [0.8,0.625]) - self.assertEqual(result.attack_with_varied_thresholds(np.array([0.8,0.7]))[2].tolist(), [0.8,1]) + self.assertEqual(result.attack_with_varied_thresholds(threshold_list=np.array([0.8,0.7]))[1].tolist(), [0.8,0.625]) + self.assertEqual(result.attack_with_varied_thresholds(threshold_list=np.array([0.8,0.7]))[2].tolist(), [0.8,1]) class AttackResultsCollectionTest(absltest.TestCase): diff --git a/tensorflow_privacy/privacy/membership_inference_attack/membership_inference_attack.py b/tensorflow_privacy/privacy/membership_inference_attack/membership_inference_attack.py index d17f99d..7b51b81 100644 --- a/tensorflow_privacy/privacy/membership_inference_attack/membership_inference_attack.py +++ b/tensorflow_privacy/privacy/membership_inference_attack/membership_inference_attack.py @@ -176,10 +176,13 @@ def run_attacks(attack_input: AttackInputData, def _compute_privacy_risk_score(attack_input: AttackInputData, num_bins: int = 15) -> SingleRiskScoreResult: - """compute each individual point's likelihood of being a member (https://arxiv.org/abs/2003.10595) + """Computes each individual point's likelihood of being a member (https://arxiv.org/abs/2003.10595). + For an individual sample, its privacy risk score is computed as the posterior probability of being in the training set + after observing its prediction output by the target machine learning model. 
+
   Args:
     attack_input: input data for compute privacy risk scores
-    num_bins: the number of bins used to compute the training/test histogram; we set the default as 15
+    num_bins: the number of bins used to compute the training/test histogram

   Returns:
     privacy risk score results
@@ -188,28 +191,31 @@ def _compute_privacy_risk_score(attack_input: AttackInputData,
   # If the loss or the entropy is provided, just use it;
   # Otherwise, call the function to compute the loss (you can also choose to compute entropy)
   if attack_input.loss_train is not None and attack_input.loss_test is not None:
-    train_values, test_values = attack_input.loss_train, attack_input.loss_test
+    train_values = attack_input.loss_train
+    test_values = attack_input.loss_test
   elif attack_input.entropy_train is not None and attack_input.entropy_test is not None:
-    train_values, test_values = attack_input.entropy_train, attack_input.entropy_test
+    train_values = attack_input.entropy_train
+    test_values = attack_input.entropy_test
   else:
-    train_values, test_values = attack_input.get_loss_train(), attack_input.get_loss_test()
+    train_values = attack_input.get_loss_train()
+    test_values = attack_input.get_loss_test()

   # Compute the histogram in the log scale
   small_value = 1e-10
-  train_log_values = np.log(np.maximum(train_values, small_value))
-  test_log_values = np.log(np.maximum(test_values, small_value))
+  train_values = np.maximum(train_values, small_value)
+  test_values = np.maximum(test_values, small_value)

-  min_log_value = np.amin(np.concatenate((train_log_values, test_log_values)))
-  max_log_value = np.amax(np.concatenate((train_log_values, test_log_values)))
-  bins_hist = np.linspace(min_log_value, max_log_value, num_bins+1)
+  min_value = min(train_values.min(), test_values.min())
+  max_value = max(train_values.max(), test_values.max())
+  bins_hist = np.logspace(np.log10(min_value), np.log10(max_value), num_bins+1)

-  train_hist, _ = np.histogram(train_log_values, bins=bins_hist)
-  train_hist = train_hist/(len(train_log_values)+0.0)
-  train_hist_indices = np.fmin(np.digitize(train_log_values, bins=bins_hist),num_bins)-1
+  train_hist, _ = np.histogram(train_values, bins=bins_hist)
+  train_hist = train_hist/(len(train_values)+0.0)
+  train_hist_indices = np.fmin(np.digitize(train_values, bins=bins_hist),num_bins)-1

-  test_hist, _ = np.histogram(test_log_values, bins=bins_hist)
-  test_hist = test_hist/(len(test_log_values)+0.0)
-  test_hist_indices = np.fmin(np.digitize(test_log_values, bins=bins_hist),num_bins)-1
+  test_hist, _ = np.histogram(test_values, bins=bins_hist)
+  test_hist = test_hist/(len(test_values)+0.0)
+  test_hist_indices = np.fmin(np.digitize(test_values, bins=bins_hist),num_bins)-1

   combined_hist = train_hist+test_hist
   combined_hist[combined_hist==0] = small_value
@@ -224,8 +230,8 @@ def _compute_privacy_risk_score(attack_input: AttackInputData,
                                 test_risk_scores=test_risk_scores)


-def privacy_risk_score_analysis(attack_input: AttackInputData,
-                                slicing_spec: SlicingSpec = None) -> RiskScoreResults:
+def run_privacy_risk_score_analysis(attack_input: AttackInputData,
+                                    slicing_spec: SlicingSpec = None) -> RiskScoreResults:
   """Perform privacy risk score analysis on all given slice types
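
For reference, a minimal usage sketch (not part of the patch) of how the renamed entry point and the now-required threshold_list argument fit together. It assumes the modules are importable under the paths shown in the diff and that per-example losses for the target model are available; the loss arrays below are made-up values purely for illustration.

    import numpy as np
    from tensorflow_privacy.privacy.membership_inference_attack import membership_inference_attack as mia
    from tensorflow_privacy.privacy.membership_inference_attack.data_structures import AttackInputData

    # Hypothetical per-example losses from the target model (illustrative only).
    attack_input = AttackInputData(
        loss_train=np.random.uniform(0.0, 1.0, size=1000),
        loss_test=np.random.uniform(0.5, 2.0, size=1000))

    results = mia.run_privacy_risk_score_analysis(attack_input)
    # threshold_list must now be passed explicitly to summary()/collect_results():
    # 0.5 means "uncertain of membership", 1 means "certain the example was in training".
    print(results.summary(threshold_list=np.array([1, 0.9, 0.8, 0.7, 0.6, 0.5])))

As a sanity check on the ROC-based computation, the updated test matches a hand calculation: with train risk scores [0.91, 1, 0.92, 0.82, 0.75] and test risk scores [0.81, 0.7, 0.75, 0.25, 0.3], threshold 0.8 flags 4/5 training and 1/5 test examples, giving precision 0.8/(0.8+0.2) = 0.8 and recall 0.8, while threshold 0.7 flags 5/5 and 3/5, giving precision 1.0/(1.0+0.6) = 0.625 and recall 1.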