|
| 1 | +# (c) Meta Platforms, Inc. and affiliates. Confidential and proprietary. |
| 2 | + |
| 3 | +# pyre-strict |
| 4 | +import logging |
| 5 | +from dataclasses import dataclass |
| 6 | +from typing import List, Tuple |
| 7 | + |
| 8 | +import numpy as np |
| 9 | +import torch |
| 10 | +from privacy_guard.analysis.base_analysis_output import BaseAnalysisOutput |
| 11 | +from privacy_guard.analysis.lia.lia_analysis_input import LIAAnalysisInput |
| 12 | +from privacy_guard.analysis.mia.analysis_node import AnalysisNode |
| 13 | +from privacy_guard.analysis.mia.mia_results import MIAResults |
| 14 | +from tqdm import tqdm |
| 15 | + |
# Module-level logger following the standard `getLogger(__name__)` convention.
logger: logging.Logger = logging.getLogger(__name__)

# Alias mapping a timed-phase name to its elapsed time.
# NOTE(review): assumed to back `_timer_stats` populated via AnalysisNode's
# timer; units presumably seconds — confirm against AnalysisNode.timer.
TimerStats = dict[str, float]
| 19 | + |
| 20 | + |
@dataclass
class LIAAnalysisOutput(BaseAnalysisOutput):
    """
    A dataclass to encapsulate the outputs of LIAAnalysisNode.

    Epsilon values are reported as lower/upper bounds (LB/UB) derived from
    bootstrap confidence intervals, both at the single worst-case error
    threshold and per-threshold across all thresholds evaluated.
    """

    # Epsilon upper bound: the highest UB across all error thresholds.
    eps: float
    # Lower bound associated with the UB epsilon above (same threshold).
    eps_lb: float
    # Attack accuracy and AUC, each with a bootstrap confidence interval.
    accuracy: float
    accuracy_ci: List[float]  # [lower, upper] confidence interval
    auc: float
    auc_ci: List[float]  # [lower, upper] confidence interval
    # Error rate at which the maximum eps upper bound is achieved.
    error_rate_at_max_eps: float
    # Per-threshold eps LB and UB where eps = max(eps_tpr, eps_fpr).
    eps_max_bounds: Tuple[
        List[float], List[float]
    ]  # (LB list, UB list), one entry per error threshold
    # Per-threshold eps LB and UB computed from TPR thresholds only.
    eps_at_tpr_bounds: Tuple[
        List[float], List[float]
    ]  # (LB list, UB list)
    # Per-threshold eps LB and UB computed from FPR thresholds only.
    eps_at_fpr_bounds: Tuple[
        List[float], List[float]
    ]  # (LB list, UB list)
    # Number of samples per game instantiation.
    data_size: int
    # Mean of the input labels (y0) and of the two prediction arrays.
    label_mean: float
    prediction_mean: float
    prediction_y1_generation_mean: float
| 49 | + |
| 50 | + |
class LIAAnalysisNode(AnalysisNode):
    """Computes label inference attack (LIA) privacy metrics.

    For each game instantiation the node scores every sample, bootstraps the
    resulting train/test score sets, converts the attack metrics into epsilon
    bounds via MIAResults, and aggregates everything into a LIAAnalysisOutput.
    """

    def __init__(
        self,
        analysis_input: LIAAnalysisInput,
        delta: float,
        num_bootstrap_resampling_times: int = 10,
        cap_eps: bool = True,
        show_progress: bool = False,
        with_timer: bool = False,
        power: float = 0.0,
        use_fnr_and_tnr: bool = False,
    ) -> None:
        """
        Args:
            analysis_input: LIA inputs (labels, predictions, per-game bits).
            delta: delta used when converting attack metrics to epsilon.
            num_bootstrap_resampling_times: bootstrap repetitions per game.
            cap_eps: whether to cap epsilon estimates (forwarded to
                MIAResults.compute_metrics_at_error_threshold).
            show_progress: show a tqdm progress bar and verbose metric logs.
            with_timer: enable timing of analysis phases.
            power: non-negative exponent for the score weighting term.
            use_fnr_and_tnr: also use FNR/TNR thresholds in the metric
                computation (forwarded as use_fnr_tnr).

        Raises:
            ValueError: if power is negative.
        """
        if power < 0:
            raise ValueError("Power used for score function must be non-negative")

        self._delta = delta
        self._num_bootstrap_resampling_times = num_bootstrap_resampling_times
        self._cap_eps = cap_eps
        self._show_progress = show_progress
        self._with_timer = with_timer
        self._analysis_input = analysis_input
        # Use the module-level TimerStats alias so the annotation stays in
        # sync with the rest of the file.
        self._timer_stats: TimerStats = {}
        self._power = power
        self._use_fnr_and_tnr = use_fnr_and_tnr

    def compute_scores(self, i: int) -> Tuple[torch.Tensor, torch.Tensor]:
        """
        Compute scores for a given game instantiation.

        Args:
            i (int): index of the game instantiation (i.e. the i-th game)

        Returns:
            Tuple[torch.Tensor, torch.Tensor]: scores for samples with training labels and reconstructed labels
        """

        true_bits = self._analysis_input.true_bits[i]

        received_labels = self._analysis_input.received_labels[i]
        y1_probs = self._analysis_input.predictions_y1_generation
        predictions = self._analysis_input.predictions

        # Probability assigned to the received label by each model/source.
        prob_train = np.where(received_labels == 1, predictions, 1 - predictions)
        prob_reconstruct = np.where(received_labels == 1, y1_probs, 1 - y1_probs)
        # Probability of the opposite label under the y1-generation model;
        # used as a confidence weight raised to self._power.
        prob_diff_label = np.where(received_labels == 1, 1 - y1_probs, y1_probs)

        scores = (prob_train - prob_reconstruct) * prob_diff_label**self._power

        # true_bits == 0 marks samples whose labels came from training;
        # true_bits == 1 marks reconstructed-label samples.
        scores_train = torch.tensor(scores[true_bits == 0])
        scores_test = torch.tensor(scores[true_bits == 1])

        return scores_train, scores_test

    def run_analysis(self) -> BaseAnalysisOutput:
        """Run LIA analysis across all game instantiations.

        Returns:
            LIAAnalysisOutput with epsilon bounds, accuracy/AUC estimates and
            dataset statistics.
        """

        error_thresholds = np.linspace(0.01, 1, 100)
        num_resampling = self._analysis_input.y1.shape[0]
        num_samples = self._analysis_input.y1.shape[1]

        # Run the attack for each game instance, with bootstrap resampling.
        all_metrics = []
        with self.timer("compute all metrics"):
            for i in tqdm(range(num_resampling), disable=not self._show_progress):
                scores_train, scores_test = self.compute_scores(i)
                train_size, test_size = scores_train.shape[0], scores_test.shape[0]
                # Draw equal-size bootstrap samples from both score sets.
                bootstrap_sample_size = min(train_size, test_size)
                for _ in range(self._num_bootstrap_resampling_times):
                    indices_train = AnalysisNode._compute_bootstrap_sample_indexes(
                        train_size, bootstrap_sample_size
                    )
                    indices_test = AnalysisNode._compute_bootstrap_sample_indexes(
                        test_size, bootstrap_sample_size
                    )
                    lia_results = MIAResults(
                        scores_train=scores_train[indices_train],
                        scores_test=scores_test[indices_test],
                    )

                    # metrics is a tuple:
                    # (accuracy, auc_value, eps_fpr_array, eps_tpr_array, eps_max_array)
                    metrics = lia_results.compute_metrics_at_error_threshold(
                        delta=self._delta,
                        error_threshold=error_thresholds,
                        cap_eps=self._cap_eps,
                        verbose=self._show_progress,
                        use_fnr_tnr=self._use_fnr_and_tnr,
                    )

                    all_metrics.append(metrics)

        all_accuracy_values = np.array([run[0] for run in all_metrics])
        all_auc_values = np.array([run[1] for run in all_metrics])
        all_eps_fpr_values = np.array([run[2] for run in all_metrics])
        all_eps_tpr_values = np.array([run[3] for run in all_metrics])
        all_eps_values = np.array([run[4] for run in all_metrics])

        # Per-error-threshold confidence bounds over all bootstrap runs.
        eps_lb_per_threshold, eps_ub_per_threshold = self._compute_ci(all_eps_values)
        # The reported epsilon is the maximum upper bound across thresholds.
        idx = np.argmax(eps_ub_per_threshold)

        error_rate_at_max_eps = float(error_thresholds[idx])

        eps_max_ub = eps_ub_per_threshold[idx]
        eps_lb_at_max_ub = eps_lb_per_threshold[idx]

        # Compute lb/ub for accuracy and auc (already ndarrays; the previous
        # np.array(...) re-wrapping was redundant).
        accuracy_lb, accuracy_ub = self._compute_ci(all_accuracy_values)
        auc_lb, auc_ub = self._compute_ci(all_auc_values)

        # Compute lb/ub for eps computed using only TPR or only FPR thresholds
        eps_tpr_lb, eps_tpr_ub = self._compute_ci(all_eps_tpr_values)
        eps_fpr_lb, eps_fpr_ub = self._compute_ci(all_eps_fpr_values)

        # Cast NumPy scalars to builtin floats so the output matches the
        # float / List[float] field types declared on LIAAnalysisOutput
        # (previously only eps/eps_lb were cast; the rest leaked np.float64).
        return LIAAnalysisOutput(
            eps=float(eps_max_ub),
            eps_lb=float(eps_lb_at_max_ub),
            accuracy=float(np.mean(all_accuracy_values)),
            accuracy_ci=[float(accuracy_lb[0]), float(accuracy_ub[0])],
            auc=float(np.mean(all_auc_values)),
            auc_ci=[float(auc_lb[0]), float(auc_ub[0])],
            error_rate_at_max_eps=error_rate_at_max_eps,
            eps_max_bounds=(
                [float(v) for v in eps_lb_per_threshold],
                [float(v) for v in eps_ub_per_threshold],
            ),
            eps_at_tpr_bounds=(
                [float(v) for v in eps_tpr_lb],
                [float(v) for v in eps_tpr_ub],
            ),
            eps_at_fpr_bounds=(
                [float(v) for v in eps_fpr_lb],
                [float(v) for v in eps_fpr_ub],
            ),
            data_size=num_samples,
            label_mean=float(np.mean(self._analysis_input.y0)),
            prediction_mean=float(np.mean(self._analysis_input.predictions)),
            prediction_y1_generation_mean=float(
                np.mean(self._analysis_input.predictions_y1_generation)
            ),
        )
0 commit comments