computationalprivacy
diff --git a/‎notebooks/additional_setups.ipynb
Lines changed: 0 additions & 48 deletions b/‎notebooks/additional_setups.ipynb
Lines changed: 0 additions & 48 deletions
diff --git a/‎notebooks/dp.ipynb
Lines changed: 0 additions & 11 deletions b/‎notebooks/dp.ipynb
Lines changed: 0 additions & 11 deletions
diff --git a/‎notebooks/main_results.ipynb
Lines changed: 0 additions & 7 deletions b/‎notebooks/main_results.ipynb
Lines changed: 0 additions & 7 deletions
@@ -279,48 +279,37 @@
     "    \"lt_iqr_desc\"\n",
     "]\n",
     "\n",
-    "# Initialize list to store results\n",
     "all_results = []\n",
     "\n",
-    "# Loop through architectures and collect metrics\n",
     "for arch in [\"rn-20\", \"wrn28-2\", \"wrn40-4\"]:\n",
     "    exp_id = f\"{arch}_CIFAR10\"\n",
     "    if exp_id not in final_model_metrics:\n",
     "        continue\n",
     "        \n",
-    "    # Get precision/recall metrics for this architecture\n",
     "    results = make_precision_recall_at_k_df_single_threshold(\n",
     "        scores_df=final_model_metrics[exp_id],\n",
     "        ground_truth_df=final_model_metrics[exp_id], \n",
     "        fpr_threshold=0.001,\n",
     "        k_frac=0.01\n",
     "    )\n",
     "    \n",
-    "    # Add architecture column\n",
     "    results['architecture'] = arch\n",
     "    \n",
-    "    # Append to list\n",
     "    all_results.append(results)\n",
     "\n",
-    "# Create column names for precision and recall\n",
     "precision_columns = [\"precision_\" + m for m in metrics]\n",
     "recall_columns = [\"recall_\" + m for m in metrics]\n",
     "\n",
-    "# Create dataframe with both precision and recall columns\n",
     "df = pd.DataFrame.from_records(all_results)[precision_columns + recall_columns + ['architecture']]\n",
     "\n",
-    "# Pivot table to make architectures as columns\n",
     "df_pivot = df.melt(id_vars=['architecture'], var_name='metric', value_name='value')\n",
     "\n",
-    "# Create MultiIndex before pivoting\n",
     "df_pivot['type'] = df_pivot['metric'].str.split('_').str[0]\n",
     "df_pivot['metric'] = df_pivot['metric'].str.split('_').str[1:].str.join('_')\n",
     "df_pivot.set_index(['type', 'metric'], inplace=True)\n",
     "\n",
-    "# Now pivot with the MultiIndex\n",
     "results_df = df_pivot.pivot(columns='architecture', values='value')\n",
     "\n",
-    "# Sort index to group precision and recall metrics together\n",
     "idx = pd.MultiIndex.from_product([['precision', 'recall'], metrics], names=['type', 'metric'])\n",
     "results_df = results_df.reindex(idx)\n",
     "\n",
@@ -484,48 +473,37 @@
     "    \"lt_iqr_desc\"\n",
     "]\n",
     "\n",
-    "# Initialize list to store results\n",
     "all_results = []\n",
     "\n",
-    "# Loop through datasets and collect metrics\n",
     "for dataset in [\"CIFAR10\", \"CIFAR100\", \"CINIC10\"]:\n",
     "    exp_id = f\"wrn28-2_{dataset}\"  # Use WRN-28-2 for all datasets\n",
     "    if exp_id not in final_model_metrics:\n",
     "        continue\n",
     "        \n",
-    "    # Get precision/recall metrics for this dataset\n",
     "    results = make_precision_recall_at_k_df_single_threshold(\n",
     "        scores_df=final_model_metrics[exp_id],\n",
     "        ground_truth_df=final_model_metrics[exp_id], \n",
     "        fpr_threshold=0.001,\n",
     "        k_frac=0.01\n",
     "    )\n",
     "    \n",
-    "    # Add dataset column\n",
     "    results['dataset'] = dataset\n",
     "    \n",
-    "    # Append to list\n",
     "    all_results.append(results)\n",
     "\n",
-    "# Create column names for precision and recall\n",
     "precision_columns = [\"precision_\" + m for m in metrics]\n",
     "recall_columns = [\"recall_\" + m for m in metrics]\n",
     "\n",
-    "# Create dataframe with both precision and recall columns\n",
     "df = pd.DataFrame.from_records(all_results)[precision_columns + recall_columns + ['dataset']]\n",
     "\n",
-    "# Pivot table to make datasets as columns\n",
     "df_pivot = df.melt(id_vars=['dataset'], var_name='metric', value_name='value')\n",
     "\n",
-    "# Create MultiIndex before pivoting\n",
     "df_pivot['type'] = df_pivot['metric'].str.split('_').str[0]\n",
     "df_pivot['metric'] = df_pivot['metric'].str.split('_').str[1:].str.join('_')\n",
     "df_pivot.set_index(['type', 'metric'], inplace=True)\n",
     "\n",
-    "# Now pivot with the MultiIndex\n",
     "results_df = df_pivot.pivot(columns='dataset', values='value')\n",
     "\n",
-    "# Sort index to group precision and recall metrics together\n",
     "idx = pd.MultiIndex.from_product([['precision', 'recall'], metrics], names=['type', 'metric'])\n",
     "results_df = results_df.reindex(idx)\n",
     "\n",
@@ -628,18 +606,14 @@
     }
    ],
    "source": [
-    "# Initialize results storage\n",
     "results = []\n",
     "\n",
-    "# Loop through all experiments\n",
     "for exp_id in final_model_metrics.keys():\n",
     "    scores = final_model_metrics[exp_id][\"lira_score\"]\n",
     "    labels = final_model_metrics[exp_id][\"target_trained_on\"]\n",
     "\n",
-    "    # Calculate LiRA AUC\n",
     "    lira_auc = roc_auc_score(labels, scores)\n",
     "\n",
-    "    # Calculate TPR at FPR=0.001 \n",
     "    fpr, tpr, thresholds = roc_curve(labels, scores)\n",
     "    idx = np.argmin(np.abs(fpr - 0.001))\n",
     "    tpr_at_fpr = tpr[idx]\n",
@@ -650,7 +624,6 @@
     "        'tpr_at_fpr': tpr_at_fpr\n",
     "    })\n",
     "\n",
-    "# Create dataframe\n",
     "df = pd.DataFrame(results).set_index('exp_id')\n",
     "print(\"\\nLiRA Metrics across all experiments:\")\n",
     "df\n"
@@ -813,48 +786,37 @@
     "    \"lt_iqr_desc\"\n",
     "]\n",
     "\n",
-    "# Initialize list to store results\n",
     "all_results = []\n",
     "\n",
-    "# Loop through datasets and collect metrics\n",
     "for dataset in [\"CIFAR10\", \"CIFAR100\", \"CINIC10\"]:\n",
     "    exp_id = f\"wrn28-2_{dataset}\"  # Use WRN-28-2 for all datasets\n",
     "    if exp_id not in final_model_metrics:\n",
     "        continue\n",
     "        \n",
-    "    # Get precision/recall metrics for this dataset\n",
     "    results = make_precision_recall_at_k_df_single_threshold(\n",
     "        scores_df=final_model_metrics[exp_id],\n",
     "        ground_truth_df=final_model_metrics[exp_id], \n",
     "        fpr_threshold=0.001,\n",
     "        k_frac=0.01\n",
     "    )\n",
     "    \n",
-    "    # Add dataset column\n",
     "    results['dataset'] = dataset\n",
     "    \n",
-    "    # Append to list\n",
     "    all_results.append(results)\n",
     "\n",
-    "# Create column names for precision and recall\n",
     "precision_columns = [\"precision_\" + m for m in metrics]\n",
     "recall_columns = [\"recall_\" + m for m in metrics]\n",
     "\n",
-    "# Create dataframe with both precision and recall columns\n",
     "df = pd.DataFrame.from_records(all_results)[precision_columns + recall_columns + ['dataset']]\n",
     "\n",
-    "# Pivot table to make datasets as columns\n",
     "df_pivot = df.melt(id_vars=['dataset'], var_name='metric', value_name='value')\n",
     "\n",
-    "# Create MultiIndex before pivoting\n",
     "df_pivot['type'] = df_pivot['metric'].str.split('_').str[0]\n",
     "df_pivot['metric'] = df_pivot['metric'].str.split('_').str[1:].str.join('_')\n",
     "df_pivot.set_index(['type', 'metric'], inplace=True)\n",
     "\n",
-    "# Now pivot with the MultiIndex\n",
     "results_df = df_pivot.pivot(columns='dataset', values='value')\n",
     "\n",
-    "# Sort index to group precision and recall metrics together\n",
     "idx = pd.MultiIndex.from_product([['precision', 'recall'], metrics], names=['type', 'metric'])\n",
     "results_df = results_df.reindex(idx)\n",
     "\n",
@@ -1065,7 +1027,6 @@
     "for exp_id in final_model_metrics:\n",
     "    df = final_model_metrics[exp_id]\n",
     "\n",
-    "    # Create empty results dictionary with metrics as rows\n",
     "    k_fracs = [0.01, 0.03, 0.05, 0.10, 0.20, 0.50]\n",
     "\n",
     "    # Populate results\n",
@@ -1080,10 +1041,8 @@
     "        results[exp_id][f'k={k_frac*100}% Precision'] = stats['precision_lt_iqr_desc']\n",
     "        results[exp_id][f'k={k_frac*100}% Recall'] = stats['recall_lt_iqr_desc']\n",
     "\n",
-    "    # Convert to DataFrame with metrics as index\n",
     "results_df = pd.DataFrame.from_dict(results, orient='index')\n",
     "\n",
-    "# Sort columns to group by k%\n",
     "column_order = []\n",
     "for k_frac in k_fracs:\n",
     "    column_order.extend([f'k={k_frac*100}% Precision', f'k={k_frac*100}% Recall'])\n",
@@ -1246,13 +1205,11 @@
    "source": [
     "from collections import defaultdict\n",
     "\n",
-    "# Create empty lists/dicts to store results\n",
     "exp_ids = []\n",
     "total_pos = []\n",
     "pos_at_thresh = []\n",
     "max_recalls = defaultdict(list)\n",
     "\n",
-    "# Calculate metrics for each experiment\n",
     "for exp_id in final_model_metrics.keys():\n",
     "    results = final_model_metrics[exp_id]\n",
     "    \n",
@@ -1263,18 +1220,15 @@
     "    total_pos.append(total_positives)\n",
     "    pos_at_thresh.append(num_positives_at_threshold)\n",
     "    \n",
-    "    # Calculate max recalls for different k%\n",
     "    for k in (1, 3, 5, 10, 20, 50):\n",
     "        predicted_samples = k * total_positives // 100\n",
     "        max_recall = min(1, predicted_samples / num_positives_at_threshold)\n",
     "        max_recalls[k].append(max_recall)\n",
     "\n",
-    "# Create and display results DataFrame\n",
     "results_dict = {\n",
     "    'Total Positives': total_pos,\n",
     "    'Positives at Threshold': pos_at_thresh,\n",
     "}\n",
-    "# Add max recalls to results dictionary\n",
     "for k in max_recalls:\n",
     "    results_dict[f'Max Recall {k}%'] = max_recalls[k]\n",
     "\n",
@@ -1407,7 +1361,6 @@
     "    \"spearman_lt_iqr\",\n",
     "]\n",
     "\n",
-    "# Create DataFrame with metrics for each experiment\n",
     "metrics_by_exp = {}\n",
     "\n",
     "for exp_id in final_model_metrics:\n",
@@ -1422,7 +1375,6 @@
     "    \n",
     "    metrics_by_exp[exp_id] = metrics_dict\n",
     "\n",
-    "# Create DataFrame with experiments as columns and metrics as rows\n",
     "results_df = pd.DataFrame(metrics_by_exp).loc[metrics]\n",
     "\n",
     "display(results_df)\n",
 
@@ -133,15 +133,12 @@
     "\n",
     "        df = all_dfs[(clipnorm, noise)]\n",
     "\n",
-    "        # Extract the ground truth (target_trained_on) and scores (lira_score)\n",
     "        y_true = df[\"target_trained_on\"]\n",
     "        y_scores = df[\"lira_score\"]\n",
     "\n",
-    "        # Compute ROC curve and ROC area\n",
     "        fpr, tpr, thresholds = roc_curve(y_true, y_scores)\n",
     "        roc_auc = auc(fpr, tpr)\n",
     "\n",
-    "        # Plot ROC curve\n",
     "        plt.plot(fpr, tpr, lw=2,\n",
     "                color=colors[clipnorm],\n",
     "                linestyle=linestyles[noise],\n",
@@ -734,7 +731,6 @@
    "source": [
     "trace_df = all_dfs[(\"10\", \"0\")]\n",
     "\n",
-    "# Get results for different k values\n",
     "k_values = [0.01, 0.03, 0.05]\n",
     "results = {}\n",
     "for k in k_values:\n",
@@ -746,7 +742,6 @@
     "    )\n",
     "    results[k] = result\n",
     "\n",
-    "# Create DataFrame with metrics as rows and k values as columns\n",
     "metrics_df = pd.DataFrame.from_dict(results, orient='columns')\n",
     "metrics_df.columns = [f'k={k}' for k in k_values]\n",
     "\n",
@@ -1326,11 +1321,9 @@
     }
    ],
    "source": [
-    "# Fix noise=0 and k=0.05\n",
     "noise = \"0\"\n",
     "k = 0.05\n",
     "\n",
-    "# Get results for different clipnorm values\n",
     "results = {}\n",
     "for clipnorm in [\"1\", \"3\", \"10\"]:\n",
     "    if (clipnorm, noise) in all_dfs:\n",
@@ -1343,7 +1336,6 @@
     "        )\n",
     "        results[clipnorm] = result\n",
     "\n",
-    "# Create DataFrame with metrics as rows and clipnorm values as columns\n",
     "metrics_df = pd.DataFrame.from_dict(results, orient='columns')\n",
     "metrics_df.columns = [f'clipnorm={c}' for c in results.keys()]\n",
     "\n",
@@ -1923,12 +1915,10 @@
     }
    ],
    "source": [
-    "# Fix noise=0 and k=0.05\n",
     "noise = \"0\"\n",
     "k = 0.05\n",
     "fpr_values = [0.1, 0.01, 0.001]\n",
     "\n",
-    "# Get results for different fpr thresholds\n",
     "results = {}\n",
     "for fpr in fpr_values:\n",
     "    if (clipnorm, noise) in all_dfs:\n",
@@ -1941,7 +1931,6 @@
     "        )\n",
     "        results[fpr] = result\n",
     "\n",
-    "# Create DataFrame with metrics as rows and fpr values as columns\n",
     "metrics_df = pd.DataFrame.from_dict(results, orient='columns')\n",
     "metrics_df.columns = [f'fpr={fpr}' for fpr in fpr_values]\n",
     "\n",
 
@@ -301,7 +301,6 @@
     "        'Recall on union': recall\n",
     "    })\n",
     "\n",
-    "# Display as a table\n",
     "results_df = pd.DataFrame(results)\n",
     "display(results_df)"
    ]
@@ -482,11 +481,9 @@
     "    \"shap_desc\",\n",
     "    \"lt_iqr_desc\",\n",
     "]\n",
-    "# Create empty results dictionary with metrics as rows\n",
     "results = {metric: {} for metric in metrics}\n",
     "k_fracs = [0.01, 0.03, 0.05, 0.10, 0.20, 0.50]\n",
     "\n",
-    "# Populate results\n",
     "for k_frac in k_fracs:\n",
     "    stats = make_precision_recall_at_k_df_single_threshold(\n",
     "        scores_df=df,\n",
@@ -496,14 +493,11 @@
     "    )\n",
     "    \n",
     "    for metric in metrics:\n",
-    "        # Add precision and recall columns for each k%\n",
     "        results[metric][f'k={k_frac*100}% Precision'] = stats[f'precision_{metric}']\n",
     "        results[metric][f'k={k_frac*100}% Recall'] = stats[f'recall_{metric}']\n",
     "\n",
-    "# Convert to DataFrame with metrics as index\n",
     "results_df = pd.DataFrame.from_dict(results, orient='index')\n",
     "\n",
-    "# Sort columns to group by k%\n",
     "column_order = []\n",
     "for k_frac in k_fracs:\n",
     "    column_order.extend([f'k={k_frac*100}% Precision', f'k={k_frac*100}% Recall'])\n",
@@ -1079,7 +1073,6 @@
     ")\n",
     "\n",
     "plt.grid(True, linestyle='--', alpha=0.7)\n",
-    "# plt.title('Correlation between LT-IQR and LiRA Rankings', pad=20, fontsize=14)\n",
     "plt.xlabel(\"LT-IQR Rank\", fontsize=20, labelpad=10)\n",
     "plt.ylabel(\"LiRA Rank\", fontsize=20, labelpad=10)\n",
     "\n",