mi face/qebb testing

Azure · Apr 8, 2022 · ff4f3c7 · ff4f3c7
1 parent de0cb8b
commit ff4f3c7
Show file tree

Hide file tree

Showing 2 changed files with 186 additions and 54 deletions.
diff --git a/counterfit/frameworks/art/art.py b/counterfit/frameworks/art/art.py
@@ -12,11 +12,11 @@
 from counterfit.core.output import CFPrint
 from counterfit.core.frameworks import CFFramework
 from counterfit.core.targets import CFTarget
-from counterfit.core.reporting import get_target_data_type_obj
 
 from .utils import attack_factory
 from art.utils import compute_success_array, random_targets
-
+from scipy.stats import entropy
+from art.utils import clip_and_round
 
 class ArtFramework(CFFramework):
     def __init__(self):
@@ -67,20 +67,77 @@ def build(cls, target: CFTarget, attack: str) -> object:
         Initialize parameters.
         Set samples.
         """
-        # Return the correct estimator for the target selected.
-        # Keep an empty classifier around for extraction attacks.
-        classifier = cls.classifier(target)
 
+        # Pass to helper factory function for attack creation.
         loaded_attack = attack_factory(attack)
+
+        # Return the correct ART estimator for the target selected.
+        # Keep an empty classifier around for extraction attacks.
+        classifier = cls.set_classifier(target)
 
-        # Build the classifier
+        # Build the blackbox classifier
         if "BlackBox" in classifier.__name__:
             target_classifier = classifier(
                 target.predict_wrapper,
                 target.input_shape,
                 len(target.output_classes)
             )
 
+        # Build the classifier if log_probs is present
+        elif "QueryEfficientGradient" in classifier.__name__:
+            class QEBBWrapper:
+                def __init__(self) -> None:
+                    class ModelWrapper:
+                        predict = target.predict_wrapper
+
+                    self.model = ModelWrapper()
+                    self.clip_values = loaded_attack.estimator.clip_values
+                    self.nb_classes = loaded_attack.estimator.nb_classes
+                    self.predict = target.predict_wrapper
+
+            def class_gradient(x, label, target=target, num_basis=1, sigma=1.5, clip_values=(0., 255.), round_samples=0.0):
+                epsilon_map = sigma * np.random.normal(size=([num_basis] + list(target.input_shape)))
+                grads = []
+
+                y = target.predict_wrapper(x[0])
+
+                for i in range(len(x)):
+                    minus = clip_and_round(
+                        np.repeat(x[i], num_basis, axis=0) - epsilon_map,
+                        clip_values,
+                        round_samples,
+                    )
+                    plus = clip_and_round(
+                        np.repeat(x[i], num_basis, axis=0) + epsilon_map,
+                        clip_values,
+                        round_samples,
+                    )
+
+                    new_y_minus = np.array([entropy(y[i], p) for p in target.predict_wrapper(minus)])
+                    new_y_plus = np.array([entropy(y[i], p) for p in target.predict_wrapper(plus)])
+                    query_efficient_grad = 2 * np.mean(
+                        np.multiply(
+                            epsilon_map.reshape(num_basis, -1),
+                            (new_y_plus - new_y_minus).reshape(num_basis, -1) / (2 * sigma),
+                        ).reshape([-1] + list(target.input_shape)),
+                        axis=0,
+                    )
+                    grads.append(query_efficient_grad)
+#                 grads_array = self._apply_preprocessing_gradient(x, np.array(grads))
+
+                return np.array(grads)                     
+
+            temp_classifier = QEBBWrapper()
+            setattr(temp_classifier, "class_gradient", class_gradient)
+
+            target_classifier = classifier(
+                classifier=temp_classifier,
+                num_basis = 3,
+                sigma = 1.5
+            )
+
+            setattr(target_classifier, "class_gradient", class_gradient)
+
         # Everything else takes a model file.
         else:
             target_classifier = classifier(
@@ -102,36 +159,23 @@ def run(cls, cfattack: CFAttack):
 
         # Run the attack. Each attack type has it's own execution function signature.
         if "infer" in attack_attributes:
-            results = cfattack.attack.infer(
-                np.array(cfattack.samples, dtype=np.float32), y=np.array(cfattack.target.output_classes, dtype=np.float32))
+            x_init_average  = np.zeros((10, 1, 784)) + np.mean(cfattack.target.X, axis=0)
+            results = cfattack.attack.infer(x_init_average, np.array(cfattack.target.output_classes).astype(np.int64))
+            #results = cfattack.attack.infer(cfattack.samples, np.array(cfattack.target.output_classes).astype(np.int64))
 
         elif "reconstruct" in attack_attributes:
             results = cfattack.attack.reconstruct(
                 np.array(cfattack.samples, dtype=np.float32))
 
         elif "generate" in attack_attributes:
-            if "CarliniWagnerASR" == cfattack.name:
-                y = cfattack.target.output_classes
-            elif "FeatureAdversariesNumpy" in attack_attributes:
-                y = cfattack.samples
-            elif "FeatureAdversariesPyTorch" in attack_attributes:
-                y = cfattack.samples
-            elif "FeatureAdversariesTensorFlowV2" in attack_attributes:
-                y = cfattack.samples
-            else:
-                y = None
+
 
             if "ZooAttack" == cfattack.name:
                 # patch ZooAttack
                 cfattack.attack.estimator.channels_first = True
 
-            print("----------------------------------------------------------------------")
-            print(random_targets(np.array(cfattack.initial_labels), len(cfattack.target.output_classes)))
-            print("----------------------------------------------------------------------")
-
             results = cfattack.attack.generate(
-                x=np.array(cfattack.samples, dtype=np.float32),
-                y=random_targets(np.array(cfattack.initial_labels), len(cfattack.target.output_classes)))
+                x=np.array(cfattack.samples, dtype=np.float32))
 
         elif "poison" in attack_attributes:
             results = cfattack.attack.poison(
@@ -164,42 +208,57 @@ def pre_attack_processing(cls, cfattack: CFAttack):
     def post_attack_processing(cfattack: CFAttack):
         attack_attributes = cfattack.attack.__dir__()
 
-        if "generate" in attack_attributes:
-            current_datatype = cfattack.target.data_type
-            current_dt_report_gen = get_target_data_type_obj(current_datatype)
-            cfattack.summary = current_dt_report_gen.get_run_summary(cfattack)
-            # current_dt_report_gen.print_run_summary(summary)
+        pass
+
+        # if "generate" in attack_attributes:
+        #     current_datatype = cfattack.target.data_type
+        #     current_dt_report_gen = get_target_data_type_obj(current_datatype)
+        #     cfattack.summary = current_dt_report_gen.get_run_summary(cfattack)
+        #     # current_dt_report_gen.print_run_summary(summary)
 
-        elif "extract" in attack_attributes:
-            # Override default reporting for the attack type
-            extract_table = Table(header_style="bold magenta")
-            # Add columns to extraction table
-            extract_table.add_column("Success")
-            extract_table.add_column("Copy Cat Accuracy")
-            extract_table.add_column("Elapsed time")
-            extract_table.add_column("Total Queries")
-
-            # Add data to extraction table
-            success = cfattack.success[0]  # Starting value
-            thieved_accuracy = cfattack.results
-            elapsed_time = cfattack.elapsed_time
-            num_queries = cfattack.logger.num_queries
-            extract_table.add_row(str(success), str(
-                thieved_accuracy), str(elapsed_time), str(num_queries))
-
-            CFPrint.output(extract_table)
+        # elif "extract" in attack_attributes:
+        #     # Override default reporting for the attack type
+        #     extract_table = Table(header_style="bold magenta")
+        #     # Add columns to extraction table
+        #     extract_table.add_column("Success")
+        #     extract_table.add_column("Copy Cat Accuracy")
+        #     extract_table.add_column("Elapsed time")
+        #     extract_table.add_column("Total Queries")
+
+        #     # Add data to extraction table
+        #     success = cfattack.success[0]  # Starting value
+        #     thieved_accuracy = cfattack.results
+        #     elapsed_time = cfattack.elapsed_time
+        #     num_queries = cfattack.logger.num_queries
+        #     extract_table.add_row(str(success), str(
+        #         thieved_accuracy), str(elapsed_time), str(num_queries))
+
+        #     CFPrint.output(extract_table)
 
     @classmethod
-    def classifier(cls, target: CFTarget):
-        # this code attempts to match the .target_classifier attribute of a target with an ART
+    def set_classifier(cls, target: CFTarget):
+
+        # Match the target.classifier attribute with an ART classifier type
         classifiers = cls.get_classifiers()
 
-        if not hasattr(target, "target_classifier"):
-            return classifiers.get("BlackBoxClassifierNeuralNetwork")
+        # If no classifer attribute has been set, assume a blackbox.
+        if not hasattr(target, "classifier"):
+
+            # If the target model returns log_probs, return the relevant estimator
+            if hasattr(target, "log_probs"):
+                if target.log_probs == True:
+                    return classifiers.get("QueryEfficientGradientEstimationClassifier")
+
+            # Else return a plain BB estimator 
+            else:
+                return classifiers.get("BlackBoxClassifierNeuralNetwork")
+
+
+        # Else resolve the correct classifier
         else:
             for classifier in classifiers.keys():
-                if target.target_classifier.lower() in classifier.lower():
-                    return classifiers.get(classifier)
+                if target.classifier.lower() in classifier.lower():
+                    return classifiers.get(classifier, None)
 
     def check_success(self, cfattack: CFAttack) -> bool:
         attack_attributes = set(cfattack.attack.__dir__())

diff --git a/examples/scripting/cf.py b/examples/scripting/cf.py
@@ -8,6 +8,10 @@
 from targets import DigitKeras
 from targets import Digits
 
+import numpy as np
+
+import matplotlib.pyplot as plt
+
 attacks = ["mi_face"]
 target = Digits()
 target.load()
@@ -16,4 +20,73 @@
     cfattack = Counterfit.build_attack(target, attack)
     Counterfit.run_attack(cfattack)
 
-print(cfattack.results)
+
+plt.figure(figsize=(15,15))
+for i in range(10):
+    plt.subplot(5, 5, i + 1)
+    plt.imshow( (np.reshape(cfattack.results[0+i,], (28, 28))), cmap=plt.cm.gray_r)
+
+plt.show()
+print()
+
+# import tensorflow as tf
+# tf.compat.v1.disable_eager_execution()
+# import warnings
+# warnings.filterwarnings('ignore')
+# import keras.backend as k
+# from keras.models import Sequential
+# from keras.layers import Dense, Flatten, Conv2D, MaxPooling2D, Dropout
+# import numpy as np
+# from numpy.random import seed
+# seed(123)
+
+# from art.estimators.classification import KerasClassifier
+# from art.attacks.inference.model_inversion.mi_face import MIFace
+# from art.utils import load_dataset
+
+
+
+# # Read MNIST dataset
+# (x_train, y_train), (x_test, y_test), min_, max_ = load_dataset(str('mnist'))
+
+# # create standard CNN in Keras and wrap with ART KerasClassifier:
+# def cnn_mnist(input_shape, min_val, max_val):
+
+#     model = Sequential()
+#     model.add(Conv2D(32, kernel_size=(3, 3), activation='relu', input_shape=input_shape))
+#     model.add(MaxPooling2D(pool_size=(2, 2)))
+#     model.add(Conv2D(64, (3, 3), activation='relu'))
+#     model.add(MaxPooling2D(pool_size=(2, 2)))
+#     model.add(Dropout(0.25))
+#     model.add(Flatten())
+#     model.add(Dense(128, activation='relu'))
+#     model.add(Dense(10, activation='softmax'))
+
+#     model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])
+
+#     classifier = KerasClassifier(clip_values=(min_val, max_val), 
+#                                 model=model, use_logits=False)
+#     return classifier
+
+# num_epochs = 1
+
+# # Construct and train a convolutional neural network
+# classifier = cnn_mnist(x_train.shape[1:], min_, max_)
+# classifier.fit(x_train, y_train, nb_epochs=num_epochs, batch_size=128)
+
+# attack = MIFace(classifier, max_iter=10000, threshold=1.) 
+
+# y = np.arange(10)
+
+# x_init_white = np.zeros((10, 28, 28, 1))
+# x_init_grey = np.zeros((10, 28, 28, 1)) + 0.5
+# x_init_black = np.ones((10, 28, 28, 1))
+# x_init_random = np.random.uniform(0, 1, (10, 28, 28, 1))
+# x_init_average = np.zeros((10, 28, 28, 1)) + np.mean(x_test, axis=0)
+
+# class_gradient = classifier.class_gradient(x_init_grey, y)
+# class_gradient = np.reshape(class_gradient, (10, 28*28))
+# class_gradient_max = np.max(class_gradient, axis=1)
+
+# # Now we run the attack:
+# x_infer_from_average = attack.infer(x_init_average, y)