Commit b8d18de9 authored by Nikolai.Hartmann

fixing activation maximisation

parent 14a7743a
@@ -220,7 +220,17 @@ elif args.mode.startswith("hist"):
     # ranges in which to sample the random events
     x_test_scaled = c.transform(c.x_test)
     ranges = get_ranges(x_test_scaled, [0.01, 0.99], total_weights, mask_value=mask_value)
-    losses, events = get_max_activation_events(c.model, ranges, ntries=args.ntries_actmax, step=args.step_size, layer=layer, neuron=neuron, threshold=args.threshold)
+    kwargs = {}
+    if hasattr(c, "get_input_list"):
+        kwargs["input_transform"] = c.get_input_list
+        kwargs["input_inverse_transform"] = c.get_input_flat
+    losses, events = get_max_activation_events(c.model, ranges,
+                                               ntries=args.ntries_actmax,
+                                               step=args.step_size,
+                                               layer=layer,
+                                               neuron=neuron,
+                                               threshold=args.threshold,
+                                               **kwargs)
     events = c.inverse_transform(events)
     valsx = events[:,varx_index]
     if not plot_vs_activation:
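Note: get_input_list and get_input_flat are attributes of the classifier object c whose definitions are not part of this diff. As a rough sketch only, assuming events live in one flat 2D array whose columns are distributed over the model inputs, such a pair of helpers could look like this (hypothetical implementation, not the repository's):

import numpy as np

# Hypothetical helpers: split a flat event array into the list of arrays a
# multi-input Keras model expects, and flatten such a list back again.
def get_input_list(flat_event, split_indices=(2,)):
    # e.g. columns [0:2] feed the first input, the remaining columns the second
    return np.split(flat_event, list(split_indices), axis=1)

def get_input_flat(input_list):
    # inverse operation: concatenate the per-input arrays column-wise
    return np.concatenate(input_list, axis=1)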
@@ -39,26 +39,44 @@ def create_random_event(ranges):
     return random_event
 
 
-def max_activation_wrt_input(gradient_function, random_event, threshold=None, maxthreshold=None, maxit=100, step=1, const_indices=[]):
-    for i in range(maxit):
-        loss_value, grads_value = gradient_function([random_event])
-        for const_index in const_indices:
-            grads_value[0][const_index] = 0
-        if threshold is not None:
-            if loss_value > threshold and (maxthreshold is None or loss_value < maxthreshold):
-                # found an event within the thresholds
-                return loss_value, random_event
-            elif (maxthreshold is not None and loss_value > maxthreshold):
-                random_event -= grads_value*step
-            else:
-                random_event += grads_value*step
-        else:
-            random_event += grads_value*step
-    else:
-        if threshold is not None:
-            # no event found
-            return None
-    # if no threshold requested, always return last status
+def max_activation_wrt_input(gradient_function, random_event, threshold=None, maxthreshold=None, maxit=100, step=1, const_indices=[],
+                             input_transform=None, input_inverse_transform=None):
+    if input_transform is not None:
+        random_event = input_transform(random_event)
+    if not isinstance(random_event, list):
+        random_event = [random_event]
+
+    def iterate(random_event):
+        for i in range(maxit):
+            grads_out = gradient_function(random_event)
+            loss_value = grads_out[0][0]
+            grads_values = grads_out[1:]
+            # follow gradient for all inputs
+            for i, (grads_value, input_event) in enumerate(zip(grads_values, random_event)):
+                for const_index in const_indices:
+                    grads_value[0][const_index] = 0
+                if threshold is not None:
+                    if loss_value > threshold and (maxthreshold is None or loss_value < maxthreshold):
+                        # found an event within the thresholds
+                        return loss_value, random_event
+                    elif (maxthreshold is not None and loss_value > maxthreshold):
+                        random_event[i] -= grads_value*step
+                    else:
+                        random_event[i] += grads_value*step
+                else:
+                    random_event[i] += grads_value*step
+        else:
+            if threshold is not None:
+                # no event found for the given threshold
+                return None, None
+            # otherwise return last status
+            return loss_value, random_event
+
+    loss_value, random_event = iterate(random_event)
+    if input_inverse_transform is not None and random_event is not None:
+        random_event = input_inverse_transform(random_event)
+    elif random_event is None:
+        return None
     return loss_value, random_event
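After this change, gradient_function is expected to take a list of input arrays and return [loss, grad_1, ..., grad_n], one gradient per model input. A self-contained toy example of that interface against the function above; the quadratic stand-in for the Keras gradient function is illustrative only, not part of the repository:

import numpy as np

# Toy gradient function: the "activation" is -(x - 1)^2 summed over features,
# maximised at x = 1; returns [loss_batch, gradient_for_input_1].
def toy_gradient_function(inputs):
    x = inputs[0]
    loss = -np.sum((x - 1.0)**2, axis=1)   # shape (1,)
    grad = -2.0*(x - 1.0)                  # d(loss)/dx, shape (1, nfeatures)
    return [loss, grad]

start = np.random.uniform(-1, 1, size=(1, 3))
loss, events = max_activation_wrt_input(toy_gradient_function, start,
                                        maxit=1000, step=0.01)
print(loss, events[0])  # the single input array approaches [[1., 1., 1.]]

Since no input_inverse_transform is given here, the returned event is still the internal list of per-input arrays, hence events[0].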
@@ -66,12 +84,16 @@ def get_grad_function(model, layer, neuron):
     loss = model.layers[layer].output[:,neuron]
-    grads = K.gradients(loss, model.input)[0]
     # trick from https://blog.keras.io/how-convolutional-neural-networks-see-the-world.html
-    grads /= (K.sqrt(K.mean(K.square(grads))) + 1e-5)
-
-    return K.function([model.input], [loss, grads])
+    grads = K.gradients(loss, model.input)
+    norm_grads = [grad/(K.sqrt(K.mean(K.square(grad))) + 1e-5) for grad in grads]
+    inp = model.input
+    if not isinstance(inp, list):
+        inp = [inp]
+
+    return K.function(inp, [loss]+norm_grads)
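The trick from the Keras blog post divides each gradient tensor by its RMS, so the ascent step has a comparable scale for every input regardless of the raw gradient magnitude. In plain numpy the per-input operation amounts to the following (illustration only, not code from the repository):

import numpy as np

def normalize_gradient(grad, eps=1e-5):
    # divide by the RMS of the gradient; eps guards against division by zero
    return grad / (np.sqrt(np.mean(np.square(grad))) + eps)

print(normalize_gradient(np.array([[0.003, -0.001, 0.002]])))  # rescaled to roughly unit RMS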
 @cache(useJSON=True,
@@ -79,6 +101,7 @@ def get_grad_function(model, layer, neuron):
         lambda model: [hash(i.tostring()) for i in model.get_weights()],
         lambda ranges: [hash(i.tostring()) for i in ranges],
     ],
+    ignoreKwargs=["input_transform", "input_inverse_transform"],
 )
 def get_max_activation_events(model, ranges, ntries, layer, neuron, seed=42, **kwargs):
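The project-specific @cache decorator is not shown in this diff. Presumably it builds a cache key from the (JSON-serialised) call arguments, so the new ignoreKwargs entry keeps the two function-valued keyword arguments, which are bound methods and not JSON-serialisable, out of that key. A hypothetical minimal decorator with this behaviour, purely to illustrate the idea (the repository's implementation, including its per-argument hash functions, is certainly more elaborate):

import functools
import json

def cache(*hashFunctions, useJSON=True, ignoreKwargs=(), **otherOptions):
    # hashFunctions and otherOptions are accepted but unused in this sketch
    def decorator(func):
        store = {}
        @functools.wraps(func)
        def wrapper(*args, **kwargs):
            # build the key without the ignored kwargs, but still pass them on
            keyKwargs = {k: v for k, v in kwargs.items() if k not in ignoreKwargs}
            key = json.dumps([repr(args), keyKwargs], sort_keys=True, default=repr)
            if key not in store:
                store[key] = func(*args, **kwargs)
            return store[key]
        return wrapper
    return decorator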
@@ -90,9 +113,12 @@ def get_max_activation_events(model, ranges, ntries, layer, neuron, seed=42, **kwargs):
     for i in range(ntries):
         if not (i%100):
             logger.info(i)
-        res = max_activation_wrt_input(gradient_function, create_random_event(ranges), **kwargs)
+        res = max_activation_wrt_input(gradient_function,
+                                       create_random_event(ranges),
+                                       **kwargs)
         if res is not None:
             loss, event = res
+            loss = np.array([loss])
         else:
             continue
         if events is None:
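The scalar loss is wrapped into a one-element array so it can be concatenated with the results of earlier tries; the accumulation itself is cut off in this view (only the "if events is None:" line is visible). A sketch of the presumed pattern, assuming plain numpy concatenation:

import numpy as np

losses, events = None, None
for loss, event in [(0.7, np.ones((1, 3))), (0.9, np.zeros((1, 3)))]:
    loss = np.array([loss])           # scalar -> shape (1,) for concatenation
    if events is None:
        losses, events = loss, event
    else:
        losses = np.concatenate([losses, loss])
        events = np.concatenate([events, event])
print(losses.shape, events.shape)     # (2,) (2, 3)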