# Deep-Graph-Persistence/src/dgp-shift-detection/witness_functions.py (ExplainableML/Deep-Graph-Persistence, main branch)

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
import torch
import numpy as np

from mlp import MLP
from typing import List
from torch import Tensor
from utils import build_dnp_matrix
from collections.abc import Iterable
from utils import get_mlp_activations
from utils import build_mlp_activation_graph
from utils import get_mst_weights_from_bipartite_graph
from utils import get_approximate_mst_weights_from_bipartite_graph


def logit_witness_function(model: MLP, x: Tensor) -> np.ndarray:
    """Return the raw output of ``model`` on ``x`` as a NumPy array.

    The model is called directly on ``x``; its output is detached from the
    autograd graph and moved to the CPU before the conversion.
    """
    logits = model(x)
    detached_logits = logits.detach()
    return detached_logits.cpu().numpy()


def softmax_witness_function(model: MLP, x: Tensor) -> np.ndarray:
    """Return the softmax of the model output on ``x`` as a NumPy array.

    The softmax is taken along dimension 1 of the model output, so the
    output must have at least two dimensions. The result is detached and
    moved to the CPU before the conversion.
    """
    logits = model(x)
    probabilities = torch.softmax(logits, dim=1)
    return probabilities.detach().cpu().numpy()


def magdiff_witness_function(model: MLP, x: Tensor) -> np.ndarray:
    """Return the last activation-graph entry, flattened to two dimensions.

    The activation graph is built by ``build_mlp_activation_graph``; only its
    final entry is used. That entry keeps its first axis (presumably the
    sample axis -- confirm against ``build_mlp_activation_graph``) and all
    remaining axes are collapsed into one.
    """
    last_layer = build_mlp_activation_graph(model, x)[-1]
    leading_size = last_layer.shape[0]
    flattened = last_layer.reshape(leading_size, -1)
    return flattened.detach().cpu().numpy()


def dnp_witness_function(
    model: MLP,
    x: Tensor,
    variance_correction: bool,
    normalize: bool = False,
    approximate: bool = False,
) -> np.ndarray:
    """Compute spanning-tree weights of the DNP matrix for each sample in ``x``.

    Steps:

    1. Build the activation graph with ``build_mlp_activation_graph``.
    2. Split every entry of the graph along its first axis, one slice per
       index in ``range(x.shape[0])``.
    3. Normalize each per-sample layer (see ``variance_correction``) and take
       its absolute value.
    4. Optionally rescale all layers of a sample by that sample's largest
       value (see ``normalize``).
    5. Re-stack the samples per layer, swap axes 1 and 2, convert to NumPy and
       pass the list to ``build_dnp_matrix``.
    6. Extract the MST weights for every entry obtained by iterating over the
       DNP matrix and stack them.

    Args:
        model: Model whose activation graph is analysed.
        x: Input batch; ``x.shape[0]`` is used as the number of samples.
        variance_correction: If true, each per-sample layer is centred by its
            mean and divided by its standard deviation (plus ``1e-8``) before
            the absolute value is taken.
        normalize: If true, every layer of a sample is divided by the maximum
            value over all layers of that sample.
        approximate: If true, use
            ``get_approximate_mst_weights_from_bipartite_graph`` instead of
            ``get_mst_weights_from_bipartite_graph``.

    Returns:
        The per-entry MST weights combined with ``np.stack``.
    """
    # Build activation graph
    activation_graph = build_mlp_activation_graph(model, x)
    num_layers = len(activation_graph)

    # Normalize a single per-sample layer
    def normalize_layer(layer: Tensor) -> Tensor:
        if variance_correction:
            layer = layer - layer.mean()
            # The epsilon guards against division by zero for constant layers.
            layer = layer / (layer.std() + 1e-8)

        layer = torch.abs(layer)
        return layer

    # Split into samples and normalize each layer of each sample
    activation_graph = [
        [normalize_layer(activations[sample_index]) for activations in activation_graph]
        for sample_index in range(x.shape[0])
    ]

    # Map to [0, 1]
    if normalize:
        # The maximum is computed with torch operations instead of np.max:
        # np.max would have to convert the 0-dim tensors to NumPy implicitly,
        # which fails for tensors on a non-CPU device or tensors that require
        # grad.
        activation_graph = [
            [
                layer / maximum_activation
                for layer in sample_layers
            ]
            for sample_layers, maximum_activation in (
                (
                    sample_layers,
                    torch.stack([layer.max() for layer in sample_layers]).max(),
                )
                for sample_layers in activation_graph
            )
        ]

    # Recombine samples: one stacked tensor per layer, with axes 1 and 2 swapped
    activation_graph = [
        torch.stack(
            [
                sample_activations[layer_index]
                for sample_activations in activation_graph
            ],
        ).transpose(1, 2)
        for layer_index in range(num_layers)
    ]

    # Build DNP matrix
    activation_graph = [layer.detach().cpu().numpy() for layer in activation_graph]
    dnp_matrix = build_dnp_matrix(activation_graph)

    # Pick the MST routine once instead of branching on every iteration
    if approximate:
        extract_mst_weights = get_approximate_mst_weights_from_bipartite_graph
    else:
        extract_mst_weights = get_mst_weights_from_bipartite_graph

    # Get MST weights from each sample individually
    mst_weights = []
    for sample_dnp_matrix in dnp_matrix:
        sample_dnp_matrix = sample_dnp_matrix.detach().cpu().numpy()
        mst_weights.append(extract_mst_weights(sample_dnp_matrix))

    mst_weights = np.stack(mst_weights)
    return mst_weights


def input_activation_witness_function(model: MLP, x: Tensor) -> List[np.ndarray]:
    """Return the activations of ``model`` on ``x`` as NumPy arrays.

    The activations come from ``get_mlp_activations``. The first entry is
    skipped (presumably the raw input -- confirm against
    ``get_mlp_activations``); every remaining entry is detached, moved to the
    CPU and converted to NumPy.
    """
    all_activations = get_mlp_activations(model, x)
    return [
        layer_output.detach().cpu().numpy() for layer_output in all_activations[1:]
    ]


def topological_uncertainty_witness_function(
    model: MLP, x: Tensor, variance_correction: bool = False
) -> List[np.ndarray]:
    """Compute one stacked array of MST weights per activation-graph layer.

    Each entry of the activation graph built by
    ``build_mlp_activation_graph`` is converted to NumPy and iterated along
    its first axis. Every slice is optionally standardized and passed to
    ``get_mst_weights_from_bipartite_graph``; the results of one layer are
    combined with ``np.stack``.

    Args:
        model: Model whose activation graph is analysed.
        x: Input batch passed to ``build_mlp_activation_graph``.
        variance_correction: If true, each slice is centred by its mean and
            divided by its standard deviation (plus ``1e-8``) first.

    Returns:
        A list with one stacked array of MST weights per layer.
    """

    def _standardize(sample_layer: np.ndarray) -> np.ndarray:
        # Zero-mean / unit-variance rescaling of a single slice; a no-op when
        # variance correction is disabled.
        if not variance_correction:
            return sample_layer
        centered = sample_layer - sample_layer.mean()
        return centered / (centered.std() + 1e-8)

    def _diagrams_for_layer(layer_samples: np.ndarray) -> np.ndarray:
        # One set of MST weights (the persistence diagram) per slice.
        per_sample = [
            get_mst_weights_from_bipartite_graph(_standardize(sample_layer))
            for sample_layer in layer_samples
        ]
        return np.stack(per_sample)

    # Build the activation graph once, then process it layer by layer.
    layers = build_mlp_activation_graph(model, x)

    diagrams_per_layer = []
    for layer_tensor in layers:
        layer_samples = layer_tensor.detach().cpu().numpy()
        diagrams_per_layer.append(_diagrams_for_layer(layer_samples))

    return diagrams_per_layer


def distance_from_center(x_reference: np.ndarray, x: np.ndarray) -> np.ndarray:
    """Return the distance of every row of ``x`` to the mean of ``x_reference``.

    If ``x`` is an array, the centre is the mean of ``x_reference`` over axis 0
    and the norm of the difference is taken along axis 1, giving one distance
    per row of ``x``.

    If ``x`` is any other iterable, ``x_reference`` and ``x`` are paired
    element by element, the distances are computed recursively for each pair,
    and the results are averaged over the pairs.

    Raises:
        TypeError: If ``x`` is neither an array nor an iterable.
    """
    # Arrays are iterable too, so they must be handled before the generic case.
    if isinstance(x, np.ndarray):
        center = x_reference.mean(axis=0)
        return np.linalg.norm(center - x, axis=1)

    if not isinstance(x, Iterable):
        raise TypeError(f"Expected x to be np.ndarray or Iterable, got {type(x)}")

    per_element = np.stack(
        [
            distance_from_center(reference_part, x_part)
            for reference_part, x_part in zip(x_reference, x)
        ]
    )
    return per_element.mean(axis=0)


def distance_from_center_by_groups(
    x_reference: np.ndarray, y_reference: np.ndarray, x: np.ndarray
) -> np.ndarray:
    """Return the distance of every row of ``x`` to each group's centre.

    If ``x`` is an array, the rows of ``x_reference`` are grouped by the
    values in ``y_reference``. For every distinct value, in sorted order,
    ``distance_from_center`` is applied to that group's reference rows, and
    the per-group results are stacked along axis 1 (one column per group).

    If ``x`` is any other iterable, ``x_reference`` and ``x`` are paired
    element by element while ``y_reference`` is shared by all pairs; the
    per-pair results are averaged.

    Raises:
        TypeError: If ``x`` is neither an array nor an iterable.
    """
    # Arrays are iterable too, so they must be handled before the generic case.
    if isinstance(x, np.ndarray):
        group_labels = np.sort(np.unique(y_reference))
        per_group = [
            distance_from_center(x_reference[y_reference == label], x)
            for label in group_labels
        ]
        return np.stack(per_group, axis=1)

    if not isinstance(x, Iterable):
        raise TypeError(f"Expected x to be np.ndarray or Iterable, got {type(x)}")

    per_element = np.stack(
        [
            distance_from_center_by_groups(reference_part, y_reference, x_part)
            for reference_part, x_part in zip(x_reference, x)
        ]
    )
    return per_element.mean(axis=0)