-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathItCModel.py
172 lines (123 loc) · 6.38 KB
/
ItCModel.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
import numpy as np
from sklearn.linear_model import LogisticRegression
from sklearn.semi_supervised import LabelSpreading
import tensorflow as tf
from sklearn.dummy import DummyClassifier
from sklearn.metrics import accuracy_score
from sklearn.model_selection import train_test_split
from utils import compute_activation_per_layer, flatten_activations
class ItCModel():
def __init__(self, model, **params):
# Create copy of passed-in parameters
self.params = params
# Retrieve the layers to use for hidden representations
self.layer_ids = params.get("layer_ids", [i for i in range(len(model.layers))])
# Retrieve the corresponding layer names
self.layer_names = params.get("layer_names", ["Layer " + str(i) for i in range(len(model.layers))])
# Set number of parameters
self.n_concepts = params['n_concepts']
# Retrieve the concept names
self.concept_names = params.get("concept_names", ["Concept " + str(i) for i in range(self.n_concepts)])
# Batch size to use during computation
self.batch_size = params.get("batch_size", 128)
# Set classifier to use for concept value prediction
self.clf_method = params.get("method", "LR")
# Model for extracting activations from
self.model = model
def get_clf(self):
if self.clf_method == 'LR':
semi_supervised = False
clf = LogisticRegression(max_iter=200)
elif self.clf_method == 'LP':
semi_supervised = True
clf = LabelSpreading()
else:
raise ValueError("Non-implemented method")
return clf, semi_supervised
def _get_layer_concept_predictor_model(self, h_data_l, c_data_l, h_data_u):
'''
Train cme concept label predictor for a particular layer and concept
:param h_data_l: Activation data for a given layer
:param c_data_l: Corresponding concept labels for that data
:param h_data_u: Activation data without corresponding labels
:return: Classifier predicting concept values from the activations
'''
# Create safe copies of data
x_data_l = np.copy(h_data_l)
y_data_l = np.copy(c_data_l)
x_data_u = np.copy(h_data_u)
y_data_u = np.ones((x_data_u.shape[0])) * -1 # Here, label is 'undefined'
# Specify whether to use the unlabelled data at all
semi_supervised = False
# If there is only 1 value, then return simple classifier
unique_vals = np.unique(y_data_l)
if len(unique_vals) == 1:
clf = DummyClassifier(strategy="constant", constant=c_data_l[0])
else:
# Otherwise, train classifier model
clf, semi_supervised = self.get_clf()
# Split the labelled data for train/test
x_train, x_test, y_train, y_test = train_test_split(x_data_l, y_data_l, test_size=0.15)
# Combine with unlabelled data, if using a semi-supervised method
if semi_supervised:
x_train = np.concatenate([x_train, x_data_u])
y_train = np.concatenate([y_train, y_data_u])
# Train classifier
clf.fit(x_train, y_train)
# Retrieve predictive accuracy of classifier
pred_acc = accuracy_score(y_test, clf.predict(x_test))
return clf, pred_acc
def train(self, x_data_l, c_data_l, x_data_u):
'''
Compute a dictionary with structure: layer --> concept --> model
i.e., the dictionary returns which clf to use to predict a given concept, from a given layer
'''
self.model_ensemble = {}
self.model_accuracies = {}
# Compute activations for specified layers
h_data_ls = compute_activation_per_layer(x_data_l, self.layer_ids, self.model, aggregation_function=flatten_activations)
h_data_us = compute_activation_per_layer(x_data_u, self.layer_ids, self.model, aggregation_function=flatten_activations)
for i, layer_id in enumerate(self.layer_ids):
# Retrieve activations for next layer
activations_l = h_data_ls[i]
activations_u = h_data_us[i]
output_layer = self.model.layers[layer_id]
self.model_ensemble[output_layer] = []
self.model_accuracies[output_layer] = []
# Generate predictive models for every concept
for c in range(self.n_concepts):
clf, pred_acc = self._get_layer_concept_predictor_model(activations_l, c_data_l[:, c], activations_u)
self.model_ensemble[output_layer].append(clf)
self.model_accuracies[output_layer].append(pred_acc)
print("Processed layer ", str(i + 1), " of ", str(len(self.layer_ids)))
# Initialise concept predictors with models in the first layer
# Consists of an array of size |concepts|, in which
# The element arr[i] is the Layer Id of the layer to use when predicting that concept
self.concept_predictor_layer_ids = [self.layer_ids[0] for _ in range(self.n_concepts)]
# For every concept, identify the layer with the best clf predictive accuracy
for c in range(self.n_concepts):
max_acc = 0
for i, layer_id in enumerate(self.layer_ids):
layer = self.model.layers[layer_id]
acc = self.model_accuracies[layer][c]
if acc > max_acc:
max_acc = acc
self.concept_predictor_layer_ids[c] = layer_id
def predict_concepts(self, x_data):
'''
Given the same model and new x_data, predict their concept values
'''
n_samples = x_data.shape[0]
concept_vals = np.zeros((n_samples, self.n_concepts), dtype=float)
for c in range(self.n_concepts):
# Retrieve clf corresponding to concept c
layer_id = self.concept_predictor_layer_ids[c]
output_layer = self.model.layers[layer_id]
clf = self.model_ensemble[output_layer][c]
# Compute activations for that layer
output_layer = self.model.layers[layer_id]
reduced_model = tf.keras.Model(inputs=self.model.inputs, outputs=[output_layer.output])
hidden_features = reduced_model.predict(x_data, batch_size=self.batch_size)
clf_data = flatten_activations(hidden_features)
concept_vals[:, c] = clf.predict(clf_data)
return concept_vals