forked from mila-iqia/babyai
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathvisualize_concepts_noCW.py
231 lines (171 loc) · 7.69 KB
/
visualize_concepts_noCW.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
import matplotlib.pyplot as plt
import numpy as np
import os
import pickle
import torch
import tqdm
import babyai.utils as utils
import gym
# from babyai.model import ACModel
from babyai.iterative_normalization import iterative_normalization_py
### Constants
# CONCEPTS = [
# '1_search_for_key', '2_take_key_to_door', '3_search_for_target'
# ]
# Concept names; each is prefixed with its numeric concept index.
CONCEPTS = [
    '0_search_for_red_key',
    '1_search_for_green_key',
    '2_search_for_blue_key',
    '3_take_red_key_to_door',
    '4_take_green_key_to_door',
    '5_take_blue_key_to_door',
]
### Helper Functions
def load(path):
    """Unpickle and return the object stored in the file at ``path``.

    NOTE: unpickling can execute arbitrary code, so only call this on files
    that come from a trusted source.
    """
    with open(path, 'rb') as handle:
        return pickle.load(handle)
def starting_indexes(num_frames, recurrence=20):
    """Return the start offset of every complete ``recurrence``-frame window.

    The offsets are the multiples of ``recurrence`` below ``num_frames``; a
    trailing window that would hold fewer than ``recurrence`` frames is left
    out, so ``num_frames < recurrence`` yields an empty array.
    """
    full_windows = num_frames // recurrence
    return np.arange(0, full_windows * recurrence, recurrence)
### Activations
def get_activations(acmodel, batch_dict, observation_space, action_space, model_name,
                    recurrence=20, num_concepts=6, device='cuda:6'):
    """Record peak activations of ``acmodel.image_conv[5]`` for one batch.

    A forward hook captures every output of ``acmodel.image_conv[5]`` while
    the model is run in two phases:

    1. the whole ``flat_batch`` is rolled out step by step so that the memory
       fed to the model at every frame is stored;
    2. the frames selected by ``flat_batch_concept_inds`` are replayed in
       windows of ``recurrence`` consecutive steps, each window starting from
       the stored memory of its first frame.

    Args:
        acmodel: model exposing ``image_conv``, ``memory_size``,
            ``_get_instr_embedding`` and a forward call that returns a dict
            with a ``'memory'`` entry.
        batch_dict: dict providing ``'flat_batch'``, ``'inds'``,
            ``'flat_batch_concept_inds'``, ``'concept_mask'``,
            ``'concept_episode_ids'`` and ``'concept_inds'``.
        observation_space: forwarded to ``utils.ObssPreprocessor``.
        action_space: unused; kept so existing callers keep working.
        model_name: forwarded to ``utils.ObssPreprocessor``.
        recurrence: number of consecutive steps in each concept window.
        num_concepts: number of leading channels kept in the result.
        device: torch device on which the buffers are allocated.

    Returns:
        2-D numpy array with one row per captured frame and ``num_concepts``
        columns, each value being the maximum of a channel over axes 2 and 3
        of the hooked output.

    NOTE(review): the hook is already registered during phase 1, so if the
    model's forward pass goes through ``image_conv[5]`` the returned rows also
    include the roll-out frames, not only the concept windows -- confirm that
    this is intended.
    """
    outputs = []

    def hook(module, input, output):
        outputs.append(output.detach().cpu().numpy())

    # Keep the handle so the hook can be detached afterwards; otherwise every
    # call would leave one more hook (and its captured buffers) on the model.
    handle = acmodel.image_conv[5].register_forward_hook(hook)
    try:
        flat_batch = batch_dict['flat_batch']
        inds = batch_dict['inds']
        flat_batch_concept_inds = batch_dict['flat_batch_concept_inds']
        concept_mask = torch.tensor(batch_dict['concept_mask'], device=device)
        concept_episode_ids = batch_dict['concept_episode_ids']
        concept_inds = batch_dict['concept_inds']

        obss_preprocessor = utils.ObssPreprocessor(model_name, observation_space, None)

        # Column 0 holds the observations and column 2 the done flags.
        obss, done = flat_batch[:, 0], flat_batch[:, 2]

        # Only the first len(inds) rows of the running memory are ever used,
        # so grow the buffer when more than 256 demos are active at once.
        len_batch = max(256, len(inds))

        # Memory fed to the model at every frame of the flat batch
        memories = torch.zeros([len(flat_batch), acmodel.memory_size], device=device)
        memory = torch.zeros([len_batch, acmodel.memory_size], device=device)

        preprocessed_first_obs = obss_preprocessor(obss[inds], device=device)
        instr_embedding = acmodel._get_instr_embedding(preprocessed_first_obs.instr)

        # Loop terminates when every observation in the flat_batch has been handled
        while True:
            # Observations and done flags located at inds
            obs = obss[inds]
            done_step = done[inds]
            preprocessed_obs = obss_preprocessor(obs, device=device)
            with torch.no_grad():
                # Use the memory up to len(inds) only: demos beyond that
                # have already finished
                new_memory = acmodel(
                    preprocessed_obs,
                    memory[:len(inds), :], instr_embedding[:len(inds)])['memory']

            memories[inds, :] = memory[:len(inds), :]
            memory[:len(inds), :] = new_memory

            # Drop as many trailing indices as demos finished at this step
            # (presumably demos are ordered so finished ones sit at the end
            # -- verify against the code that builds the batch).
            inds = inds[:len(inds) - sum(done_step)]
            if len(inds) == 0:
                break

            # Advance the remaining demos by one frame
            inds = [index + 1 for index in inds]

        ############ CUT MEMORIES AND OBSS TO CONCEPT TIMESTEPS ONLY ####################
        flat_concept_batch = []
        for pair in flat_batch_concept_inds:
            flat_concept_batch.extend(flat_batch[pair[0]:pair[1]])

        concept_memories = torch.zeros(
            [len(flat_concept_batch), acmodel.memory_size], device=device)
        mem_start = 0
        for pair in flat_batch_concept_inds:
            mem = memories[pair[0]:pair[1]]
            concept_memories[mem_start:mem_start + len(mem)] = mem
            mem_start += len(mem)

        flat_concept_batch = np.array(flat_concept_batch)
        obss = flat_concept_batch[:, 0]

        preprocessed_first_obs = obss_preprocessor(obss[concept_inds], device=device)
        instr_embedding = acmodel._get_instr_embedding(preprocessed_first_obs.instr)

        # Window starts must use the same recurrence as the loop below,
        # otherwise the windows overlap or skip frames.
        c_indexes = starting_indexes(len(flat_concept_batch), recurrence)
        concept_memory = concept_memories[c_indexes]

        # Forward-only replay of each window (no gradients are computed)
        with torch.no_grad():
            for _ in tqdm.trange(recurrence):
                obs = obss[c_indexes]
                preprocessed_obs = obss_preprocessor(obs, device=device)
                mask_step = concept_mask[c_indexes]
                model_results = acmodel(
                    preprocessed_obs, concept_memory * mask_step,
                    instr_embedding[concept_episode_ids[c_indexes]])
                concept_memory = model_results['memory']
                c_indexes += 1
    finally:
        handle.remove()

    # Stack all captured batches, take the maximum over axes 2 and 3 and keep
    # the first num_concepts channels.
    activations = np.vstack(outputs).max((2, 3))[:, :num_concepts]
    return activations
##########################################
model_name = 'UnlockRGB_best'
device = 'cuda:6'
#############################################
model_path = '/data/graceduansu/models/'+ model_name + '/model.pt'
concept_directory='/data/graceduansu/UnlockRGB_concepts'
# One sub-directory per concept; sorting fixes the concept index of each one.
concept_dirs = sorted(os.path.join(concept_directory, filename) for filename in os.listdir(concept_directory))

# Models
# map_location lets the checkpoint load even if it was saved from a device
# that does not exist on this machine.
# NOTE: torch.load unpickles the file; only load checkpoints you trust.
acmodel = torch.load(model_path, map_location=device).to(device)

# Env
env_name = 'BabyAI-UnlockRGB-v0'
env = gym.make(env_name)
observation_space = env.observation_space
action_space = env.action_space

# Number of activation channels kept per frame: one per entry of CONCEPTS.
num_concepts = len(CONCEPTS)

# Activation rows (x) and the concept index of the data they came from (y).
x_chunks = []
y = []

for concept_index, concept_dir in enumerate(tqdm.tqdm(concept_dirs, leave=False)):
    concept_paths = [os.path.join(concept_dir, f) for f in os.listdir(concept_dir)]
    activations = []
    print('Concept {}'.format(concept_index))
    # Draw 10 batch files at random; the same file may be drawn more than once.
    for _ in tqdm.trange(10):
        concept_path = np.random.choice(concept_paths)
        batch_dict = load(concept_path)
        a = get_activations(acmodel, batch_dict, observation_space, action_space, model_name,
                            num_concepts=num_concepts, device=device)
        activations.append(a)
        y += [concept_index] * len(a)
    # Collect the chunks and stack once at the end instead of re-copying the
    # whole array on every iteration.
    x_chunks.extend(activations)

    z = np.vstack(activations).mean(axis=0)
    print(z)
    # NOTE(review): this reports the row count of the last sampled batch only,
    # not of all batches drawn for the concept -- confirm which is wanted.
    print('Size of concept {}: {}'.format(concept_index, len(a)))

    x_pos = list(range(len(CONCEPTS)))
    plt.bar(x_pos, z)
    plt.xticks(x_pos, CONCEPTS)
    plt.title('Model {}:\n Mean activations for Concept {} Data Input'.format(model_name, concept_index))
    plt.savefig('/data/graceduansu/models/{}/mean_activations_concept_{}.png'.format(model_name, concept_index))
    plt.show()
    plt.clf()

y = np.array(y)
if x_chunks:
    x = np.vstack(x_chunks).astype(np.float64)
else:
    x = np.zeros((0, num_concepts))
print('Total dataset size: {}'.format(len(y)))
from sklearn.tree import DecisionTreeClassifier # Import Decision Tree Classifier
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import train_test_split # Import train_test_split function
from sklearn import metrics #Import scikit-learn metrics module for accuracy calculation
from sklearn.preprocessing import StandardScaler
# Hold out 20% of the samples for evaluation.
X_train, X_test, y_train, y_test = train_test_split(x, y, test_size=0.2)

# Standardise the features with statistics fitted on the training split only.
scaler = StandardScaler().fit(X_train)
X_train = scaler.transform(X_train)
X_test = scaler.transform(X_test)

# Logistic-regression probe: predict the concept index from the activations.
clf = LogisticRegression().fit(X_train, y_train)
y_pred = clf.predict(X_test)

print('Training set size: {}'.format(len(y_train)))
print('Test set size: {}'.format(len(y_test)))
# Fraction of held-out samples the logistic regression labels correctly.
print("LR Accuracy:", metrics.accuracy_score(y_test, y_pred))

# Decision-tree probe trained and scored on the same split.
dt = DecisionTreeClassifier().fit(X_train, y_train)
y_pred = dt.predict(X_test)
print("DT Accuracy:", metrics.accuracy_score(y_test, y_pred))