in cluster_vis/preprocess.py [0:0]
def get_data(filename, meta_filename=None):
    """Load the clusters of the latest epoch together with a metaclass map.

    Args:
        filename: Path to a pickle file holding a mapping from epoch
            (anything ``int()`` accepts, e.g. ``"12"`` or ``12``) to a
            sequence of clusters. Each cluster must be a mutable sequence,
            because it is shuffled in place.
        meta_filename: Optional path to a JSON file containing an object
            that maps names to metaclasses. When ``None``, a default map is
            built that assigns ``"people"`` to element ``[3]`` of every
            cluster item (presumably the item's class label -- confirm
            against the code that writes the pickle).

    Returns:
        A dict with two keys: ``"clusters"`` (the shuffled clusters of the
        numerically largest epoch) and ``"metaclasses"`` (the metaclass map;
        keys loaded from JSON have spaces replaced by underscores).

    Raises:
        IndexError: If the pickle contains no epochs.
    """
    # NOTE(security): pickle.load can execute arbitrary code while
    # deserialising; only call this on cluster files from a trusted source.
    with open(filename, 'rb') as handle:
        clusters = pickle.load(handle)

    if not clusters:
        raise IndexError("cluster file contains no epochs")

    # Compare epochs numerically but look the winner up by its original key,
    # so int keys and zero-padded string keys are found as well.
    last_epoch = clusters[max(clusters, key=int)]

    # Randomise the order of the items inside every cluster (in place).
    for cluster in last_epoch:
        random.shuffle(cluster)

    if meta_filename is not None:
        # Read the file the caller asked for rather than a fixed path.
        with open(meta_filename, 'rb') as handle:
            meta = json.load(handle)
        # Snapshot the keys first: the dict is modified while renaming.
        for key in list(meta):
            meta[key.replace(' ', '_')] = meta.pop(key)
    else:
        meta = {}
        for cluster in last_epoch:
            for item in cluster:
                meta[item[3]] = "people"

    # Report the distinct metaclasses that ended up in the map.
    print(set(meta.values()))
    return {"clusters": last_epoch, "metaclasses": meta}