in hypernymysuite/unsup.py [0:0]
def __init__(self, space_filename, topk):
    """Load the space and precompute one entropy value per matrix column.

    Args:
        space_filename: Forwarded unchanged to the parent constructor.
        topk: Stored as ``self.topk``; not otherwise used here.

    Side effects:
        Sets ``self.colent`` to a 1-D numpy array holding one entropy
        value per column of ``self.matrix``.

    NOTE(review): assumes the parent constructor populates ``self.matrix``
    with a scipy sparse container, and that ``entropy`` is
    ``scipy.stats.entropy`` (which reduces along axis 0) -- confirm
    against the rest of the module.
    """
    super(SLQS, self).__init__(space_filename)
    self.topk = topk

    logging.info("Computing column entropies")
    # Rows of the transposed matrix are the columns of self.matrix;
    # converting to CSR lets the loop below take contiguous row slices.
    transposed = self.matrix.transpose().tocsr()
    num_columns = transposed.shape[0]

    # Minibatches for computation efficiency: only `batch_size` columns
    # are densified at any one time.
    batch_size = 1024
    entropies = []
    for start in range(0, num_columns, batch_size):
        stop = min(start + batch_size, num_columns)
        # toarray() yields a plain ndarray for both sparse matrices and
        # sparse arrays, unlike todense().A which needs an np.matrix.
        dense = transposed[start:stop].toarray()
        # After the transpose each column of `dense.T` is one column of
        # self.matrix, so the axis-0 reduction gives one value per column.
        entropies.extend(entropy(dense.T))
    self.colent = np.array(entropies)
    assert len(self.colent) == num_columns

    # cleanup
    del transposed
    logging.info("Done computing column entropies")