def _generate_all_features(self):
    """
    Pre-generate the feature vector of every mention in every document.

    For each mention ``m`` found in ``self.document_mentions`` the result of
    ``self._make_mention_features(m)`` is stored in
    ``self.mention_features[m]``.  The original author's note says this is
    done up front to increase ``get_batch`` speed.

    Afterwards ``self.features_size`` is set to the length of the feature
    vector of the last processed mention, and the reference held in
    ``self.embeddings`` is dropped (set to ``None``) to free memory.

    ``self.features`` must be set but is left untouched by this method.
    NOTE(review): an earlier docstring claimed ``self.features`` is freed
    here as well; the code never did that -- confirm whether it may be
    released too.

    If ``self.document_mentions`` yields no mentions at all,
    ``self.features_size`` is not modified.

    Raises:
        AssertionError: if ``self.embeddings`` or ``self.features`` is
            ``None`` when the method is called.
    """
    print('DataLoader: generating all features')
    assert self.embeddings is not None
    assert self.features is not None

    # Sentinel so that "no mention seen" is distinguishable from any real
    # mention object, instead of relying on a leaked loop variable.
    no_mention = object()
    last_mention = no_mention

    for mentions in tqdm(self.document_mentions):
        for mention in mentions:
            self.mention_features[mention] = self._make_mention_features(mention)
            last_mention = mention

    # Only derive the size when at least one vector was generated; with no
    # mentions there is nothing to measure.
    if last_mention is not no_mention:
        self.features_size = len(self.mention_features[last_mention])

    # Drop the reference to the embeddings now that every vector is cached.
    self.embeddings = None
    print('DataLoader: generating all features finished')
评论列表
文章目录