def _compute_features(self, raw_documents):
    """Build the dense feature matrix for ``raw_documents``.

    Args:
        raw_documents: A sized collection of ``(event_id, fb_event)`` pairs.
            Only ``fb_event`` is handed to ``process_doc``. ``len()`` is
            taken on the collection, so a one-shot generator will not work.

    Returns:
        A 2-D numpy array with one row per document and
        ``len(self.features)`` columns. Values are accumulated in an
        ``array.array`` of typecode "f" (single-precision floats).

    Raises:
        ValueError: If the total number of values produced by
            ``process_doc`` does not equal
            ``len(raw_documents) * len(self.features)``.
    """
    # str() keeps the typecode a native str; presumably a guard against
    # unicode_literals on Python 2 -- TODO confirm.
    values = array.array(str("f"))

    # Parenthesised single-argument print behaves the same on Python 2 and 3.
    print("Preloading regexes")
    # Run every rule once through a throwaway processor before the workers
    # start. NOTE(review): presumably this warms a regex cache inside
    # event_classifier so the workers do not each recompile -- confirm.
    dummy_processor = event_classifier.StringProcessor('')
    for _name, rule in named_rules_list:
        dummy_processor.count_tokens(rule)

    print("Computing Features")
    # Fan out across 7 workers only when processing the full data set;
    # otherwise stay with a single job.
    result = Parallel(
        n_jobs=7 if process_all else 1, verbose=10
    )(delayed(process_doc)(fb_event) for _event_id, fb_event in raw_documents)

    # Flatten the per-document rows into one contiguous float buffer.
    for row_values in result:
        values.extend(row_values)

    # reshape() instead of assigning to .shape: same result for this freshly
    # built 1-D array, and the same ValueError on a size mismatch.
    X = np.array(values).reshape(len(raw_documents), len(self.features))
    return X
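# (Web-page residue from the source this snippet was copied from:
# "comment list" / "article table of contents".)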