def get_pipeline(sample_col, parallel_jobs=None):
    """Assemble the feature-extraction and classification pipeline.

    Every callable returned by ``get_objs(FEAT_EXTS_DIR, 'Worker')`` is
    invoked with ``sample_col``; the resulting objects are combined in a
    ``FeatureUnion`` keyed by each object's ``feature_name`` attribute.

    Args:
        sample_col: Passed unchanged to each feature-extractor constructor.
            (Presumably identifies the column holding the samples --
            confirm against the extractor classes.)
        parallel_jobs: Forwarded to ``FeatureUnion`` as ``n_jobs``.
            Defaults to ``None``.

    Returns:
        A ``Pipeline`` with three steps, in order: ``'features'``,
        ``'describe_data'`` and ``'classifier'`` (a ``MultinomialNB``).
    """
    # Instantiate all extractors first, then read their names, so the
    # construction and attribute-access phases stay separate.
    extractors = []
    for worker_cls in get_objs(FEAT_EXTS_DIR, 'Worker'):
        extractors.append(worker_cls(sample_col))

    named_extractors = []
    for extractor in extractors:
        named_extractors.append((extractor.feature_name, extractor))

    feature_union = FeatureUnion(named_extractors, n_jobs=parallel_jobs)
    steps = [
        ('features', feature_union),
        ('describe_data', describe_data.Transformer()),
        ('classifier', MultinomialNB()),
    ]
    return Pipeline(steps)
# Web-page residue, not part of the code: "Comment list" / "Table of contents" headings.