def transform(self):
    """Return an SVD-reduced embedding of the paired TF-IDF features.

    A word n-gram TF-IDF vectorizer is created via
    ``self._init_word_ngram_tfidf`` and ``fit_transform`` is called on it
    twice: first with ``self.obs_corpus``, then with ``self.target_corpus``.
    The two resulting matrices are concatenated column-wise, converted to
    CSR, and passed to ``TruncatedSVD.fit_transform``.

    Returns:
        The output of ``TruncatedSVD.fit_transform`` on the stacked matrix,
        configured with ``self.svd_dim`` components, ``self.svd_n_iter``
        iterations and ``config.RANDOM_SEED`` as the random state.
    """
    # --- TF-IDF ---
    vectorizer = self._init_word_ngram_tfidf(ngram=self.ngram)
    # The same vectorizer object is fit a second time for the target corpus;
    # the matrices are only stacked side by side, never compared column to
    # column.
    obs_matrix = vectorizer.fit_transform(self.obs_corpus)
    target_matrix = vectorizer.fit_transform(self.target_corpus)
    paired_matrix = scipy.sparse.hstack([obs_matrix, target_matrix]).tocsr()

    # --- SVD ---
    reducer = TruncatedSVD(
        n_components=self.svd_dim,
        n_iter=self.svd_n_iter,
        random_state=config.RANDOM_SEED,
    )
    return reducer.fit_transform(paired_matrix)
# -------------------------------- TSNE ------------------------------------------
# 2nd in CrowdFlower (preprocessing_mikhail.py)
feature_vector_space.py 文件源码
python
阅读 24
收藏 0
点赞 0
评论 0
评论列表
文章目录