def train_test():
    """Return the accuracy of a bag-of-words Naive Bayes model on a held-out split.

    Reads ``X`` (raw documents) and ``y`` (labels) from the enclosing scope,
    splits them with ``train_test_split`` using ``random_state=2``, and then:

    1. fits a ``CountVectorizer`` on the training documents only,
    2. encodes the test documents with that same fitted vectorizer,
    3. trains ``MultinomialNB`` on the training document-term matrix,
    4. scores the predicted classes for the test documents.

    Returns:
        The value of ``metrics.accuracy_score`` for the test labels versus
        the predicted classes.
    """
    docs_train, docs_test, labels_train, labels_test = train_test_split(
        X, y, random_state=2
    )

    # The vocabulary is learned from the training documents alone; the test
    # documents are only transformed, never used for fitting.
    vectorizer = CountVectorizer()
    train_matrix = vectorizer.fit_transform(docs_train)
    test_matrix = vectorizer.transform(docs_test)

    classifier = MultinomialNB()
    classifier.fit(train_matrix, labels_train)
    predicted_labels = classifier.predict(test_matrix)

    return metrics.accuracy_score(labels_test, predicted_labels)
# print(train_test())
# (web-page residue) Comment list
# (web-page residue) Article table of contents