def extract_feature(sentence):
    """Count stemmed word occurrences in *sentence*.

    The sentence is split on whitespace. Each token for which
    ``include_stopword`` returns a truthy value is skipped; every other
    token is passed through ``stem.PorterStemmer().stem`` and the count
    for the resulting stem is incremented.

    Args:
        sentence: The text to process; must provide ``split()``.

    Returns:
        A ``defaultdict`` mapping each stem to the number of times it
        occurred. Missing keys default to ``0``, so merely reading an
        absent key on the returned mapping inserts it.
    """
    # NOTE(review): `stem` is presumably nltk.stem and `include_stopword`
    # a stop-word predicate defined elsewhere -- confirm against the
    # file's imports/helpers.
    counts = defaultdict(lambda: 0)
    porter = stem.PorterStemmer()

    for token in sentence.split():
        if include_stopword(token):
            # Flagged tokens contribute nothing to the feature counts.
            continue
        counts[porter.stem(token)] += 1

    return counts