Initial commit

parent c71d63e4
......@@ -79,11 +79,6 @@ class TopicCluster:
X = count_vectorizer.fit_transform(texts)
# print(count_vectorizer.get_feature_names())
tfidf_vectorizer = TfidfVectorizer(
stop_words='english', tokenizer=stemming_tokenizer, use_idf=False, norm='l1')
X = tfidf_vectorizer.fit_transform(texts)
pd.DataFrame(X.toarray(), columns=tfidf_vectorizer.get_feature_names())
tfidf_vectorizer = TfidfVectorizer(
stop_words='english', tokenizer=stemming_tokenizer, use_idf=False, norm='l1')
X = tfidf_vectorizer.fit_transform(texts)
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment