Initial commit

parent c71d63e4
...@@ -79,11 +79,6 @@ class TopicCluster: ...@@ -79,11 +79,6 @@ class TopicCluster:
X = count_vectorizer.fit_transform(texts) X = count_vectorizer.fit_transform(texts)
# print(count_vectorizer.get_feature_names()) # print(count_vectorizer.get_feature_names())
tfidf_vectorizer = TfidfVectorizer(
stop_words='english', tokenizer=stemming_tokenizer, use_idf=False, norm='l1')
X = tfidf_vectorizer.fit_transform(texts)
pd.DataFrame(X.toarray(), columns=tfidf_vectorizer.get_feature_names())
tfidf_vectorizer = TfidfVectorizer( tfidf_vectorizer = TfidfVectorizer(
stop_words='english', tokenizer=stemming_tokenizer, use_idf=False, norm='l1') stop_words='english', tokenizer=stemming_tokenizer, use_idf=False, norm='l1')
X = tfidf_vectorizer.fit_transform(texts) X = tfidf_vectorizer.fit_transform(texts)
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment