Update 4.Text_Preprocessing.py

2eacca06 · Ramachandran Rajeevaletshanth · 381b4c9d · 2eacca06
Commit 2eacca06 authored Jul 09, 2021 by Ramachandran Rajeevaletshanth
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 6 additions and 4 deletions

IT17163682/4.Text_Preprocessing.py IT17163682/4.Text_Preprocessing.py +6 -4

No files found.
--- a/IT17163682/4.Text_Preprocessing.py
+++ b/IT17163682/4.Text_Preprocessing.py
@@ -9,8 +9,10 @@ from collections import Counter
 import re
 import unidecode

-res = open("ResumeStr.txt").read()
-tweet = open('Tweet.txt').read()
+#nltk.download('stopwords')
+
+res = open("Experience.txt",'r', encoding='utf-8').read()
+tweet = open('Tweet.txt','r', encoding='utf-8').read()

 #Lower case conversion
 def lower_case_convertion(text):
@@ -87,7 +89,7 @@ def lemmatization(text):
 # initialize lemmatizer object
 lemma = WordNetLemmatizer()
 res = lemmatization(res)
-tweet = lemmatization(tweet)
+

 # Implementation of removing punctuations using string library
 def remove_punctuation(text):
@@ -227,7 +229,7 @@ tweet = '\n'.join(k)
 #print(res)
 #print(tweet)

-with open("ClearText.txt", "w") as text_file:
+with open("Experience.txt", "w") as text_file:
    print(res, file=text_file)

 with open("Tweet.txt", "w") as text_file: