# amankharwal/resume screening.py Secret

## resume screening.py
import nltk
from nltk.corpus import stopwords
import string
from wordcloud import WordCloud

# Word-frequency summary and word cloud over (at most) the first 160 resumes.
# Uses names that are not defined in this part of the file: `resumeDataSet`
# (its 'Resume' column is read), `cleanResume` (called on each raw resume;
# its result is tokenized and joined as text) and `plt` (used for plotting).

# Tokens to ignore: NLTK's English stop-word list plus the literal tokens
# `` and ''.
oneSetOfStopWords = set(stopwords.words('english')+['``',"''"])
totalWords =[]
Sentences = resumeDataSet['Resume'].values

# Slice rather than index over range(0, 160): the cap of 160 resumes is kept,
# but a shorter dataset no longer raises IndexError.
cleanedResumes = []
for rawResume in Sentences[:160]:
    cleanedText = cleanResume(rawResume)
    cleanedResumes.append(cleanedText)
    requiredWords = nltk.word_tokenize(cleanedText)
    # `in string.punctuation` is a substring test on a str: it drops single
    # punctuation characters (and any token that is a contiguous run of that
    # string).
    totalWords.extend(
        word
        for word in requiredWords
        if word not in oneSetOfStopWords and word not in string.punctuation
    )

# Join once, with a space between resumes, so the last word of one resume
# does not fuse with the first word of the next in the word-cloud input.
cleanedSentences = " ".join(cleanedResumes)

# Print the 50 most frequent remaining tokens with their counts.
wordfreqdist = nltk.FreqDist(totalWords)
mostcommon = wordfreqdist.most_common(50)
print(mostcommon)

# Render a word cloud of the combined cleaned text, without axes.
wc = WordCloud().generate(cleanedSentences)
plt.figure(figsize=(15,15))
plt.imshow(wc, interpolation='bilinear')
plt.axis("off")
plt.show()
	import nltk
	from nltk.corpus import stopwords
	import string
	from wordcloud import WordCloud

	# Word-frequency summary and word cloud over (at most) the first 160 resumes.
	# Uses names that are not defined in this part of the file: `resumeDataSet`
	# (its 'Resume' column is read), `cleanResume` (called on each raw resume;
	# its result is tokenized and joined as text) and `plt` (used for plotting).
	# The loop nesting below was restored; the pasted text had every line at
	# the same indentation level.

	# Tokens to ignore: NLTK's English stop-word list plus the literal tokens
	# `` and ''.
	oneSetOfStopWords = set(stopwords.words('english')+['``',"''"])
	totalWords =[]
	Sentences = resumeDataSet['Resume'].values

	# Slice rather than index over range(0, 160): the cap of 160 resumes is
	# kept, but a shorter dataset no longer raises IndexError.
	cleanedResumes = []
	for rawResume in Sentences[:160]:
		cleanedText = cleanResume(rawResume)
		cleanedResumes.append(cleanedText)
		requiredWords = nltk.word_tokenize(cleanedText)
		# `in string.punctuation` is a substring test on a str: it drops single
		# punctuation characters (and any token that is a contiguous run of
		# that string).
		for word in requiredWords:
			if word not in oneSetOfStopWords and word not in string.punctuation:
				totalWords.append(word)

	# Join once, with a space between resumes, so the last word of one resume
	# does not fuse with the first word of the next in the word-cloud input.
	cleanedSentences = " ".join(cleanedResumes)

	# Print the 50 most frequent remaining tokens with their counts.
	wordfreqdist = nltk.FreqDist(totalWords)
	mostcommon = wordfreqdist.most_common(50)
	print(mostcommon)

	# Render a word cloud of the combined cleaned text, without axes.
	wc = WordCloud().generate(cleanedSentences)
	plt.figure(figsize=(15,15))
	plt.imshow(wc, interpolation='bilinear')
	plt.axis("off")
	plt.show()