# andy51002000/BagOfWord.py

## BagOfWord.py
import pandas as pd
from sklearn.feature_extraction.text import CountVectorizer


# Toy corpus: three short sentences that differ only in the animal named.
corpus = [
    'The cat sat on the mat',
    'The dog sat on the mat',
    'The goat sat on the mat',
]

# Word-level bag-of-words model. Text is lowercased before tokenizing, and
# binary=False keeps per-document occurrence counts instead of 0/1 flags.
vectorizer = CountVectorizer(lowercase=True, analyzer='word', binary=False)

# Learn the vocabulary from the corpus and build the document-term matrix
# (one row per document, one column per vocabulary term).
representation = vectorizer.fit_transform(corpus)

# vocabulary_ maps each term to its column index in the matrix. Ordering the
# terms by that index keeps the column labels aligned with the matrix columns
# without relying on the indices happening to follow alphabetical order.
representation_df = pd.DataFrame(
    data=representation.toarray(),
    columns=sorted(vectorizer.vocabulary_, key=vectorizer.vocabulary_.get),
)