# somyamohanty/text_collocation.py

## text_collocation.py
import nltk
# Toy corpus: each string is treated as one document.
docs = ['hi this is a test', 'testing done for now', 'today is a test']

# Tokenize every document into a list of tokens.
# NOTE: nltk.word_tokenize needs the NLTK tokenizer data to be installed.
docs_l = [nltk.word_tokenize(sentence) for sentence in docs]

# BigramCollocationFinder is reached through nltk.collocations; the bare name
# was never imported and raised NameError.
finder = nltk.collocations.BigramCollocationFinder.from_documents(docs_l)
bigram_measures = nltk.collocations.BigramAssocMeasures()

# Score every bigram found in the corpus with the raw_freq measure.
print(finder.score_ngrams(bigram_measures.raw_freq))

# Raw bigram counts. viewitems() exists only on Python 2 dicts; items() works
# on both Python 2 and 3. Printing makes the counts visible when this runs as
# a script rather than in an interactive session.
print(list(finder.ngram_fd.items()))
	import nltk

	# Toy corpus: each string is treated as one document.
	docs = ['hi this is a test', 'testing done for now', 'today is a test']

	# Tokenize every document into a list of tokens. The original loop body
	# had lost its indentation, which is a syntax error.
	# NOTE: nltk.word_tokenize needs the NLTK tokenizer data to be installed.
	docs_l = [nltk.word_tokenize(sentence) for sentence in docs]

	# BigramCollocationFinder is reached through nltk.collocations; the bare
	# name was never imported and raised NameError.
	finder = nltk.collocations.BigramCollocationFinder.from_documents(docs_l)
	bigram_measures = nltk.collocations.BigramAssocMeasures()

	# Score every bigram found in the corpus with the raw_freq measure.
	print(finder.score_ngrams(bigram_measures.raw_freq))

	# Raw bigram counts. viewitems() exists only on Python 2 dicts; items()
	# works on both Python 2 and 3. Printing makes the counts visible when
	# this runs as a script rather than in an interactive session.
	print(list(finder.ngram_fd.items()))