Skip to content

Instantly share code, notes, and snippets.

View andrewtremblay's full-sized avatar
🕵️‍♂️
Working on secret stuff.

Andrew Tremblay andrewtremblay

🕵️‍♂️
Working on secret stuff.
View GitHub Profile
@andrewtremblay
andrewtremblay / 1000_words.txt
Created January 3, 2016 08:59
Custom Corpus
the
of
to
and
a
in
is
it
you
that
import nltk
# Find every corpus word that can be spelled using only the letters of
# `jumbled_letters`, using each letter no more often than it appears there.

# Word list from NLTK's `words` corpus.
all_words = nltk.corpus.words.words()
# A single %-formatted string prints the same line under both the Python 2
# print statement and the Python 3 print function.
print("%d total words loaded" % len(all_words))

# Pool of letters the candidate words must be drawn from.
jumbled_letters = "andrewtremblay"
# Per-letter counts of the pool.
letter_distribution = nltk.FreqDist(jumbled_letters)

# Lowercase each word BEFORE comparing it with the (all-lowercase) pool;
# otherwise capitalised corpus entries such as proper nouns can never match.
# `FreqDist <= FreqDist` holds when every letter of the word occurs in the
# pool at least as many times as it occurs in the word.
matching_wordlist = [
    candidate
    for candidate in (w.lower() for w in all_words)
    if nltk.FreqDist(candidate) <= letter_distribution
]
import nltk
# Load the word list from NLTK's `words` corpus and report how many entries
# it contains.
all_words = nltk.corpus.words.words()
# A single %-formatted string prints the same line under both the Python 2
# print statement and the Python 3 print function.
print("%d total words loaded" % len(all_words))
import nltk
# Set-up for an anagram search over the letters of `jumbled_letters`.

# The phrase whose letters are to be rearranged, its length, and its
# per-letter counts.
jumbled_letters = "andrewtremblay"
len_full_phrase = len(jumbled_letters)
letter_distribution = nltk.FreqDist(jumbled_letters)

# Collector for results; nothing in this section fills it yet.
anagram_results = []

# Word list from NLTK's `words` corpus.
all_words = nltk.corpus.words.words()

# Lowercased copies of every word that is no longer than the phrase;
# longer words are dropped.
trimmed_lowercase_wordlist = []
for w in all_words:
    if len(w) <= len_full_phrase:
        trimmed_lowercase_wordlist.append(w.lower())