# Source: GitHub Gist by Lucas Chaves Lima (lcschv).
from nltk.probability import FreqDist
import math
import pickle
from top2vec import Top2Vec
import numpy as np
from gensim.utils import simple_preprocess
from gensim.parsing.preprocessing import strip_tags
def default_tokenizer(doc):