Skip to content

Instantly share code, notes, and snippets.

View josephcc's full-sized avatar
💭

Joseph Chang josephcc

💭
View GitHub Profile
import nltk
from nltk.tokenize.treebank import TreebankWordTokenizer
class TreebankSpanTokenizer(TreebankWordTokenizer):
def __init__(self):
    """Instantiate a TreebankWordTokenizer and store it on the instance."""
    # The tokenizer is kept under the private attribute ``_word_tokenizer``.
    delegate = TreebankWordTokenizer()
    self._word_tokenizer = delegate
def span_tokenize(self, text):