# VincentTatan/tokenization.py

## tokenization.py
"""Build a word index from a few sample sentences with the Keras Tokenizer.

Running this script fits a ``Tokenizer`` on ``sentences`` and prints the
resulting word -> integer-index mapping.
"""
from tensorflow.keras.preprocessing.text import Tokenizer

# Small toy corpus used to fit the tokenizer.
sentences = [
    'I eat chicken',
    'I do not eat fish',
    'Did you eat fish?',
]

# num_words caps the vocabulary size used when texts are later converted to
# sequences; oov_token is the placeholder assigned to words that were not
# seen while fitting.
tokenizer = Tokenizer(num_words=100, oov_token="<OOV>")

# Scan the corpus and build the vocabulary.
tokenizer.fit_on_texts(sentences)

# Mapping of each word seen during fitting to its integer index.
# NOTE(review): with Keras' default settings the text is lowercased and
# punctuation is stripped, so "fish?" and "fish" should share one entry --
# confirm against the Tokenizer documentation for the installed version.
word_index = tokenizer.word_index

print(word_index)