# anujdutt9/RNN_LanguageModel2.py

## RNN_LanguageModel2.py
# Step 1: Training Data and Preprocessing
#       a) Tokenize the input text (sentences to words)
#       b) Form the vocabulary and remove infrequent words
#       c) Add "Start" and "End" tokens to the sentences
#
# Module-level settings for this step. Each name is assigned exactly once,
# at column 0, so the module stays importable.

# Vocabulary size: 8000 words
vocab_size = 8000

# Token to replace the infrequent words
unknown_token = 'Unknown_Token'

# Sentence start and end tokens
sentence_start_token = 'Sentence_Start'
sentence_end_token = 'Sentence_End'