# mohdsanadzakirizvi/lm_val.py

## lm_val.py
from sklearn.model_selection import train_test_split

# Vocabulary size: the number of entries in `mapping`; passed below as
# `num_classes` when the targets are one-hot encoded.
vocab = len(mapping)

# Work on a NumPy array so the sequences can be sliced column-wise.
sequences = np.array(sequences)

# Inputs: every column of each sequence except the last one.
X = sequences[:, :-1]
# Targets: the last column of each sequence, one-hot encoded.
y = to_categorical(sequences[:, -1], num_classes=vocab)

# Hold out 10% of the samples for validation; the fixed random_state keeps
# the split reproducible from run to run.
X_tr, X_val, y_tr, y_val = train_test_split(
    X,
    y,
    test_size=0.1,
    random_state=42,
)

print('Train shape:', X_tr.shape, 'Val shape:', X_val.shape)
	# NOTE(review): this tab-indented block repeats the top-level statements
	# that precede it, and no enclosing `def`/`class`/`if` header is visible.
	# Confirm whether it is a leftover copy before relying on it.
	from sklearn.model_selection import train_test_split

	# vocabulary size: the number of entries in `mapping`, used below as the
	# number of one-hot classes
	vocab = len(mapping)
	# convert to a NumPy array so the 2-D column slicing below works
	sequences = np.array(sequences)
	# create X and y: X is every column except the last, y is the last column
	X, y = sequences[:,:-1], sequences[:,-1]
	# one hot encode y (presumably Keras' `to_categorical` -- confirm the import)
	y = to_categorical(y, num_classes=vocab)
	# create train and validation sets: 10% of the samples are held out for
	# validation, with a fixed random_state so the split is reproducible
	X_tr, X_val, y_tr, y_val = train_test_split(X, y, test_size=0.1, random_state=42)

	print('Train shape:', X_tr.shape, 'Val shape:', X_val.shape)