Prateek Joshi prateekjoshi565

## train_model.py
# Path the checkpoint callback writes to; the prediction snippet passes the
# same literal to load_model().
filename = 'model.h1.24_jan_19'

# Checkpoint callback: monitors 'val_loss' with mode='min' and
# save_best_only=True, i.e. the file is only overwritten when the monitored
# validation loss improves. verbose=1 requests a log line per save.
# NOTE(review): ModelCheckpoint is not imported in the visible code —
# presumably keras.callbacks.ModelCheckpoint; confirm.
checkpoint = ModelCheckpoint(filename, monitor='val_loss',
                             verbose=1, save_best_only=True,
                             mode='min')


# train model
history = model.fit(trainX, trainY.reshape(trainY.shape[0], trainY.shape[1], 1),

## predict.py
# Reload the model from the same path the training snippet assigns to `filename`.
model = load_model('model.h1.24_jan_19')

# Reshape testX to 2-D (testX.shape[0], testX.shape[1]) and ask the model for
# class predictions.
# NOTE(review): `predict_classes` was removed from tf.keras in TensorFlow 2.6;
# on newer versions the usual replacement is
# np.argmax(model.predict(...), axis=-1) — confirm which Keras version this targets.
preds = model.predict_classes(testX.reshape((testX.shape[0], testX.shape[1])))

## integer_word_mapping.py
def get_word(n, tokenizer):
    """Return the word whose id in ``tokenizer.word_index`` equals *n*.

    The word -> id mapping is scanned in its iteration order and the first
    word mapped to *n* is returned. ``None`` is returned when no word maps
    to *n*.
    """
    matches = (token for token, idx in tokenizer.word_index.items() if idx == n)
    return next(matches, None)

## prepare_predictions.py
# Translate each predicted id sequence in `preds` into words using
# get_word() and `eng_tokenizer`.
# NOTE(review): this snippet looks truncated — as visible here the token at
# j == 0 is never added to `temp`, and `temp` is never appended to
# `preds_text`, so `preds_text` stays empty. Confirm against the full script.
preds_text = []
for i in preds:
       temp = []
       for j in range(len(i)):
            t = get_word(i[j], eng_tokenizer)
            if j > 0:
                # Emit an empty string when the word repeats the previous
                # position's word or when the id has no entry in the tokenizer.
                if (t==get_word(i[j-1],eng_tokenizer))or(t== None):
                     temp.append('')
                else:
                     temp.append(t)

## import_libraries_elmo.py
import pandas as pd
import numpy as np
import spacy
from tqdm import tqdm
import re
import time
import pickle
pd.set_option('display.max_colwidth', 200)

## remove_url_elmo.py
# Strip links from the raw tweets of both splits: every run of non-whitespace
# characters starting with "http" is deleted and the result is stored in a new
# `clean_tweet` column.
train['clean_tweet'] = train['tweet'].apply(
    lambda tweet: re.sub(r'http\S+', '', tweet)
)

test['clean_tweet'] = test['tweet'].apply(
    lambda tweet: re.sub(r'http\S+', '', tweet)
)

## elmo_example.py
# A single example sentence, wrapped in a list (a batch of one)
x = ["Roasted ants are a popular snack in Columbia"]

# Call the ELMo module with its "default" signature; as_dict=True makes it
# return a dict, from which the "elmo" entry is taken.
# NOTE(review): `elmo` is defined outside this snippet — presumably a
# tensorflow_hub module; confirm.
embeddings = elmo(x, signature="default", as_dict=True)["elmo"]

# Bare expression: displays the shape when run in a notebook/REPL,
# has no effect when run as a script.
embeddings.shape

## elmo_vectors_func.py
def elmo_vectors(x):
  """Return the ELMo features of *x*, averaged over axis 1.

  *x* must provide ``.tolist()``; the resulting list is passed to the
  externally defined ``elmo`` callable with the "default" signature and the
  "elmo" entry of its output dict is used.
  NOTE(review): axis 1 is presumably the token axis, giving one vector per
  input text — confirm against the ELMo module documentation.

  A new ``tf.Session`` is opened on every call; global variables and lookup
  tables are initialised in it before the mean is evaluated.
  """
  token_features = elmo(x.tolist(), signature="default", as_dict=True)["elmo"]
  # Build the averaging op up front; it is only evaluated inside the session.
  mean_features = tf.reduce_mean(token_features, 1)

  with tf.Session() as session:
    session.run(tf.global_variables_initializer())
    session.run(tf.tables_initializer())
    return session.run(mean_features)

## save_pickle_elmo.py
# Serialize the ELMo feature objects to disk.
# `with` closes each file even if pickle.dump raises, which the manual
# open()/close() pairing did not guarantee.

# save elmo_train_new
with open("elmo_train_03032019.pickle", "wb") as pickle_out:
    pickle.dump(elmo_train_new, pickle_out)

# save elmo_test_new
with open("elmo_test_03032019.pickle", "wb") as pickle_out:
    pickle.dump(elmo_test_new, pickle_out)

## load_pickle_elmo.py
# Read the pickled ELMo feature objects back from disk.
# `with` ensures the file handles are closed; the original left both open.
# NOTE: pickle.load can execute arbitrary code embedded in the file — only
# load pickle files that were produced by a trusted source.

# load elmo_train_new
with open("elmo_train_03032019.pickle", "rb") as pickle_in:
    elmo_train_new = pickle.load(pickle_in)

# load elmo_test_new
with open("elmo_test_03032019.pickle", "rb") as pickle_in:
    elmo_test_new = pickle.load(pickle_in)
	# Path the checkpoint callback writes to; the load_model() call further
	# down uses the same literal.
	filename = 'model.h1.24_jan_19'

	# Checkpoint callback: monitors 'val_loss' with mode='min' and
	# save_best_only=True, i.e. the file is only overwritten when the
	# monitored validation loss improves. verbose=1 requests a log line per save.
	# NOTE(review): ModelCheckpoint is not imported in the visible code —
	# presumably keras.callbacks.ModelCheckpoint; confirm.
	checkpoint = ModelCheckpoint(filename, monitor='val_loss',
	verbose=1, save_best_only=True,
	mode='min')


	# train model
	history = model.fit(trainX, trainY.reshape(trainY.shape[0], trainY.shape[1], 1),
	# Reload the model from the same path assigned to `filename` above.
	model = load_model('model.h1.24_jan_19')

	# Reshape testX to 2-D (testX.shape[0], testX.shape[1]) and ask the model
	# for class predictions.
	# NOTE(review): `predict_classes` was removed from tf.keras in TensorFlow 2.6;
	# on newer versions the usual replacement is
	# np.argmax(model.predict(...), axis=-1) — confirm which Keras version this targets.
	preds = model.predict_classes(testX.reshape((testX.shape[0], testX.shape[1])))
	def get_word(n, tokenizer):
		"""Return the word whose id in ``tokenizer.word_index`` equals *n*.

		The word -> id mapping is scanned in its iteration order and the
		first match is returned; ``None`` is returned when no word maps to *n*.
		"""
		# Nesting restored: the flattened copy had lost all block indentation,
		# leaving the def without a body.
		for word, index in tokenizer.word_index.items():
			if index == n:
				return word
		return None
	# Translate each predicted id sequence in `preds` into words using
	# get_word() and `eng_tokenizer`. Block nesting restored from the flattened
	# copy so the loops and conditionals are valid Python again.
	# NOTE(review): the snippet looks truncated — as visible here the token at
	# j == 0 is never added to `temp`, and `temp` is never appended to
	# `preds_text`. Confirm against the full script.
	preds_text = []
	for i in preds:
		temp = []
		for j in range(len(i)):
			t = get_word(i[j], eng_tokenizer)
			if j > 0:
				# Emit an empty string when the word repeats the previous
				# position's word or the id has no entry in the tokenizer.
				if (t == get_word(i[j-1], eng_tokenizer)) or (t is None):
					temp.append('')
				else:
					temp.append(t)
	import pandas as pd
	import numpy as np
	import spacy
	from tqdm import tqdm
	import re
	import time
	import pickle
	pd.set_option('display.max_colwidth', 200)
	# Strip links from the raw tweets of both splits: every run of
	# non-whitespace characters starting with "http" is deleted and the result
	# is stored in a new `clean_tweet` column.
	train['clean_tweet'] = train['tweet'].apply(
		lambda tweet: re.sub(r'http\S+', '', tweet)
	)

	test['clean_tweet'] = test['tweet'].apply(
		lambda tweet: re.sub(r'http\S+', '', tweet)
	)
	# A single example sentence, wrapped in a list (a batch of one)
	x = ["Roasted ants are a popular snack in Columbia"]

	# Call the ELMo module with its "default" signature; as_dict=True makes it
	# return a dict, from which the "elmo" entry is taken.
	# NOTE(review): `elmo` is defined outside this snippet — presumably a
	# tensorflow_hub module; confirm.
	embeddings = elmo(x, signature="default", as_dict=True)["elmo"]

	# Bare expression: displays the shape when run in a notebook/REPL,
	# has no effect when run as a script.
	embeddings.shape
	def elmo_vectors(x):
		"""Return the ELMo features of *x*, averaged over axis 1.

		*x* must provide ``.tolist()``; the resulting list is passed to the
		externally defined ``elmo`` callable with the "default" signature and
		the "elmo" entry of its output dict is used.
		NOTE(review): axis 1 is presumably the token axis, giving one vector
		per input text — confirm against the ELMo module documentation.

		A new ``tf.Session`` is opened on every call; global variables and
		lookup tables are initialised in it before the mean is evaluated.
		"""
		# Nesting restored: the flattened copy had lost the function body and
		# the `with` block indentation.
		embeddings = elmo(x.tolist(), signature="default", as_dict=True)["elmo"]

		with tf.Session() as sess:
			sess.run(tf.global_variables_initializer())
			sess.run(tf.tables_initializer())
			# return average of ELMo features
			return sess.run(tf.reduce_mean(embeddings, 1))
	# Serialize the ELMo feature objects to disk.
	# `with` closes each file even if pickle.dump raises, which the manual
	# open()/close() pairing did not guarantee.

	# save elmo_train_new
	with open("elmo_train_03032019.pickle", "wb") as pickle_out:
		pickle.dump(elmo_train_new, pickle_out)

	# save elmo_test_new
	with open("elmo_test_03032019.pickle", "wb") as pickle_out:
		pickle.dump(elmo_test_new, pickle_out)
	# Read the pickled ELMo feature objects back from disk.
	# `with` ensures the file handles are closed; the original left both open.
	# NOTE: pickle.load can execute arbitrary code embedded in the file — only
	# load pickle files that were produced by a trusted source.

	# load elmo_train_new
	with open("elmo_train_03032019.pickle", "rb") as pickle_in:
		elmo_train_new = pickle.load(pickle_in)

	# load elmo_test_new
	with open("elmo_test_03032019.pickle", "rb") as pickle_in:
		elmo_test_new = pickle.load(pickle_in)