import torch

def one_hot_encode(encoded, vocab_size):
    result = torch.zeros((len(encoded), vocab_size))
    for i, idx in enumerate(encoded):
        result[i, idx] = 1.0
    return result

# One-hot encode our encoded characters
batch_size = 2
seq_length = 3
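To see what `one_hot_encode` produces, here is the same logic as a pure-Python sketch (a hypothetical helper, shown without torch so the shapes are easy to read): each input index becomes a row with a single 1.0 at that index.

```python
def one_hot_encode_list(encoded, vocab_size):
    # Pure-Python mirror of the torch one_hot_encode above, for illustration
    result = [[0.0] * vocab_size for _ in encoded]
    for i, idx in enumerate(encoded):
        result[i][idx] = 1.0
    return result
```

For example, `one_hot_encode_list([0, 2], 4)` gives two rows of length 4, with ones in columns 0 and 2.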
torch.manual_seed(1)  # reproducibility

#### Define the network parameters:
hiddenSize = 2  # network size; this can be any number (depending on your task)
numClass = 4    # this is the same as our vocab_size

#### Weight matrices for our inputs
Wz = Variable(torch.randn(vocab_size, hiddenSize), requires_grad=True)
Wr = Variable(torch.randn(vocab_size, hiddenSize), requires_grad=True)
Wh = Variable(torch.randn(vocab_size, hiddenSize), requires_grad=True)
def gru(x, h):
    outputs = []
    for i, sequence in enumerate(x):  # iterates over the sequences in each batch
        z = torch.sigmoid(torch.matmul(sequence, Wz) + torch.matmul(h, Uz) + bz)  # update gate
        r = torch.sigmoid(torch.matmul(sequence, Wr) + torch.matmul(h, Ur) + br)  # reset gate
        h_tilde = torch.tanh(torch.matmul(sequence, Wh) + torch.matmul(r * h, Uh) + bh)  # candidate state
        h = z * h + (1 - z) * h_tilde
        # Linear layer
        y_linear = torch.matmul(h, Wy) + by
        outputs.append(y_linear)
    return outputs, h
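The gate arithmetic inside the loop is easier to check on a single scalar unit. Here is one GRU update step as a pure-Python sketch (a hypothetical helper mirroring the tensor code above, not part of the gist):

```python
import math

def sigmoid(v):
    return 1.0 / (1.0 + math.exp(-v))

def gru_step(x, h, Wz, Uz, bz, Wr, Ur, br, Wh, Uh, bh):
    # One GRU update for a single scalar unit
    z = sigmoid(x * Wz + h * Uz + bz)                # update gate
    r = sigmoid(x * Wr + h * Ur + br)                # reset gate
    h_tilde = math.tanh(x * Wh + (r * h) * Uh + bh)  # candidate state
    return z * h + (1 - z) * h_tilde                 # blend old state and candidate
```

With all weights and biases zero, both gates sit at sigmoid(0) = 0.5 and the candidate is tanh(0) = 0, so the new state is simply half the old one: the update gate `z` really does interpolate between keeping `h` and adopting `h_tilde`.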
def sample(primer, length_chars_predict):
    word = primer
    primer_dictionary = [character_dictionary[char] for char in word]
    test_input = one_hot_encode(primer_dictionary, vocab_size)
    h = torch.zeros(1, hiddenSize)
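The snippet above is cut off before the generation loop, but the selection step it builds toward is simple: given a probability row from the output layer, pick the most likely index and map it back to a character. A minimal sketch of that step (hypothetical helper names, using plain lists):

```python
def pick_next_char(probs, index_to_char):
    # Choose the index with the highest probability, then map it back to its character
    best = max(range(len(probs)), key=lambda k: probs[k])
    return index_to_char[best]
```

In a full sampler this would run once per predicted character, feeding each picked character back in as the next input.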
character_list = list(set(text))  # get all of the unique letters in our text variable
vocabulary_size = len(character_list)  # count the number of unique elements
character_dictionary = {char: e for e, char in enumerate(character_list)}  # create a dictionary mapping each unique char to a number
encoded_chars = [character_dictionary[char] for char in text]  # integer representation of our vocabulary
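A quick worked example of this encoding. Note that `set()` iteration order is not guaranteed, so the sketch below uses `sorted()` to make the mapping deterministic for illustration (the `demo_` names are hypothetical, chosen to avoid clobbering the variables above):

```python
demo_text = 'Math'
demo_chars = sorted(set(demo_text))  # sorted() fixes the ordering; a bare set is unordered
demo_dictionary = {char: e for e, char in enumerate(demo_chars)}
demo_encoded = [demo_dictionary[char] for char in demo_text]
```

With ASCII ordering ('M' < 'a' < 'h' < 't'), the mapping is {'M': 0, 'a': 1, 'h': 2, 't': 3} and 'Math' encodes to [0, 1, 3, 2].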
# Input text
# This will be our input ---> x
text = 'MathMathMathMathMath'

# Training loop
max_epochs = 5  # passes through the data
for e in range(max_epochs):
    h = torch.zeros(batch_size, hiddenSize)
    for i in range(num_batches):
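The loop above uses `num_batches` and batched inputs `X[i]`, which are not defined in this excerpt. One plausible way to derive them, sketched here with plain lists (a hypothetical helper, not the gist's own code): split the encoded text into chunks of `batch_size * seq_length` characters and drop any leftover tail.

```python
def make_batches(encoded, batch_size, seq_length):
    # Split a flat list of character indices into num_batches chunks,
    # each shaped (batch_size, seq_length); leftover characters are dropped
    chars_per_batch = batch_size * seq_length
    num_batches = len(encoded) // chars_per_batch
    batches = []
    for b in range(num_batches):
        chunk = encoded[b * chars_per_batch:(b + 1) * chars_per_batch]
        batches.append([chunk[s * seq_length:(s + 1) * seq_length]
                        for s in range(batch_size)])
    return batches
```

For the 20-character text above with batch_size = 2 and seq_length = 3, each batch holds 6 characters, giving 20 // 6 = 3 batches (2 characters are discarded). Each row of a batch would then be one-hot encoded before being fed to `gru()`.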
ht_2 = []  # stores the calculated h for each input x
outputs = []
h = torch.zeros(batch_size, hiddenSize)  # initializes the hidden state
for i in range(num_batches):  # this loops over the batches
    x = X[i]
    for t, sequence in enumerate(x):  # iterates over the sequences in each batch
        z = torch.sigmoid(torch.matmul(sequence, Wz) + torch.matmul(h, Uz) + bz)
        r = torch.sigmoid(torch.matmul(sequence, Wr) + torch.matmul(h, Ur) + br)
        h_tilde = torch.tanh(torch.matmul(sequence, Wh) + torch.matmul(r * h, Uh) + bh)
        h = z * h + (1 - z) * h_tilde
        ht_2.append(h)  # record the hidden state at this step
        outputs.append(torch.softmax(torch.matmul(h, Wy) + by, dim=1))  # class probabilities
hidden_batch_1 = ht_2[:3]
outputs_batch_1 = outputs[:3]
print(f' Predictions for the first batch: \n\n{outputs_batch_1}, \
\n \n Hidden states for the first batch: \n{hidden_batch_1}')
'''
Predictions for the first batch:
tensor([[[0.4342, 0.1669, 0.1735, 0.2254],
        [0.2207, 0.2352, 0.3322, 0.2119]],