Ran Pelta ranpelta

## import_packages.py
# import packages
import pandas as pd
import numpy as np
import keras
import matplotlib.pyplot as plt
from sklearn.preprocessing import MinMaxScaler
from pandas.plotting import register_matplotlib_converters
register_matplotlib_converters()
from keras.preprocessing.sequence import TimeseriesGenerator
from keras.models import Sequential

## keras RNN for towards data science.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                ranpelta
                / keras RNN for towards data science.ipynb
            
            
              Created
              July 17, 2020 12:21
            
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## step1 - import packages.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                ranpelta
                / step1 - import packages.ipynb
            
            
              Created
              July 17, 2020 13:07
            
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## step2 - get and plot data.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                ranpelta
                / step2 - get and plot data.ipynb
            
            
              Created
              July 17, 2020 13:33
            
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## step1 - import packages.py
# import packages
import pandas as pd
import numpy as np
import keras
import matplotlib.pyplot as plt
from sklearn.preprocessing import MinMaxScaler
from pandas.plotting import register_matplotlib_converters
register_matplotlib_converters()
from keras.preprocessing.sequence import TimeseriesGenerator
from keras.models import Sequential

## step2 - read the data.py
# Name of the target column, i.e. the variable we want to predict.
y_col = 'y'

# Load the pickled dataset into a DataFrame (the path below is a placeholder).
# NOTE: unpickling can execute arbitrary code, so only load files you trust.
df = pd.read_pickle(r'C:\..........\data.pkl')

# Report the dataset dimensions as (number of rows, number of columns).
print(df.shape)

# Preview the first rows; as the last expression of a notebook cell this is
# what gets displayed.
df.head()

## Optional step - plot the data.py
# Plot the target column against its positional row number (0 .. len(df) - 1)
# on a very wide, short figure.
row_positions = range(len(df))
plt.figure(figsize=(50, 4))
plt.plot(row_positions, df[y_col]);  # trailing ';' keeps a notebook from echoing the return value

## split the data to train and test.py
# Hold out the last 10% (0.1) of the rows as the test set. There is no
# shuffling: the test set is simply the final `test_size` rows of df.
test_size = int(len(df) * 0.1)

# Slice at an explicit positive position instead of at -test_size: when
# test_size is 0 (fewer than 10 rows), -0 == 0, so df.iloc[:-0] would be empty
# and df.iloc[-0:] would be the whole frame, i.e. train and test would swap.
split_at = len(df) - test_size

# .copy() makes train and test independent frames; without it, assigning into
# them later can raise pandas' SettingWithCopyWarning ("A value is trying to
# be set on a copy of a slice from a DataFrame").
train = df.iloc[:split_at, :].copy()
test = df.iloc[split_at:, :].copy()
print(train.shape, test.shape)

>>> (28916, 4) (3212, 4)

## plot train and test.py
# Draw the train and test partitions on one wide figure, each against its own
# index, so the two appear as separately labelled lines.
plt.figure(figsize=(50, 4))
for part, part_label in ((train, 'Train'), (test, 'test')):
    plt.plot(part.index, part[y_col], label=part_label)
plt.legend();  # trailing ';' keeps a notebook from echoing the return value

## separate X and y.py
# Split the train data (only the train data, for now) into features and target.
# Features: every column except the target.
X_train = train.drop(columns=y_col).copy()
# Target: selecting with a list of labels keeps y as a one-column DataFrame;
# selecting with a bare label would give a pandas Series instead.
y_train = train.loc[:, [y_col]].copy()
print(X_train.shape, y_train.shape)

>>> (28916, 3) (28916, 1)
	# import packages
	import pandas as pd
	import numpy as np
	import keras
	import matplotlib.pyplot as plt
	from sklearn.preprocessing import MinMaxScaler
	from pandas.plotting import register_matplotlib_converters
	register_matplotlib_converters()
	from keras.preprocessing.sequence import TimeseriesGenerator
	from keras.models import Sequential
	# Name of the target column, i.e. the variable we want to predict.
	y_col = 'y'

	# Load the pickled dataset into a DataFrame (the path below is a placeholder).
	# NOTE: unpickling can execute arbitrary code, so only load files you trust.
	df = pd.read_pickle(r'C:\..........\data.pkl')

	# Report the dataset dimensions as (number of rows, number of columns).
	print(df.shape)

	# Preview the first rows of the dataset.
	df.head()
	# Plot the target column against its positional row number (0 .. len(df) - 1)
	# on a very wide, short figure.
	row_positions = range(len(df))
	plt.figure(figsize=(50, 4))
	plt.plot(row_positions, df[y_col]);  # trailing ';' keeps a notebook from echoing the return value
	# Hold out the last 10% (0.1) of the rows as the test set. There is no
	# shuffling: the test set is simply the final `test_size` rows of df.
	test_size = int(len(df) * 0.1)

	# Slice at an explicit positive position instead of at -test_size: when
	# test_size is 0 (fewer than 10 rows), -0 == 0, so df.iloc[:-0] would be empty
	# and df.iloc[-0:] would be the whole frame, i.e. train and test would swap.
	split_at = len(df) - test_size

	# .copy() makes train and test independent frames; without it, assigning into
	# them later can raise pandas' SettingWithCopyWarning ("A value is trying to
	# be set on a copy of a slice from a DataFrame").
	train = df.iloc[:split_at, :].copy()
	test = df.iloc[split_at:, :].copy()
	print(train.shape, test.shape)

	>>> (28916, 4) (3212, 4)
	# Draw the train and test partitions on one wide figure, each against its own
	# index, so the two appear as separately labelled lines.
	plt.figure(figsize=(50, 4))
	for part, part_label in ((train, 'Train'), (test, 'test')):
		plt.plot(part.index, part[y_col], label=part_label)
	plt.legend();  # trailing ';' keeps a notebook from echoing the return value
	# Split the train data (only the train data, for now) into features and target.
	# Features: every column except the target.
	X_train = train.drop(columns=y_col).copy()
	# Target: selecting with a list of labels keeps y as a one-column DataFrame;
	# selecting with a bare label would give a pandas Series instead.
	y_train = train.loc[:, [y_col]].copy()
	print(X_train.shape, y_train.shape)

	>>> (28916, 3) (28916, 1)