Allie .S Ubisse AllieUbisse

## ec2run.sh
#!/bin/bash
########################################################################################
#                                   START, STOP or STATUS                              #
#                               ----------------------------                           #
#       This script is intended to help you start, stop or get the IP address of       #
#       the currently running EC2 instance.                                            #
#       This will require you to 1st configure your AWS CLI manually, to ensure safety #
#                                                                                      #
#       Please read the code to ensure that It does not cause any security issues      #
#                                                                                      #

## docker_installer.sh
#!/bin/bash


##################################################################################
#     ----------------------------------------------------------------
#     THIS SCRIPT WILL HELP YOU AUTOMATE THE DOCKER INSTALLATION STEPS
#     ----------------------------------------------------------------
# Tested on an AWS EC2 instance.
#
# AUTHOR:

## stack-processing.py
#Import All Functions
from pyspark.sql import SQLContext
from pyspark.sql import functions as F
from pyspark.sql import SparkSession
from pyspark.sql.functions import unix_timestamp, to_date, date_format, month, year, dayofyear, dayofweek, col
from pyspark.sql.types import TimestampType
from pyspark.sql import functions as F
from pyspark.sql import SparkSession
from pyspark.sql.functions import unix_timestamp, to_date, date_format, month, year, dayofyear, dayofweek, col
from pyspark.sql.types import TimestampType

## 3-ln_model.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              1 star
            
          
                carlleston
                / 3-ln_model.ipynb
            
            
              Last active
              August 23, 2020 12:09
            
              
                pre-processing and linear model in pyspark
              
          
        Loading

      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## 7.2 Splice MLflow Support.ipynb

      
              1 file
            
          
              1 fork
            
          
              1 comment
            
          
              1 star
            
          
                Ben-Epstein
                / 7.2 Splice MLflow Support.ipynb
            
            
              Created
              July 24, 2020 00:37
            
          
        Loading

      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## mlflow_gridsearch.py

def log_run(gridsearch: sklearn.GridSearchCV, experiment_name: str, model_name: str, run_index: int, conda_env, tags={}):
    """Logging of cross validation results to mlflow tracking server

    Args:
        experiment_name (str): experiment name
        model_name (str): Name of the model
        run_index (int): Index of the run (in Gridsearch)
        conda_env (str): A dictionary that describes the conda environment (MLFlow Format)
        tags (dict): Dictionary of extra data and tags (usually features)

## mlflow-model-evaluation.py
from sklearn.neighbors import KNeighborsRegressor
from sklearn.metrics import mean_squared_error, mean_absolute_error, r2_score, explained_variance_score

import mlflow
import mlflow.sklearn

import numpy as np

# Launch the experiment on mlflow
experiment_name = "electricityconsumption-forecast"

## 01-model-training.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              1 star
            
          
                ldrewniak
                / 01-model-training.ipynb
            
            
              Created
              November 5, 2019 14:01
            
          
        Loading

      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## test_MLflow_2.ipynb

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              1 star
            
          
                azarnyx
                / test_MLflow_2.ipynb
            
            
              Created
              June 30, 2019 12:07
            
          
        Loading

      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## sstreaming-spark-final.py
'''
spark/bin/spark-submit \
    --master local --driver-memory 4g \
    --num-executors 2 --executor-memory 4g \
    --packages org.apache.spark:spark-sql-kafka-0-10_2.11:2.4.0 \
    sstreaming-spark-final.py
'''
from pyspark.sql import SparkSession
from pyspark.sql.types import *
from pyspark.sql.functions import expr
	#!/bin/bash
	########################################################################################
	# START, STOP or STATUS #
	# ---------------------------- #
	# This script is intended to help you start, stop or get the IP address of #
	# the currently running EC2 instance. #
	# This will require you to 1st configure your AWS CLI manually, to ensure safety #
	# #
	# Please read the code to ensure that It does not cause any security issues #
	# #
	#!/bin/bash


	##################################################################################
	# ----------------------------------------------------------------
	# THIS SCRIPT WILL HELP YOU AUTOMATE THE DOCKER INSTALLATION STEPS
	# ----------------------------------------------------------------
	# Tested on an AWS EC2 instance.
	#
	# AUTHOR:
	#Import All Functions
	from pyspark.sql import SQLContext
	from pyspark.sql import functions as F
	from pyspark.sql import SparkSession
	from pyspark.sql.functions import unix_timestamp, to_date, date_format, month, year, dayofyear, dayofweek, col
	from pyspark.sql.types import TimestampType
	from pyspark.sql import functions as F
	from pyspark.sql import SparkSession
	from pyspark.sql.functions import unix_timestamp, to_date, date_format, month, year, dayofyear, dayofweek, col
	from pyspark.sql.types import TimestampType

	def log_run(gridsearch: sklearn.GridSearchCV, experiment_name: str, model_name: str, run_index: int, conda_env, tags={}):
	"""Logging of cross validation results to mlflow tracking server

	Args:
	experiment_name (str): experiment name
	model_name (str): Name of the model
	run_index (int): Index of the run (in Gridsearch)
	conda_env (str): A dictionary that describes the conda environment (MLFlow Format)
	tags (dict): Dictionary of extra data and tags (usually features)
	from sklearn.neighbors import KNeighborsRegressor
	from sklearn.metrics import mean_squared_error, mean_absolute_error, r2_score, explained_variance_score

	import mlflow
	import mlflow.sklearn

	import numpy as np

	# Launch the experiment on mlflow
	experiment_name = "electricityconsumption-forecast"
	'''
	spark/bin/spark-submit \
	--master local --driver-memory 4g \
	--num-executors 2 --executor-memory 4g \
	--packages org.apache.spark:spark-sql-kafka-0-10_2.11:2.4.0 \
	sstreaming-spark-final.py
	'''
	from pyspark.sql import SparkSession
	from pyspark.sql.types import *
	from pyspark.sql.functions import expr