sachinsdate

## poisson_regression.py
import pandas as pd
from patsy import dmatrices
import numpy as np
import statsmodels.api as sm
import matplotlib.pyplot as plt


#Create a pandas DataFrame for the counts data set.
df = pd.read_csv('nyc_bb_bicyclist_counts.csv', header=0, infer_datetime_format=True, parse_dates=[0], index_col=[0])

## poisson_counts_generator.py
import random
import math

_lambda = 5
_num_total_arrivals = 150
_num_arrivals = 0
_arrival_time = 0
_num_arrivals_in_unit_time = []
_time_tick = 1

## negative_binomial_regression.py
import pandas as pd
from patsy import dmatrices
import numpy as np
import statsmodels.api as sm
import statsmodels.formula.api as smf
import matplotlib.pyplot as plt

#create a pandas DataFrame for the counts data set
df = pd.read_csv('nyc_bb_bicyclist_counts.csv', header=0, infer_datetime_format=True, parse_dates=[0], index_col=[0])

## f_test.py
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

#Create a pandas DataFrame for the djia data set.
df = pd.read_csv('djia.csv', header=0, infer_datetime_format=True, parse_dates=[0], index_col=[0])

################################
######## THE MEAN MODEL ########
################################

## djia.csv

          
            Date
            Closing Price

            
              7/24/2019
              27269.9707

            
              7/25/2019
              27140.98047

            
              7/26/2019
              27192.44922

            
              7/29/2019
              27221.34961

            
              7/30/2019
              27198.01953

            
              7/31/2019
              26864.26953

            
              8/1/2019
              26583.41992

            
              8/2/2019
              26485.00977

            
              8/5/2019
              25717.74023

## poisson_sim2.py
import random
import math
import statistics
import matplotlib.pyplot as plt


_lambda = 5
_num_events = 100
_event_num = []
_inter_event_times = []

## aic.py
import pandas as pd
from patsy import dmatrices
from collections import OrderedDict
import itertools
import statsmodels.formula.api as smf
import sys
import matplotlib.pyplot as plt

#Read the data set into a pandas DataFrame
df = pd.read_csv('boston_daily_temps_1978_2019.csv', header=0, infer_datetime_format=True, parse_dates=[0], index_col=[0])

## boston_daily_temps_1978_2019.csv

          
            DATE
            TAVG

            
              1/1/1978
              26.5

            
              1/2/1978
              24

            
              1/3/1978
              25.5

            
              1/4/1978
              23

            
              1/5/1978
              35.5

            
              1/6/1978
              39.5

            
              1/7/1978
              30.5

            
              1/8/1978
              39

            
              1/9/1978
              38.5

## wages_and_salaries_1984_2019_us_bls_CXU900000LB1203M.csv

          
            Year
            Wages

            
              1984
              25088

            
              1985
              26611

            
              1986
              27005

            
              1987
              29103

            
              1988
              30168

            
              1989
              31922

            
              1990
              33183

            
              1991
              35576

            
              1992
              35679

## olsr_for_counts_based_data.py
import pandas as pd
from matplotlib import pyplot as plt

#load the data into a pandas data frame and plot the BB_COUNT variable
df = pd.read_csv('nyc_bb_bicyclist_counts.csv', header=0, infer_datetime_format=True, parse_dates=[0], index_col=[0])
fig = plt.figure()
fig.suptitle('Bicyclist counts on the Brooklyn bridge')
plt.xlabel('Date')
plt.ylabel('Count')
actual, = plt.plot(df.index, df['BB_COUNT'], 'go-', label='Count of bicyclists')
	import pandas as pd
	from patsy import dmatrices
	import numpy as np
	import statsmodels.api as sm
	import matplotlib.pyplot as plt


	#Create a pandas DataFrame for the counts data set.
	df = pd.read_csv('nyc_bb_bicyclist_counts.csv', header=0, infer_datetime_format=True, parse_dates=[0], index_col=[0])
	import random
	import math

	_lambda = 5
	_num_total_arrivals = 150
	_num_arrivals = 0
	_arrival_time = 0
	_num_arrivals_in_unit_time = []
	_time_tick = 1
	Date	Closing Price
	7/24/2019	27269.9707
	7/25/2019	27140.98047
	7/26/2019	27192.44922
	7/29/2019	27221.34961
	7/30/2019	27198.01953
	7/31/2019	26864.26953
	8/1/2019	26583.41992
	8/2/2019	26485.00977
	8/5/2019	25717.74023
	import random
	import math
	import statistics
	import matplotlib.pyplot as plt


	_lambda = 5
	_num_events = 100
	_event_num = []
	_inter_event_times = []
	import pandas as pd
	from patsy import dmatrices
	from collections import OrderedDict
	import itertools
	import statsmodels.formula.api as smf
	import sys
	import matplotlib.pyplot as plt

	#Read the data set into a pandas DataFrame
	df = pd.read_csv('boston_daily_temps_1978_2019.csv', header=0, infer_datetime_format=True, parse_dates=[0], index_col=[0])
	DATE	TAVG
	1/1/1978	26.5
	1/2/1978	24
	1/3/1978	25.5
	1/4/1978	23
	1/5/1978	35.5
	1/6/1978	39.5
	1/7/1978	30.5
	1/8/1978	39
	1/9/1978	38.5
	Year	Wages
	1984	25088
	1985	26611
	1986	27005
	1987	29103
	1988	30168
	1989	31922
	1990	33183
	1991	35576
	1992	35679
	import pandas as pd
	from matplotlib import pyplot as plt

	#load the data into a pandas data frame and plot the BB_COUNT variable
	df = pd.read_csv('nyc_bb_bicyclist_counts.csv', header=0, infer_datetime_format=True, parse_dates=[0], index_col=[0])
	fig = plt.figure()
	fig.suptitle('Bicyclist counts on the Brooklyn bridge')
	plt.xlabel('Date')
	plt.ylabel('Count')
	actual, = plt.plot(df.index, df['BB_COUNT'], 'go-', label='Count of bicyclists')