Jingfei Cai-Pincus Ailuropoda1864

## auto_git_pull_to_gmail.py
import subprocess
import os
import time
import smtplib
from email.message import EmailMessage


# Put the path to your GA directory here, e.g. '/home/fay/code/GA/DSI'.
# The value is an empty string until you fill it in.
# NOTE(review): presumably the working directory for the git commands this
# script runs -- confirm against the code that reads CWD.
CWD = ''

## append_to_csv.py
import csv


def append_to_csv(csvfile, entry):
    """
    Append a single row to a csv file.

    :param csvfile: the path to a .csv file
    :param entry: a list representing one row of the .csv file
    :return: None
    """
    # NOTE(review): no statements follow the docstring here, so as written the
    # function writes nothing -- confirm the implementation was not lost.

## corr_heatmap.py
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
from functools import partial


def corr_heatmap(dataframe, cmap=sns.diverging_palette(220, 10, as_cmap=True),
                 **kwargs):
    """

## scatter_plot_with_linear_fit.py
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import scipy.stats as stats


def scatter_plot_with_linear_fit(x, y, slope=None, y_intercept=None):
    """
    :param x: an array
    :param y: an array

## auto_git_pull.py
import subprocess
import os
import time


# Put the path to your GA directory here, e.g. '/home/fay/code/GA/DSI'.
# The value is an empty string until you fill it in.
# NOTE(review): presumably the working directory for the git commands this
# script runs -- confirm against the code that reads CWD.
CWD = ''

# put the path to a .gitignore template here
# e.g. '/home/fay/code/GA/DSI/projects/West-Nile-Virus-Prediction/.gitignore'

## eda.py
import numpy as np
import pandas as pd
from pandas.core.dtypes.common import (
    is_numeric_dtype, is_datetime64_dtype, is_bool_dtype
)
from pandas.core.indexes.datetimes import DatetimeIndex


def eda(dataframe, head=True, info=True, describe=True, duplicated=True,
        dup_kwd={}):

## category_counts.py
import pandas as pd
from pandas.core.dtypes.common import (
    is_numeric_dtype, is_datetime64_dtype, is_bool_dtype
)


def category_counts(dataframe, max_nunique=20, numeric=False, datetime=False):
    """
    prints value counts for each (categorical) column
    :param dataframe: a pandas DataFrame

## find_duplicated.py
import pandas as pd

def find_duplicated(dataframe, show=True, sort=False):
    """
    Print information on the duplicate rows of a dataframe.

    :param dataframe: a pandas DataFrame
    :param show: boolean; if True, the duplicated rows (if any) are shown
    :param sort: boolean; if True, the duplicated rows are sorted by each
                 column of the dataframe
    """
    # NOTE(review): no statements follow the docstring here, so as written the
    # function prints nothing -- confirm the implementation was not lost.

## show_null.py
import pandas as pd

def show_null(dataframe):
    """
    Report on null values in a dataframe.

    Nulls are counted per column and those counts are summed over all
    columns; when the grand total is zero, 'No null in the dataframe.' is
    printed.

    :param dataframe: a pandas DataFrame
    :return: None
    """
    # NOTE(review): a per-column number/percentage report is not part of the
    # code visible here; only the no-null case produces output.
    nulls_per_column = dataframe.isnull().sum()
    total_nulls = nulls_per_column.sum()
    if total_nulls == 0:
        print('No null in the dataframe.')

## describe_by_type.py
import numpy as np
import pandas as pd
from pandas.core.dtypes.common import (
    is_numeric_dtype, is_datetime64_dtype, is_bool_dtype
)
from pandas.core.indexes.datetimes import DatetimeIndex


def describe_by_type(dataframe):
    """
	import subprocess
	import os
	import time
	import smtplib
	from email.message import EmailMessage


	# put your GA directory here, e.g. '/home/fay/code/GA/DSI'
	CWD = ''
	import csv


	def append_to_csv(csvfile, entry):
	"""
	append a row to a csv file
	:param csvfile: the path to a .csv file
	:param entry: a list representing a row in the .csv file
	:return: None
	"""
	import numpy as np
	import pandas as pd
	import matplotlib.pyplot as plt
	import seaborn as sns
	from functools import partial


	def corr_heatmap(dataframe, cmap=sns.diverging_palette(220, 10, as_cmap=True),
	**kwargs):
	"""
	import numpy as np
	import pandas as pd
	from pandas.core.dtypes.common import (
	is_numeric_dtype, is_datetime64_dtype, is_bool_dtype
	)
	from pandas.core.indexes.datetimes import DatetimeIndex


	def eda(dataframe, head=True, info=True, describe=True, duplicated=True,
	dup_kwd={}):
	import pandas as pd

	def find_duplicated(dataframe, show=True, sort=False):
	"""
	prints out information on duplicate rows
	:param dataframe: a pandas DataFrame
	:param show: boolean; if True, the duplicated rows (if any) are shown
	:param sort: boolean; if True, the duplicated rows are sorted by each column
	of the dataframe
	"""
	import pandas as pd

	def show_null(dataframe):
	"""
	prints the number and percentage of null values in each column
	:param dataframe: a pandas DataFrame
	:return: None
	"""
	if dataframe.isnull().sum().sum() == 0:
	print('No null in the dataframe.')