Miriam Seoane Santos miriamspsantos

## adult_profiling_report.py
# Make the necessary imports
import pandas as pd
from ydata_profiling import ProfileReport

# Read the CSV, treating '?' entries as missing values
df = pd.read_csv(
    'data/adult.csv',
    na_values='?',
)

# Build the profiling report object for the loaded DataFrame
profile = ProfileReport(
    df,
    title="Adult Census Profile",
)

## adult_categories.py
# Columns whose distinct values are listed below
cat_cols = [
    'workclass',
    'education',
    'education.num',
    'marital.status',
    'occupation',
    'relationship',
    'race',
    'sex',
    'native.country',
    'income',
]

# For each listed column, print the number of rows found under each value
for col in cat_cols:
    categories = df.groupby(by=col).size()
    print(categories)

#workclass
#Federal-gov           960

## adult_dataset_overview.py
import pandas as pd

# Read the CSV, treating '?' entries as missing values
df = pd.read_csv(
    'data/adult.csv',
    na_values='?',
)

# Dataset Overview
# Preview the first rows (5 is the pandas default for head())
df.head(n=5)

# (rows, columns) tuple: number of observations and features
df.shape
# (32561, 15)
	# Make the necessary imports
	import pandas as pd
	from ydata_profiling import ProfileReport

	# Read the CSV, treating '?' entries as missing values
	df = pd.read_csv(
	    'data/adult.csv',
	    na_values='?',
	)

	# Build the profiling report object for the loaded DataFrame
	profile = ProfileReport(
	    df,
	    title="Adult Census Profile",
	)
	# Columns whose distinct values are listed below
	cat_cols = ['workclass', 'education', 'education.num',
	            'marital.status', 'occupation', 'relationship', 'race',
	            'sex', 'native.country', 'income']

	# For each listed column, print the number of rows found under each value.
	# Both statements belong to the loop body, so they are indented under `for`.
	for col in cat_cols:
	    categories = df.groupby(col).size()
	    print(categories)

	#workclass
	#Federal-gov 960