# srishtis/load_iris.py

## load_iris.py
from sklearn import datasets
import pandas as pd

# Load the iris dataset. scikit-learn returns a Bunch (dict-like object);
# its .data attribute holds the measurements and .target the class codes.
iris = datasets.load_iris()

# Names for the four measurement columns, in the order they appear in iris.data.
feature_columns = ['sepal_len', 'sepal_wid', 'petal_len', 'petal_wid']

# Since the Bunch is not a dataframe, build one. The column names are set at
# construction time rather than renamed afterwards, and the target is then
# appended as the 'class' column.
iris_df = pd.DataFrame(iris.data, columns=feature_columns)
iris_df['class'] = iris.target

# Remove any empty lines, i.e. rows in which every value is missing.
iris_df.dropna(how="all", inplace=True)

# Select only the four measurement columns as the independent (X) variables.
# Any kind of feature selection or correlation analysis should be done on
# these first.
iris_X = iris_df[feature_columns]