srishtis · October 5, 2018 09:44
diff --git a/load_iris.py b/load_iris.py
 from sklearn import datasets
 import pandas as pd

 # Fetch the iris dataset. load_iris() returns a Bunch, so the measurements
 # are wrapped in a DataFrame with the feature columns named up front.
 iris = datasets.load_iris()
 iris_df = pd.DataFrame(
     iris.data,
     columns=['sepal_len', 'sepal_wid', 'petal_len', 'petal_wid'],
 )
 # The target labels become the fifth column.
 iris_df['class'] = iris.target

 # Discard rows in which every value is missing.
 iris_df = iris_df.dropna(how="all")

 # The first four columns are the independent (X) variables; feature
 # selection or correlation analysis should start from this frame.
 iris_X = iris_df.iloc[:, list(range(4))]
	from sklearn import datasets
	import pandas as pd

	# Pull the iris data from scikit-learn; the result is a Bunch, not a frame.
	iris = datasets.load_iris()

	# Wrap the raw measurements in a DataFrame and append the target labels
	# as the last column.
	iris_df = pd.DataFrame(iris.data)
	iris_df.insert(iris_df.shape[1], 'class', iris.target)

	# Give all five columns readable names.
	iris_df.columns = [
	    'sepal_len',
	    'sepal_wid',
	    'petal_len',
	    'petal_wid',
	    'class',
	]

	# Remove rows that are entirely empty.
	iris_df.dropna(how="all", inplace=True)

	# Keep only the four measurement columns: these are the independent (X)
	# variables on which feature selection / correlation analysis is done first.
	iris_X = iris_df[['sepal_len', 'sepal_wid', 'petal_len', 'petal_wid']]