josepablog · May 30, 2018 11:04
diff --git a/DictVectorizer_Pandas.py b/DictVectorizer_Pandas.py
 # Example: feed a pandas DataFrame to scikit-learn's DictVectorizer by
 # first converting the frame into a list of per-row dictionaries.
 from sklearn.feature_extraction import DictVectorizer
 import pandas as pd

 # Toy frame with a single string-valued column.
 df = pd.DataFrame({"user_name": ["a", "b", "c"]})
 fe_lm = DictVectorizer()
 # orient="records" produces one {column: value} dict per row, which is the
 # input format passed to fit_transform here.
 design_lm = fe_lm.fit_transform(df.to_dict(orient="records"))

 # Note: this approach is reportedly MUCH faster (about 60 times) than
 # transposing the frame and converting it into a dictionary, which is the
 # slower approach described at:
 # http://fastml.com/converting-categorical-data-into-numbers-with-pandas-and-scikit-learn/
	# Example: feed a pandas DataFrame to scikit-learn's DictVectorizer by
	# first converting the frame into a list of per-row dictionaries.
	from sklearn.feature_extraction import DictVectorizer
	import pandas as pd

	# Toy frame with a single string-valued column.
	df = pd.DataFrame({"user_name": ["a", "b", "c"]})
	fe_lm = DictVectorizer()
	# orient="records" produces one {column: value} dict per row, which is the
	# input format passed to fit_transform here.
	design_lm = fe_lm.fit_transform(df.to_dict(orient="records"))

	# Note: this approach is reportedly MUCH faster (about 60 times) than
	# transposing the frame and converting it into a dictionary, which is the
	# slower approach described at:
	# http://fastml.com/converting-categorical-data-into-numbers-with-pandas-and-scikit-learn/
No results found