ashok0587

View GitHub Profile

Recently created

Least recently created

Recently updated

Least recently updated

saihttam / one_hot.py

Created October 24, 2015 16:05

	import pandas as pd
	from sklearn.feature_extraction import DictVectorizer

	def one_hot_dataframe(data, cols, replace=False):
	""" Takes a dataframe and a list of columns that need to be encoded.
	Returns a 3-tuple comprising the data, the vectorized data,
	and the fitted vectorizer."""
	vec = DictVectorizer(sparse=False)
	vecData = pd.DataFrame(vec.fit_transform(data[cols].T.to_dict().values()))
	vecData.columns = vec.get_feature_names()

kljensen / onehot_pandas_scikit.py

Last active May 18, 2020 23:17 — forked from anonymous/onehot_pandas_scikit.py

	# -*- coding: utf-8 -*-
	""" Small script that shows how to do one hot encoding
	of categorical columns in a pandas DataFrame.

	See:
	http://scikit-learn.org/dev/modules/generated/sklearn.preprocessing.OneHotEncoder.html#sklearn.preprocessing.OneHotEncoder
	http://scikit-learn.org/dev/modules/generated/sklearn.feature_extraction.DictVectorizer.html
	"""
	import pandas
	import random