dalequark · January 29, 2019 17:45
diff --git a/bucket_polite_data.py b/bucket_polite_data.py
 # Scores at or below the 25th percentile of Normalized Score are considered rude.
 # Scores at or above the 75th percentile are considered polite.
 # Scores strictly in between are considered neutral.

 # Get the 25th and 75th percentiles of Normalized Scores.
 # Series.quantile computes only the cut-off we ask for on the one column we
 # need, instead of building the full describe() summary table twice.
 rude_thresh = data['Normalized Score'].quantile(0.25)
 polite_thresh = data['Normalized Score'].quantile(0.75)

 # Labels ordered from the lowest-scoring bucket to the highest;
 # score_to_label picks one of these by position.
 label_list = ["rude", "neutral", "polite"]
 def score_to_label(score):
    """Map a single Normalized Score value to its string label.

    Relies on the module-level ``rude_thresh``, ``polite_thresh`` and
    ``label_list``:

    * ``score <= rude_thresh``                  -> ``label_list[0]``
    * otherwise, if ``score < polite_thresh``   -> ``label_list[1]``
    * anything else                             -> ``label_list[2]``

    NOTE(review): a NaN score fails both comparisons and therefore also
    receives ``label_list[2]`` -- confirm this is intended for missing scores.
    """
    if score <= rude_thresh:
        bucket = 0
    elif score < polite_thresh:
        bucket = 1
    else:
        bucket = 2
    return label_list[bucket]

 # Add (or overwrite) a 'label' column on the 'data' DataFrame: each value of
 # 'Normalized Score' is passed through score_to_label to get its string label.
 data['label'] = data['Normalized Score'].map(score_to_label)
	# Scores at or below the 25th percentile of Normalized Score are considered rude.
	# Scores at or above the 75th percentile are considered polite.
	# Scores strictly in between are considered neutral.

	# Get the 25th and 75th percentiles of Normalized Scores.
	# Series.quantile computes only the cut-off we ask for on the one column we
	# need, instead of building the full describe() summary table twice.
	rude_thresh = data['Normalized Score'].quantile(0.25)
	polite_thresh = data['Normalized Score'].quantile(0.75)

	# Labels ordered from the lowest-scoring bucket to the highest;
	# score_to_label picks one of these by position.
	label_list = ["rude", "neutral", "polite"]
	def score_to_label(score):
		"""Map a single Normalized Score value to its string label.

		Relies on the module-level ``rude_thresh``, ``polite_thresh`` and
		``label_list``:

		* ``score <= rude_thresh``                  -> ``label_list[0]``
		* otherwise, if ``score < polite_thresh``   -> ``label_list[1]``
		* anything else                             -> ``label_list[2]``

		NOTE(review): a NaN score fails both comparisons and therefore also
		receives ``label_list[2]`` -- confirm this is intended for missing scores.
		"""
		# The body must be nested under the def (and each return under its if);
		# the flattened paste left the function without a body.
		if score <= rude_thresh:
			return label_list[0]
		if score < polite_thresh:
			return label_list[1]
		return label_list[2]

	# Add (or overwrite) a 'label' column on the 'data' DataFrame: each value of
	# 'Normalized Score' is passed through score_to_label to get its string label.
	data['label'] = data['Normalized Score'].map(score_to_label)