Vanessa Liang vanessaaleung

Professional StackOverflow Researcher

vanessaaleung / structure.py

Created September 28, 2019 06:26

vanessaaleung / scrape.py

Created September 28, 2019 06:25

	# Download the HealthySF ZIP-code map page and load one of its HTML tables
	# into a DataFrame named `df`.
	from io import StringIO  # local import: read_html is fed a file-like object

	# A timeout keeps the script from hanging forever on an unresponsive server,
	# and raise_for_status() stops here on an HTTP error instead of silently
	# parsing an error page.
	response = requests.get(
	    "http://www.healthysf.org/bdi/outcomes/zipmap.htm", timeout=30
	)
	response.raise_for_status()
	soup = BeautifulSoup(response.text, "lxml")
	table = soup.find_all("table")
	# read_html returns a list of DataFrames. Wrapping the markup in StringIO
	# avoids passing literal HTML as a plain string, which newer pandas releases
	# deprecate. The input is still str(table), so the positional index below
	# refers to the same parsed list as before.
	tables = pd.read_html(StringIO(str(table)))
	# Each list element is already a DataFrame, so no extra wrapping is needed.
	df = tables[4]

vanessaaleung / library.py

Created September 28, 2019 06:22

	import requests # library to handle requests
	from bs4 import BeautifulSoup
	import pandas as pd

vanessaaleung / removesingle.py

Created September 21, 2019 08:10

# Keep only the entries whose length is greater than one, in their original order.
names = list(filter(lambda entry: len(entry) > 1, names))

vanessaaleung / customizewc.py

Created September 21, 2019 07:27

	import random

	def grey_color_func(word, font_size, position, orientation, random_state=None,
	                    **kwargs):
	    """Return a grey HSL color string with a random lightness of 60-100%.

	    The positional parameters and ``**kwargs`` are accepted so the function
	    can be passed as a ``color_func`` callback; they are not used here.

	    Args:
	        word: Unused.
	        font_size: Unused.
	        position: Unused.
	        orientation: Unused.
	        random_state: Optional random source. When it exposes ``randint``
	            (for example a ``random.Random`` instance) the lightness is
	            drawn from it, so a seeded source gives repeatable colors.
	            Any other value falls back to the module-level ``random``.
	        **kwargs: Ignored.

	    Returns:
	        A string of the form ``"hsl(0, 0%, N%)"`` with ``60 <= N <= 100``.
	    """
	    # Prefer the caller's random source so seeded runs are reproducible.
	    rng = random_state if hasattr(random_state, "randint") else random
	    return "hsl(0, 0%%, %d%%)" % rng.randint(60, 100)


	# Open a 15x8 figure, then draw the word cloud recolored through
	# grey_color_func, with the axes hidden.
	plt.figure(figsize=(15, 8))
	grey_cloud = wordcloud.recolor(color_func=grey_color_func, random_state=3)
	plt.imshow(grey_cloud, interpolation="bilinear")
	plt.axis("off")

vanessaaleung / plot.py

Created September 21, 2019 07:22

	# Join all names into one space-separated string to feed the word cloud.
	unique_string = " ".join(names)

	# Configure a 1000x500 cloud first, then generate it from the joined text.
	wordcloud = WordCloud(width=1000, height=500)
	wordcloud = wordcloud.generate(unique_string)

	# Show the cloud in a 15x8 figure without axes.
	plt.figure(figsize=(15, 8))
	plt.imshow(wordcloud, interpolation="bilinear")
	plt.axis("off")
	plt.show()

vanessaaleung / wordcloud.py

Created September 21, 2019 07:21

	# Setup for the word-cloud snippets: install the package, then import the
	# plotting and word-cloud names used later.
	# NOTE(review): the next line is not Python syntax; presumably this was a
	# notebook cell relying on IPython handling `pip` — confirm. In a plain .py
	# file the package has to be installed from the shell instead.
	pip install wordcloud
	import numpy as np
	from os import path
	from PIL import Image
	from wordcloud import WordCloud, STOPWORDS, ImageColorGenerator

	import matplotlib.pyplot as plt
	# NOTE(review): IPython magic, notebook-only; presumably makes figures render
	# inline in the notebook — confirm it is accepted with the space after `%`.
	% matplotlib inline

vanessaaleung / freq.py

Last active September 21, 2019 07:39

	from nltk.probability import FreqDist

	# Count the occurrences of each name, then keep the 20 most common
	# entries in `fdist`.
	_name_counts = FreqDist(names)
	fdist = _name_counts.most_common(20)

vanessaaleung / removestopwords.py

Last active September 21, 2019 08:09

# Drop every entry that is a member of `a` (presumably the stop-word set
# built elsewhere — confirm), keeping the original order.
names = list(filter(lambda entry: entry not in a, names))

vanessaaleung / stopwords.py

Last active September 21, 2019 07:37

	import nltk
	from nltk import word_tokenize
	from nltk.corpus import stopwords

	# Fetch the stop-word corpus, then collect the English stop words into
	# the set `a`.
	nltk.download("stopwords")
	english_stopwords = stopwords.words("english")
	a = set(english_stopwords)