t0mst0ne · August 28, 2018 08:20
diff --git a/gistfile1.txt b/gistfile1.txt
 import requests
 from bs4 import BeautifulSoup

 # The URL carries an explicit oldid, presumably to pin one revision of the
 # page -- TODO confirm against the MediaWiki URL parameters.
 url = 'https://en.wikipedia.org/w/index.php' + \
       '?title=List_of_Game_of_Thrones_episodes&oldid=802553687'

 # Bound the wait with a timeout and fail loudly on an HTTP error status
 # instead of parsing an error page that contains no episode tables.
 r = requests.get(url, timeout=30)
 r.raise_for_status()
 html_contents = r.text
 html_soup = BeautifulSoup(html_contents, 'html.parser')

 # We'll use a list to store our episode list: one dict per table row,
 # mapping header text to cell text
 episodes = []

 ep_tables = html_soup.find_all('table', class_="wikiepisodetable")

 for table in ep_tables:
    # Look the rows up once and reuse them for the header and the data rows
    rows = table.find_all('tr')
    if not rows:
        # A table without rows has no header row to take field names from
        continue
    # The header cells of the first row determine the field names
    headers = [header.text for header in rows[0].find_all('th')]
    # Then go through all the rows except the first one
    for row in rows[1:]:
        # Get the column cells; th is searched too because the first cell
        # of a row can be inside a th-tag
        values = [col.text for col in row.find_all(['th', 'td'])]
        if values:
            # zip pairs cells with headers by position and stops at the
            # shorter of the two, so a row with more cells than headers
            # does not raise IndexError
            episodes.append(dict(zip(headers, values)))

 # Show the results
 for episode in episodes:
    print(episode)
	import requests
	from bs4 import BeautifulSoup

	# The URL carries an explicit oldid, presumably to pin one revision of the
	# page -- TODO confirm against the MediaWiki URL parameters.
	url = 'https://en.wikipedia.org/w/index.php' + \
	      '?title=List_of_Game_of_Thrones_episodes&oldid=802553687'

	# Bound the wait with a timeout and fail loudly on an HTTP error status
	# instead of parsing an error page that contains no episode tables.
	r = requests.get(url, timeout=30)
	r.raise_for_status()
	html_contents = r.text
	html_soup = BeautifulSoup(html_contents, 'html.parser')

	# We'll use a list to store our episode list: one dict per table row,
	# mapping header text to cell text
	episodes = []

	ep_tables = html_soup.find_all('table', class_="wikiepisodetable")

	for table in ep_tables:
	    # Look the rows up once and reuse them for the header and the data rows
	    rows = table.find_all('tr')
	    if not rows:
	        # A table without rows has no header row to take field names from
	        continue
	    # The header cells of the first row determine the field names
	    headers = [header.text for header in rows[0].find_all('th')]
	    # Then go through all the rows except the first one
	    for row in rows[1:]:
	        # Get the column cells; th is searched too because the first cell
	        # of a row can be inside a th-tag
	        values = [col.text for col in row.find_all(['th', 'td'])]
	        if values:
	            # zip pairs cells with headers by position and stops at the
	            # shorter of the two, so a row with more cells than headers
	            # does not raise IndexError
	            episodes.append(dict(zip(headers, values)))

	# Show the results
	for episode in episodes:
	    print(episode)