suhithr · October 30, 2016 19:04
diff --git a/9gag-scraper.py b/9gag-scraper.py
 # Code used for the Delta Workshop on Python and Linux 2016 at NIT, Trichy

 import urllib
 from time import sleep

 import requests # http://docs.python-requests.org/en/master/
 from bs4 import BeautifulSoup # https://www.crummy.com/software/BeautifulSoup/bs4/doc/

 # Try printing out the variables at various stages to view the objects
 # Better yet execute this in your Python interpreter to see all the action happening
 # and print each variable

 # Fetch the 9gag front page. The timeout keeps the script from hanging
 # forever if the server never answers, and raise_for_status() stops us from
 # quietly parsing an HTTP error page (4xx/5xx) as if it were the feed.
 url = "http://9gag.com"
 r = requests.get(url, timeout=10)
 r.raise_for_status()

 # Build a searchable tree from the returned HTML using the 'html.parser' backend
 soup = BeautifulSoup(r.text, 'html.parser')

 # Keep only the <img> tags that carry the 'badge-item-img' class
 img_tags = soup.select('img.badge-item-img')
 # This is a CSS selector: The format is tag.class#id
 # soup.find_all('img')
 # We are not using the find_all() method because it returns every image on the page.
 # Not all of those images are what we want: some are badges or icons, and we only want the images that are part of the feed.

 # We will only download the first ten images
 n = 10

 # urlretrieve lives in urllib on Python 2 and in urllib.request on Python 3
 try:
     from urllib.request import urlretrieve
 except ImportError:
     from urllib import urlretrieve

 for img in img_tags:
     if n <= 0:
         break  # Quota reached; no point in walking the remaining tags

     # Tag.get() returns None for a missing attribute, whereas img['src']
     # would raise KeyError and abort the whole run
     src = img.get('src')
     if not src:
         continue

     # The alt text doubles as the local file name. Fall back to the last
     # part of the URL when it is missing, and replace path separators so a
     # title containing '/' cannot point outside the current directory
     filename = img.get('alt') or src.rsplit('/', 1)[-1]
     filename = filename.replace('/', '_').replace('\\', '_')

     sleep(1)  # Adding a delay so we don't flood 9gag's servers
     urlretrieve(src, filename)
     print("Downloaded {}".format(filename))
     n -= 1
	# Code used for the Delta Workshop on Python and Linux 2016 at NIT, Trichy

	import urllib
	from time import sleep

	import requests # http://docs.python-requests.org/en/master/
	from bs4 import BeautifulSoup # https://www.crummy.com/software/BeautifulSoup/bs4/doc/

	# Try printing out the variables at various stages to view the objects
	# Better yet execute this in your Python interpreter to see all the action happening
	# and print each variable

	# Fetch the 9gag front page. The timeout keeps the script from hanging
	# forever if the server never answers, and raise_for_status() stops us from
	# quietly parsing an HTTP error page (4xx/5xx) as if it were the feed.
	url = "http://9gag.com"
	r = requests.get(url, timeout=10)
	r.raise_for_status()

	# Build a searchable tree from the returned HTML using the 'html.parser' backend
	soup = BeautifulSoup(r.text, 'html.parser')

	# Keep only the <img> tags that carry the 'badge-item-img' class
	img_tags = soup.select('img.badge-item-img')
	# This is a CSS selector: The format is tag.class#id
	# soup.find_all('img')
	# We are not using the find_all() method because it returns every image on the page.
	# Not all of those images are what we want: some are badges or icons, and we only want the images that are part of the feed.

	# We will only download the first ten images
	n = 10

	# urlretrieve lives in urllib on Python 2 and in urllib.request on Python 3
	try:
		from urllib.request import urlretrieve
	except ImportError:
		from urllib import urlretrieve

	for img in img_tags:
		if n <= 0:
			break  # Quota reached; no point in walking the remaining tags

		# Tag.get() returns None for a missing attribute, whereas img['src']
		# would raise KeyError and abort the whole run
		src = img.get('src')
		if not src:
			continue

		# The alt text doubles as the local file name. Fall back to the last
		# part of the URL when it is missing, and replace path separators so a
		# title containing '/' cannot point outside the current directory
		filename = img.get('alt') or src.rsplit('/', 1)[-1]
		filename = filename.replace('/', '_').replace('\\', '_')

		sleep(1)  # Adding a delay so we don't flood 9gag's servers
		urlretrieve(src, filename)
		print("Downloaded {}".format(filename))
		n -= 1