cbscribe · October 25, 2018 01:08 · magikalcookie · Oct 25, 2018
diff --git a/bs4_example.py b/bs4_example.py
 import requests, bs4
 import time

 # for n in range(0, 5937):
 #     url = 'https://www.fiercebiotech.com/biotech?page=0%2C' + str(n)
 #     data = requests.get(url)

 # pause between requests so the crawl does not overload the server
 #     time.sleep(10)

 # Example: download a single page (google.com) and list every link on it.
 url = "http://google.com/"
 # Without an explicit timeout, requests waits indefinitely on a server that
 # never answers, so cap how long the fetch may take.
 REQUEST_TIMEOUT_SECONDS = 10
 # "data" is the HTTP response; data.text holds the raw html from the website.
 data = requests.get(url, timeout=REQUEST_TIMEOUT_SECONDS)
 # Raise requests.HTTPError on a 4xx/5xx reply instead of parsing an error page.
 data.raise_for_status()
 # "soupdata" contains the parsed html.
 soupdata = bs4.BeautifulSoup(data.text, features="html.parser")
 # Pull all <a> tags into a list.
 links = soupdata.select('a')
 for link in links:
     # Print each link's href (None when the attribute is missing) and its text.
     # get_text() is used instead of .string because .string is None whenever
     # the tag has more than one child (e.g. an <a> wrapping an image plus text).
     print(link.get('href'), "\t", link.get_text())
     print("-"*20)
	import requests, bs4
	import time

	# for n in range(0, 5937):
	#     url = 'https://www.fiercebiotech.com/biotech?page=0%2C' + str(n)
	#     data = requests.get(url)

	# pause between requests so the crawl does not overload the server
	#     time.sleep(10)

	# Example: download a single page (google.com) and list every link on it.
	url = "http://google.com/"
	# Without an explicit timeout, requests waits indefinitely on a server that
	# never answers, so cap how long the fetch may take.
	REQUEST_TIMEOUT_SECONDS = 10
	# "data" is the HTTP response; data.text holds the raw html from the website.
	data = requests.get(url, timeout=REQUEST_TIMEOUT_SECONDS)
	# Raise requests.HTTPError on a 4xx/5xx reply instead of parsing an error page.
	data.raise_for_status()
	# "soupdata" contains the parsed html.
	soupdata = bs4.BeautifulSoup(data.text, features="html.parser")
	# Pull all <a> tags into a list.
	links = soupdata.select('a')
	for link in links:
	    # The loop body must be indented under the "for"; without that the
	    # script does not parse at all.
	    # Print each link's href (None when the attribute is missing) and its text.
	    # get_text() is used instead of .string because .string is None whenever
	    # the tag has more than one child (e.g. an <a> wrapping an image plus text).
	    print(link.get('href'), "\t", link.get_text())
	    print("-"*20)