JeyKJey · September 2, 2019 09:36 · fALKENdk · Apr 13, 2018 · hmarkopcuoglu · Jul 13, 2018
diff --git a/beautiful_soup.py b/beautiful_soup.py
 from bs4 import BeautifulSoup
 import requests
 # Address of the page to scrape (presumably a placeholder; substitute a real URL).
 page_link = 'https://www.website_to_crawl.com'
 # Fetch the page; the 5-second timeout keeps the script from waiting
 # indefinitely on an unresponsive server.
 page_response = requests.get(page_link, timeout=5)
 # requests.get() does not raise for 4xx/5xx replies on its own; fail here
 # instead of silently parsing an error page and finding no prices.
 page_response.raise_for_status()
 # Parse the raw response bytes with Python's built-in HTML parser.
 page_content = BeautifulSoup(page_response.content, "html.parser")

 # Collect every element, whatever its tag, whose CSS class is "main_price".
 prices = page_content.find_all(class_='main_price')
 # The result is a list of tags, for example:
 # [<div class="main_price">Price: $66.68</div>,
 #  <div class="main_price">Price: $56.68</div>]

 # Alternative query: additionally restrict the match to <div> tags.
 # Note that this rebinds `prices`, replacing the result of the query above.
 prices = page_content.find_all('div', attrs={'class': 'main_price'})
	from bs4 import BeautifulSoup
	import requests
	# Address of the page to scrape (presumably a placeholder; substitute a real URL).
	page_link = 'https://www.website_to_crawl.com'
	# Fetch the page; the 5-second timeout keeps the script from waiting
	# indefinitely on an unresponsive server.
	page_response = requests.get(page_link, timeout=5)
	# requests.get() does not raise for 4xx/5xx replies on its own; fail here
	# instead of silently parsing an error page and finding no prices.
	page_response.raise_for_status()
	# Parse the raw response bytes with Python's built-in HTML parser.
	page_content = BeautifulSoup(page_response.content, "html.parser")

	# Collect every element, whatever its tag, whose CSS class is "main_price".
	prices = page_content.find_all(class_='main_price')
	# The result is a list of tags, for example:
	# [<div class="main_price">Price: $66.68</div>,
	#  <div class="main_price">Price: $56.68</div>]

	# Alternative query: additionally restrict the match to <div> tags.
	# Note that this rebinds `prices`, replacing the result of the query above.
	prices = page_content.find_all('div', attrs={'class': 'main_price'})