Skip to content

Instantly share code, notes, and snippets.

View ishritam's full-sized avatar
🎯
Focusing

Shritam Kumar Mund ishritam

🎯
Focusing
View GitHub Profile
(venv) (base) C:\Users\Shritam\Desktop\Scrapy\venv\iscrapy>scrapy crawl TheSpider -o book_data.csv
# Walk every product card found inside each 'ol.row' list of the response and
# copy its fields into `data`.
# NOTE(review): `response`, `data` and `dic` are defined outside this snippet;
# `dic` presumably maps a rating word to its value - confirm against its definition.
for listing in response.css('ol.row'):
    for pod in listing.css('article.product_pod'):
        # All 'title' attributes of the card's links (kept as a list).
        data['Title'] = pod.css('a::attr(title)').getall()

        # First whitespace-separated token of the first price text node.
        price_texts = pod.css('div.product_price p.price_color::text').getall()
        data['Price'] = price_texts[0].split()[0]

        # The second text node of the availability paragraph is the one used.
        stock_texts = pod.css('div.product_price p.instock.availability::text').getall()
        data['Stock'] = stock_texts[1].strip()

        # Last token of the first <p> class attribute, then translated via `dic`:
        # the first entry whose key occurs in that token supplies the value.
        class_attrs = pod.css('p::attr(class)').getall()
        data['Star'] = class_attrs[0].split()[-1]
        data['Star'] = [value for key, value in dic.items() if key in data['Star']][0]
# Number of catalogue pages to crawl, read from stdin when this module is loaded.
# int() raises ValueError if the answer is not a whole number.
inp = int(input("Enter the no. of pages you want to scrap: "))


class ThescrapySpider(scrapy.Spider):
    """Spider whose start URLs are the first ``inp`` catalogue pages."""

    name = 'Thescrapy'
    # Pages are numbered from 1. range() excludes its stop value, so the stop
    # must be inp + 1 for exactly `inp` pages to be requested (the previous
    # range(1, inp) silently dropped the last page, and crawled nothing for 1).
    start_urls = ['http://books.toscrape.com/catalogue/page-{}.html'.format(n) for n in range(1, inp + 1)]
(venv) (base) C:\Users\Shritam\Desktop\Scrapy\venv\iscrapy>scrapy genspider TheSpider books.toscrape.com
# -*- coding: utf-8 -*-
import scrapy
class ThespiderSpider(scrapy.Spider):
name = 'TheSpider'
allowed_domains = ['books.toscrape.com']
start_urls = ['http://books.toscrape.com/']
def parse(self, response):
(venv) (base) C:\Users\Shritam\Desktop\Scrapy\venv\iscrapy>scrapy genspider iscrapy books.toscrape.com
(venv) (base) C:\Users\Shritam\Desktop\Scrapy\venv>scrapy startproject iscrapy
(venv) (base) C:\Users\Shritam\Desktop\Scrapy\venv>pip install scrapy
(base) C:\Users\Shritam\Desktop\Scrapy\venv>Scripts\activate.bat