Skip to content

Instantly share code, notes, and snippets.

View jorgezanguettin's full-sized avatar

Jorge Luis Zanguettin jorgezanguettin

View GitHub Profile
@jorgezanguettin
jorgezanguettin / instagram_followers.py
Created May 20, 2021 21:23 — forked from tomkdickinson/instagram_followers.py
Followers Extraction Instagram
import json
import requests
import logging as log
log.basicConfig(level=log.DEBUG)
class FollowerExtractor:
    """
    Extracts followers for a given profile
    """
    # NOTE(review): only the header and docstring are visible in this listing
    # preview; any methods of the class are not shown here.
import requests
import os
from bs4 import BeautifulSoup
def requisitar_site(siteUrl):
    """Download a page and hand its raw body to ``analisar_requisicao``.

    Args:
        siteUrl: URL passed unchanged to ``requests.get``.

    Returns:
        None. The response body (``.content``) is forwarded to
        ``analisar_requisicao`` and nothing is returned to the caller.
    """
    # NOTE(review): no timeout or HTTP status check is applied here, so the
    # call can block indefinitely and error pages are parsed like any other.
    conteudoSite = requests.get(siteUrl).content
    analisar_requisicao(conteudoSite)
def analisar_requisicao(conteudoRequisicao):
    """Parse the downloaded markup with BeautifulSoup's ``html.parser``.

    Args:
        conteudoRequisicao: Markup handed to the ``BeautifulSoup`` constructor.
    """
    # NOTE(review): the visible snippet stops after building the soup object;
    # it is bound to a local name only and nothing is returned.
    objBs4 = BeautifulSoup(conteudoRequisicao, "html.parser")
@jorgezanguettin
jorgezanguettin / analisar_requisicao_partial_4.py
Last active April 14, 2021 21:32
analisar_requisicao_partial_4
def analisar_requisicao(conteudoRequisicao):
    """Parse the page markup and look up the product elements by CSS class.

    Args:
        conteudoRequisicao: Markup handed to the ``BeautifulSoup`` constructor.

    The lookups below collect, in order: ``div.product-box-brand`` elements,
    ``p.product-box-title`` elements inside ``div.catalog-content``, anchors
    carrying the product-link class string, and ``span.product-box-price-from``
    elements.
    """
    # NOTE(review): the four result lists are only bound to local names here;
    # the function returns None as written.
    objBs4 = BeautifulSoup(conteudoRequisicao, "html.parser")

    marcas = objBs4.find_all('div', {'class': 'product-box-brand'})
    nomes = objBs4.select('div.catalog-content p.product-box-title')
    links = objBs4.find_all('a', {
        'class': 'product-box-link is-lazyloaded image product-image-rotate'
    })
    precos = objBs4.find_all('span', {'class': 'product-box-price-from'})
def armazenar_dados(dadosObtidos):
    """Append text to ``roupas.csv`` in the current working directory.

    Args:
        dadosObtidos: String written verbatim; no delimiter or newline is
            added by this function.

    The file is opened in ``a+`` mode with UTF-8 encoding, so it is created
    when missing and existing content is preserved.
    """
    # The context manager closes the handle even if write() raises, which the
    # manual open()/close() pair did not guarantee.
    with open('roupas.csv', 'a+', encoding='utf-8') as arquivo:
        arquivo.write(dadosObtidos)
@jorgezanguettin
jorgezanguettin / analisar_requisicao_partial_3.py
Created April 14, 2021 20:57
analisar_requisicao_partial_3
def analisar_requisicao(conteudoRequisicao):
    """Parse the page markup and look up the product elements by CSS class.

    Args:
        conteudoRequisicao: Markup handed to the ``BeautifulSoup`` constructor.

    The lookups below collect, in order: ``div.product-box-brand`` elements,
    ``p.product-box-title`` elements inside ``div.catalog-content``, anchors
    carrying the product-link class string, and ``span.product-box-price-from``
    elements.
    """
    # NOTE(review): the four result lists are only bound to local names here;
    # the function returns None as written.
    objBs4 = BeautifulSoup(conteudoRequisicao, "html.parser")

    marcas = objBs4.find_all('div', {'class': 'product-box-brand'})
    nomes = objBs4.select('div.catalog-content p.product-box-title')
    links = objBs4.find_all('a', {
        'class': 'product-box-link is-lazyloaded image product-image-rotate'
    })
    precos = objBs4.find_all('span', {'class': 'product-box-price-from'})
def tratamento_dados(dadoObtido, tipoString):
    """Convert a scraped value to a trimmed string, cleaned by field type.

    Args:
        dadoObtido: Any value; it is converted with ``str()`` first.
        tipoString: Field type selector. ``'Preco'`` selects price cleaning;
            every other value selects the generic cleaning.

    Returns:
        For ``'Preco'``: the text with every ``R$`` removed, then stripped.
        Otherwise: the text with every ``;`` replaced by ``,``, then stripped.
    """
    texto = str(dadoObtido)

    if tipoString == 'Preco':
        return texto.replace('R$', '').strip()

    # presumably ';' is swapped out because it is the CSV field separator
    # used when the data is stored; confirm against the writer.
    return texto.replace(';', ',').strip()
@jorgezanguettin
jorgezanguettin / analisar_requisicao_partial_2.py
Last active April 14, 2021 20:12
analisar_requisicao_partial_2.py
def analisar_requisicao(conteudoRequisicao):
    """Parse the page markup and look up the product elements by CSS class.

    Args:
        conteudoRequisicao: Markup handed to the ``BeautifulSoup`` constructor.

    The lookups below collect, in order: ``div.product-box-brand`` elements,
    ``p.product-box-title`` elements inside ``div.catalog-content``, anchors
    carrying the product-link class string, and ``span.product-box-price-from``
    elements.
    """
    # NOTE(review): the four result lists are only bound to local names here;
    # the function returns None as written.
    objBs4 = BeautifulSoup(conteudoRequisicao, "html.parser")

    marcas = objBs4.find_all('div', {'class': 'product-box-brand'})
    nomes = objBs4.select('div.catalog-content p.product-box-title')
    links = objBs4.find_all('a', {
        'class': 'product-box-link is-lazyloaded image product-image-rotate'
    })
    precos = objBs4.find_all('span', {'class': 'product-box-price-from'})
@jorgezanguettin
jorgezanguettin / analisar_requisicao_partial_1.py
Last active April 14, 2021 19:44
analisar_requisicao_partial_1
def analisar_requisicao(conteudoRequisicao):
    """Parse the page markup and look up the product elements by CSS class.

    Args:
        conteudoRequisicao: Markup handed to the ``BeautifulSoup`` constructor.

    The lookups below collect, in order: ``div.product-box-brand`` elements,
    ``p.product-box-title`` elements inside ``div.catalog-content``, anchors
    carrying the product-link class string, and ``span.product-box-price-from``
    elements.
    """
    # The soup is bound to the same name the lookups read from; the snippet
    # assigned ``objetoBs4`` but queried ``objBs4``, which raised NameError.
    objBs4 = BeautifulSoup(conteudoRequisicao, 'html.parser')

    # NOTE(review): the result lists are only bound to local names here; the
    # function returns None as written.
    marcas = objBs4.find_all('div', {'class': 'product-box-brand'})
    nomes = objBs4.select('div.catalog-content p.product-box-title')
    links = objBs4.find_all('a', {
        'class': 'product-box-link is-lazyloaded image product-image-rotate'
    })
    precos = objBs4.find_all('span', {'class': 'product-box-price-from'})
@jorgezanguettin
jorgezanguettin / analisar_requisicao.py
Last active April 14, 2021 19:41
analisar_requisicao
def analisar_requisicao(conteudoRequisicao):
    """Parse the page markup and look up the ``div.product-box-brand`` elements.

    Args:
        conteudoRequisicao: Markup handed to the ``BeautifulSoup`` constructor.
    """
    # The soup is bound to the same name the lookup reads from; the snippet
    # assigned ``objetoBs4`` but queried ``objBs4``, which raised NameError.
    objBs4 = BeautifulSoup(conteudoRequisicao, 'html.parser')

    # NOTE(review): the result is only bound to a local name here; the
    # function returns None as written.
    marcas = objBs4.find_all('div', {'class': 'product-box-brand'})
@jorgezanguettin
jorgezanguettin / requisitar_site.py
Last active April 14, 2021 03:10
requisitar_site
def requisitar_site(siteUrl):
    """Download a page and hand its raw body to ``analisar_requisicao``.

    Args:
        siteUrl: URL passed unchanged to ``requests.get``.

    Returns:
        None. The response body (``.content``) is forwarded to
        ``analisar_requisicao`` and nothing is returned to the caller.
    """
    # NOTE(review): no timeout or HTTP status check is applied here, so the
    # call can block indefinitely and error pages are parsed like any other.
    conteudoSite = requests.get(siteUrl).content
    analisar_requisicao(conteudoSite)