ninetwentyfour/gist:202735664a5639e2f2fe3336e9161047

joshstaab · 2021-03-19T01:18:24Z

# Scrape the HR Dive "HR technology & analytics" topic feed and collect one
# [title, label] row per feed item, where `label` is True when the item
# carries a "sponsored" label and False otherwise.
hr_data = []

web = 'https://hrdive.com/topic/hr-technology-analytics/?page=%s'
for page in range(1, 25):
    url = web % page
    data = html.fromstring(requests.get(url).text)

    # XPath attribute names are case-sensitive and the HTML parser exposes
    # them in lowercase, so the predicate must use @class (not @Class).
    for i in data.xpath("//li[@class='row feed__item']"):
        # List of text nodes inside the item's headline link.
        title = i.xpath("div/h3/a/text()")
        # xpath() returns a list, never None: an empty list means the item
        # has no sponsored label, so test truthiness instead of `is not None`.
        label = bool(i.xpath("div/span[@class='label--sponsored']"))

        hr_data.append([title, label])

len(hr_data)

ninetwentyfour · 2021-03-19T01:19:04Z

# Scrape the HR Dive topic feed and collect one [title, label_text] row per
# feed item. `label_text` is "" when the item has no label; otherwise it is
# the list of matching label elements, with a "loud" label taking precedence
# over a "sponsored" one (it is assigned last).
hr_data = []

web = 'https://hrdive.com/topic/hr-technology-analytics/?page=%s'
for page in range(1, 25):
    data = html.fromstring(requests.get(web % page).text)

    for i in data.xpath("//li[@class='row feed__item']"):
        title = i.xpath("div/h3/a/text()")
        label_text = ""

        # xpath() returns a (possibly empty) list, never None, so an
        # `is not None` check would always pass; test truthiness instead.
        sponsored_elements = i.xpath("div/span[@class='label--sponsored']")
        if sponsored_elements:
            label_text = sponsored_elements

        loud_elements = i.xpath("div/span[@class='label--loud']")
        if loud_elements:
            label_text = loud_elements

        hr_data.append([title, label_text])

len(hr_data)

ninetwentyfour · 2021-03-19T01:32:24Z

# Debugging aid for the sponsored-label lookup: for every page of the HR Dive
# topic feed, print the result of the sponsored-label query for each feed
# item, then print the list of items that actually carry a sponsored label.
hr_data = []

web = 'https://hrdive.com/topic/hr-technology-analytics/?page=%s'
for page in range(1, 25):
    data = html.fromstring(requests.get(web % page).text)
    feed_items = data.xpath("//li[@class='row feed__item']")

    for item in feed_items:
        # Prints an empty list for items without a sponsored label.
        print(item.xpath("div/span[@class='label--sponsored']"))

    sponsoredItems = []
    for item in feed_items:
        sponsored = item.xpath("div/span[@class='label--sponsored']")
        # xpath() returns a list, never None; only a non-empty result means
        # the item is sponsored.
        if sponsored:
            # list.append() mutates in place and returns None, so its result
            # must not be assigned back to the list.
            sponsoredItems.append(item)

    print(sponsoredItems)

ninetwentyfour/gist:202735664a5639e2f2fe3336e9161047

joshstaab commented Mar 19, 2021

ninetwentyfour commented Mar 19, 2021

ninetwentyfour commented Mar 19, 2021