chiraagshah-qa · October 5, 2022 15:13
diff --git a/bulk_webpage_screenshots.py b/bulk_webpage_screenshots.py
 import os

 from selenium import webdriver
 from selenium.common.exceptions import WebDriverException
 from selenium.webdriver.chrome.options import Options
 from PIL import Image
 from tqdm import tqdm
 import time

 # Counter used to number the saved screenshot files, starting at 1.
 i = 1
 # Placeholder; replaced by the contents of the sites list once it is read.
 lines = []

 # Paths to fill in before running the script.
 sites_list = 'Location of Text File'
 screenshots_dir_path = 'Location where screenshots should be saved'

 # Each run writes into its own directory, suffixed with the start time.
 timestr = time.strftime("%Y%m%d-%H%M%S")
 screenshots_dir = '_'.join((screenshots_dir_path, timestr))
 os.makedirs(screenshots_dir)


 def s(x):
     """Return ``document.body.parentNode.scroll<x>`` as reported by the page.

     ``x`` is appended verbatim to the JavaScript property name (for
     example ``'Width'`` or ``'Height'``) and the resulting expression is
     evaluated in the browser through the module-level ``driver``.
     """
     script = 'return document.body.parentNode.scroll' + x
     return driver.execute_script(script)


 # Load the list of URLs, one per line. Surrounding whitespace is removed and
 # blank lines are skipped so that no empty URL is handed to the browser.
 with open(sites_list, "r") as f:
     lines = [url for url in map(str.strip, f) if url]

 # Configure and start a headless Chrome session.
 options = Options()
 # Pass the flag directly: the ``headless`` property setter was deprecated and
 # later removed from Selenium, where assigning it no longer has any effect.
 options.add_argument('--headless')
 options.add_argument('--log-level=3')
 # Placeholder: set this to the path of the Chrome executable to use.
 options.binary_location = "Location of chrome.exe"
 driver = webdriver.Chrome(options=options)
 # Print the user agent string the browser reports.
 user_agent = driver.execute_script("return navigator.userAgent;")
 print(user_agent)

 # Visit every URL, save a screenshot and convert it to JPEG. The browser is
 # always shut down afterwards, even if an unexpected error aborts the loop.
 try:
     for link in tqdm(lines, ncols=65):
         png_path = f'{screenshots_dir}/{i}.png'
         try:
             driver.get(link)
             # Fixed pause before capturing (presumably to let the page render).
             time.sleep(5)
             driver.set_window_size(2560, 1440)  # May need manual adjustment
             # get_screenshot_as_file reports an I/O failure by returning
             # False instead of raising, so check the result explicitly.
             if not driver.get_screenshot_as_file(png_path):
                 print("Error getting screenshot of " + link + ".")
                 continue
         except WebDriverException:
             print("Error getting screenshot of " + link + ".")
             continue

         #  Optional file conversion to save space.
         # The context manager closes the PNG before it is deleted.
         with Image.open(png_path) as img:
             img.convert('RGB').save(f'{screenshots_dir}/{i}.jpg')
         os.remove(png_path)
         # Only successful captures consume a file number.
         i = i + 1
 finally:
     driver.quit()
	import os

	from selenium import webdriver
	from selenium.common.exceptions import WebDriverException
	from selenium.webdriver.chrome.options import Options
	from PIL import Image
	from tqdm import tqdm
	import time

	# Counter used to number the saved screenshot files, starting at 1.
	i = 1
	# Placeholder; replaced by the contents of the sites list once it is read.
	lines = []

	# Paths to fill in before running the script.
	sites_list = 'Location of Text File'
	screenshots_dir_path = 'Location where screenshots should be saved'

	# Each run writes into its own directory, suffixed with the start time.
	timestr = time.strftime("%Y%m%d-%H%M%S")
	screenshots_dir = '_'.join((screenshots_dir_path, timestr))
	os.makedirs(screenshots_dir)


	def s(x):
	    """Return ``document.body.parentNode.scroll<x>`` as reported by the page.

	    ``x`` is appended verbatim to the JavaScript property name (for
	    example ``'Width'`` or ``'Height'``) and the resulting expression is
	    evaluated in the browser through the module-level ``driver``.
	    """
	    script = 'return document.body.parentNode.scroll' + x
	    return driver.execute_script(script)


	# Load the list of URLs, one per line. Surrounding whitespace is removed and
	# blank lines are skipped so that no empty URL is handed to the browser.
	with open(sites_list, "r") as f:
	    lines = [url for url in map(str.strip, f) if url]

	# Configure and start a headless Chrome session.
	options = Options()
	# Pass the flag directly: the ``headless`` property setter was deprecated and
	# later removed from Selenium, where assigning it no longer has any effect.
	options.add_argument('--headless')
	options.add_argument('--log-level=3')
	# Placeholder: set this to the path of the Chrome executable to use.
	options.binary_location = "Location of chrome.exe"
	driver = webdriver.Chrome(options=options)
	# Print the user agent string the browser reports.
	user_agent = driver.execute_script("return navigator.userAgent;")
	print(user_agent)

	# Visit every URL, save a screenshot and convert it to JPEG. The browser is
	# always shut down afterwards, even if an unexpected error aborts the loop.
	try:
	    for link in tqdm(lines, ncols=65):
	        png_path = f'{screenshots_dir}/{i}.png'
	        try:
	            driver.get(link)
	            # Fixed pause before capturing (presumably to let the page render).
	            time.sleep(5)
	            driver.set_window_size(2560, 1440)  # May need manual adjustment
	            # get_screenshot_as_file reports an I/O failure by returning
	            # False instead of raising, so check the result explicitly.
	            if not driver.get_screenshot_as_file(png_path):
	                print("Error getting screenshot of " + link + ".")
	                continue
	        except WebDriverException:
	            print("Error getting screenshot of " + link + ".")
	            continue

	        # Optional file conversion to save space.
	        # The context manager closes the PNG before it is deleted.
	        with Image.open(png_path) as img:
	            img.convert('RGB').save(f'{screenshots_dir}/{i}.jpg')
	        os.remove(png_path)
	        # Only successful captures consume a file number.
	        i = i + 1
	finally:
	    driver.quit()