yeiichi · January 22, 2025 08:18
diff --git a/pdf_scraper.py b/pdf_scraper.py
 #!/usr/bin/env python3
 from io import BytesIO

 import requests
 from pdfminer.high_level import extract_text


 def extract_str_fm_pdf_url(url_pdf, timeout=30):
    """Download a PDF from a URL and extract its text.

    Args:
        url_pdf (str): URL of the target PDF file.
        timeout (float or tuple): Value forwarded to ``requests.get`` as
            its ``timeout`` argument. Defaults to 30 seconds. Pass
            ``None`` to wait without limit, as the function did before
            this parameter existed.

    Returns:
        The value returned by ``extract_text`` on success. If text
        extraction raises, the caught exception object itself is returned
        (not raised), so callers that need to tell success from failure
        should check the type of the result.

    Raises:
        Anything raised by ``requests.get`` (connection errors, timeouts)
        propagates unchanged; only the extraction step is guarded.

    Note:
        The HTTP status code is not checked, so the body of an error
        response is handed to ``extract_text`` like any other body.
    """
    # Without a timeout, requests waits indefinitely on a server that
    # accepts the connection but never answers.
    response = requests.get(url_pdf, timeout=timeout)
    pdf_stream = BytesIO(response.content)
    try:
        return extract_text(pdf_stream)
    except Exception as err_msg:
        # Kept for backward compatibility: extraction failures are
        # returned to the caller rather than raised.
        return err_msg


 if __name__ == '__main__':
    # Ask for the PDF location interactively, then print whatever the
    # extractor hands back (the text, or the exception object it returned).
    target_url = input('Target PDF URL? >> ')
    print(extract_str_fm_pdf_url(target_url))
	#!/usr/bin/env python3
	from io import BytesIO

	import requests
	from pdfminer.high_level import extract_text


	def extract_str_fm_pdf_url(url_pdf, timeout=30):
	    """Fetch the PDF at ``url_pdf`` and return the text found in it.

	    Args:
	        url_pdf (str): URL of the target PDF file.
	        timeout (float or tuple): Forwarded to ``requests.get`` as its
	            ``timeout`` argument. Defaults to 30 seconds; ``None``
	            disables the limit.

	    Returns:
	        The result of ``extract_text`` for the downloaded bytes. When
	        extraction raises, the exception object is returned instead of
	        being raised.

	    Raises:
	        Errors raised by ``requests.get`` itself (including timeouts)
	        are not caught here and propagate to the caller.
	    """
	    # A request without a timeout can block forever on a silent server.
	    response = requests.get(url_pdf, timeout=timeout)
	    pdf_stream = BytesIO(response.content)
	    try:
	        return extract_text(pdf_stream)
	    except Exception as err_msg:
	        # Returned, not raised, so existing callers keep working.
	        return err_msg


	if __name__ == '__main__':
	    # Script entry point: prompt for a URL and print the extraction result.
	    print(extract_str_fm_pdf_url(input('Target PDF URL? >> ')))