dannguyen · July 29, 2025 14:26 · rahpalrah · Jul 2, 2018 · ngadhvi · Feb 13, 2019
diff --git a/README.md b/README.md
diff --git a/cloudvisreq.py b/cloudvisreq.py
 from base64 import b64encode
 from os import makedirs
 from os.path import join, basename
 from sys import argv
 import json
 import requests

 ENDPOINT_URL = 'https://vision.googleapis.com/v1/images:annotate'
 RESULTS_DIR = 'jsons'
 makedirs(RESULTS_DIR, exist_ok=True)

 def make_image_data_list(image_filenames):
    """
    image_filenames is a list of filename strings
    Returns a list of dicts formatted as the Vision API
        needs them to be
    """
    img_requests = []
    for imgname in image_filenames:
        with open(imgname, 'rb') as f:
            ctxt = b64encode(f.read()).decode()
            img_requests.append({
                    'image': {'content': ctxt},
                    'features': [{
                        'type': 'TEXT_DETECTION',
                        'maxResults': 1
                    }]
            })
    return img_requests

 def make_image_data(image_filenames):
    """Returns the image data lists as bytes"""
    imgdict = make_image_data_list(image_filenames)
    return json.dumps({"requests": imgdict }).encode()


 def request_ocr(api_key, image_filenames):
    response = requests.post(ENDPOINT_URL,
                             data=make_image_data(image_filenames),
                             params={'key': api_key},
                             headers={'Content-Type': 'application/json'})
    return response


 if __name__ == '__main__':
    api_key, *image_filenames = argv[1:]
    if not api_key or not image_filenames:
        print("""
            Please supply an api key, then one or more image filenames

            $ python cloudvisreq.py api_key image1.jpg image2.png""")
    else:
        response = request_ocr(api_key, image_filenames)
        if response.status_code != 200 or response.json().get('error'):
            print(response.text)
        else:
            for idx, resp in enumerate(response.json()['responses']):
                # save to JSON file
                imgname = image_filenames[idx]
                jpath = join(RESULTS_DIR, basename(imgname) + '.json')
                with open(jpath, 'w') as f:
                    datatxt = json.dumps(resp, indent=2)
                    print("Wrote", len(datatxt), "bytes to", jpath)
                    f.write(datatxt)

                # print the plaintext to screen for convenience
                print("---------------------------------------------")
                t = resp['textAnnotations'][0]
                print("    Bounding Polygon:")
                print(t['boundingPoly'])
                print("    Text:")
                print(t['description'])
	from base64 import b64encode
	from os import makedirs
	from os.path import join, basename
	from sys import argv
	import json
	import requests

	ENDPOINT_URL = 'https://vision.googleapis.com/v1/images:annotate'
	RESULTS_DIR = 'jsons'
	makedirs(RESULTS_DIR, exist_ok=True)

	def make_image_data_list(image_filenames):
	"""
	image_filenames is a list of filename strings
	Returns a list of dicts formatted as the Vision API
	needs them to be
	"""
	img_requests = []
	for imgname in image_filenames:
	with open(imgname, 'rb') as f:
	ctxt = b64encode(f.read()).decode()
	img_requests.append({
	'image': {'content': ctxt},
	'features': [{
	'type': 'TEXT_DETECTION',
	'maxResults': 1
	}]
	})
	return img_requests

	def make_image_data(image_filenames):
	"""Returns the image data lists as bytes"""
	imgdict = make_image_data_list(image_filenames)
	return json.dumps({"requests": imgdict }).encode()


	def request_ocr(api_key, image_filenames):
	response = requests.post(ENDPOINT_URL,
	data=make_image_data(image_filenames),
	params={'key': api_key},
	headers={'Content-Type': 'application/json'})
	return response


	if __name__ == '__main__':
	api_key, *image_filenames = argv[1:]
	if not api_key or not image_filenames:
	print("""
	Please supply an api key, then one or more image filenames

	$ python cloudvisreq.py api_key image1.jpg image2.png""")
	else:
	response = request_ocr(api_key, image_filenames)
	if response.status_code != 200 or response.json().get('error'):
	print(response.text)
	else:
	for idx, resp in enumerate(response.json()['responses']):
	# save to JSON file
	imgname = image_filenames[idx]
	jpath = join(RESULTS_DIR, basename(imgname) + '.json')
	with open(jpath, 'w') as f:
	datatxt = json.dumps(resp, indent=2)
	print("Wrote", len(datatxt), "bytes to", jpath)
	f.write(datatxt)

	# print the plaintext to screen for convenience
	print("---------------------------------------------")
	t = resp['textAnnotations'][0]
	print(" Bounding Polygon:")
	print(t['boundingPoly'])
	print(" Text:")
	print(t['description'])
No results found