sanjarcode · April 1, 2023 14:53 · sanjarcode · Mar 29, 2023 · sanjarcode · Apr 1, 2023
diff --git a/requirements.txt b/requirements.txt
 Pillow==9.3.0
 pyocr==0.8.3
diff --git a/WhatsApp-status-images-to-text.py b/WhatsApp-status-images-to-text.py
 # instructions: place images in same directory as this file. Run the file.

 from PIL import Image
 import pyocr
 import pyocr.builders
 import os

 # Print the list of png files
 def get_images_list():
    # Get the list of all files in the current directory
    all_files = os.listdir()

    # Filter the list to include only png files
    png_files = [file for file in all_files if file.endswith('.png')]

    return sorted(png_files)

 def crop_image(img, top = 0, right = 0, bottom = 0, left = 0):
    img = Image.open(img)
    width, height = img.size
    img = img.crop((left, top, width - right, height - bottom))
    return img

 def get_text_from_image(img, name = "\b"):
    # Use pyocr to extract text from the cropped image
    tools = pyocr.get_available_tools()
    tool = tools[0]

    # Set the OCR language
    lang = 'eng'

    # Use pyocr builders to configure the OCR
    builder = pyocr.builders.TextBuilder(tesseract_layout=6)

    # Extract text from the image
    result = tool.image_to_string(
        img,
        lang=lang,
        builder=builder
    )

    # Print the extracted text
    return result

 # Create a file to store the extracted text
 output_file = open('output.html', 'a')

 for image in get_images_list():
    cropped_image = crop_image(image, 250, 0, 350, 0) # whatsApp status top and bottom UI cropped
    scanned_text = get_text_from_image(cropped_image, image)

    # Print the extracted text
    to_print = f"<blockquote>{scanned_text.strip()}</blockquote>"
    print(to_print)

    # Append the extracted text to the output file
    output_file.write(f"{to_print.strip()}\n")

 output_file.close()

 # Print the contents of the output file
 with open('output.html', 'r') as file:
    print(f"\n\nOutput file contents:\n{file.read()}")
	# instructions: place images in same directory as this file. Run the file.

	from PIL import Image
	import pyocr
	import pyocr.builders
	import os

	# Print the list of png files
	def get_images_list():
	# Get the list of all files in the current directory
	all_files = os.listdir()

	# Filter the list to include only png files
	png_files = [file for file in all_files if file.endswith('.png')]

	return sorted(png_files)

	def crop_image(img, top = 0, right = 0, bottom = 0, left = 0):
	img = Image.open(img)
	width, height = img.size
	img = img.crop((left, top, width - right, height - bottom))
	return img

	def get_text_from_image(img, name = "\b"):
	# Use pyocr to extract text from the cropped image
	tools = pyocr.get_available_tools()
	tool = tools[0]

	# Set the OCR language
	lang = 'eng'

	# Use pyocr builders to configure the OCR
	builder = pyocr.builders.TextBuilder(tesseract_layout=6)

	# Extract text from the image
	result = tool.image_to_string(
	img,
	lang=lang,
	builder=builder
	)

	# Print the extracted text
	return result

	# Create a file to store the extracted text
	output_file = open('output.html', 'a')

	for image in get_images_list():
	cropped_image = crop_image(image, 250, 0, 350, 0) # whatsApp status top and bottom UI cropped
	scanned_text = get_text_from_image(cropped_image, image)

	# Print the extracted text
	to_print = f"<blockquote>{scanned_text.strip()}</blockquote>"
	print(to_print)

	# Append the extracted text to the output file
	output_file.write(f"{to_print.strip()}\n")

	output_file.close()

	# Print the contents of the output file
	with open('output.html', 'r') as file:
	print(f"\n\nOutput file contents:\n{file.read()}")
No results found