zafe · November 21, 2018 07:58
diff --git a/ocr2voice.py b/ocr2voice.py
 #by PradiptaSaha999

 import tesseract
 import cv2
 import cv2.cv as cv
 import numpy as np
 import pyttsx
 # Text-to-speech engine (pyttsx); used at the end of the script to read the
 # recognised text aloud.  The 'rate' property is set to 100.
 engine = pyttsx.init()
 engine.setProperty('rate', 100)

 # Parameters passed to both cv2.Sobel calls below.
 scale = 1
 delta = 0
 ddepth = cv2.CV_16S   # 16-bit signed output depth; converted back to uint8 later

 # cv2.imread signals a missing or unreadable file by returning None rather
 # than raising, so check explicitly and fail with a clear message instead of
 # an obscure error from imshow or from the slicing below.
 gray=cv2.imread("Untitled.png")
 if gray is None:
     raise IOError("Could not read input image 'Untitled.png'")
 cv2.namedWindow("Main")
 cv2.imshow("Main", gray)
 ### trim the edges
 cut_offset=23
 # Trimming removes cut_offset pixels from each of the four sides; an image
 # that is not larger than 2*cut_offset in both dimensions would be left empty.
 if min(gray.shape[:2]) <= 2 * cut_offset:
     raise ValueError("Input image is too small to trim %d pixels from each edge" % cut_offset)
 gray=gray[cut_offset:-cut_offset,cut_offset:-cut_offset]

 ### convert to gray color
 gray = cv2.cvtColor(gray,cv2.COLOR_BGR2GRAY)

 ### edge enhancing by Sobeling
 # Gradient-X (first derivative along x, 3x3 kernel)
 grad_x = cv2.Sobel(gray,ddepth,1,0,ksize = 3, scale = scale, delta = delta,borderType = cv2.BORDER_DEFAULT)
 #grad_x = cv2.Scharr(gray,ddepth,1,0)

 # Gradient-Y (first derivative along y, 3x3 kernel)
 grad_y = cv2.Sobel(gray,ddepth,0,1,ksize = 3, scale = scale, delta = delta, borderType = cv2.BORDER_DEFAULT)
 #grad_y = cv2.Scharr(gray,ddepth,0,1)

 abs_grad_x = cv2.convertScaleAbs(grad_x)   # converting back to uint8
 abs_grad_y = cv2.convertScaleAbs(grad_y)
 # Blend the two absolute gradients with weight 0.4 each; from here on
 # 'gray' holds the edge map rather than the original intensities.
 gray = cv2.addWeighted(abs_grad_x,0.4,abs_grad_y,0.4,0)

 ### Smooth the edge map, then reduce it to pure black / white
 image1 = cv2.medianBlur(gray, 5)
 # Pixels with an edge response below 50 are pushed to white.
 weak_response = image1 < 50
 image1[weak_response] = 255
 image1 = cv2.GaussianBlur(image1, (31, 13), 0)
 color_offset = 220
 # Everything at or above color_offset becomes white, the rest black.
 at_or_above = image1 >= color_offset
 image1[at_or_above] = 255
 image1[~at_or_above] = 0

 #### Surround the result with a white frame of 'offset' pixels per side
 offset = 30
 height, width = image1.shape
 image1 = cv2.copyMakeBorder(
     image1,
     offset, offset, offset, offset,
     cv2.BORDER_CONSTANT,
     value=(255, 255, 255))
 # Preview the preprocessed image and keep a copy on disk.
 cv2.namedWindow("Test")
 cv2.imshow("Test", image1)
 cv2.imwrite("an91cut_decoded.jpg", image1)

 ### tesseract OCR
 # Run Tesseract on the preprocessed image, print and speak the recognised
 # text, then wait for a key press.  The try/finally guarantees that the
 # Tesseract API is released and the preview windows are closed even when
 # one of the OCR or speech steps raises.
 api = tesseract.TessBaseAPI()
 try:
     # First argument is "." -- presumably the tessdata location is resolved
     # relative to the current directory; confirm for your installation.
     api.Init(".","eng",tesseract.OEM_DEFAULT)
     api.SetPageSegMode(tesseract.PSM_AUTO)
     #as suggested by zdenko podobny <[email protected]>,
     #using PSM_SINGLE_BLOCK will be more reliable for ocr-ing a line of word.
     #api.SetPageSegMode(tesseract.PSM_SINGLE_BLOCK)
     height1,width1 = image1.shape
     channel1=1
     # Wrap the numpy buffer in a legacy cv image header for SetCvImage;
     # the last SetData argument is the number of bytes per image row.
     image = cv.CreateImageHeader((width1,height1), cv.IPL_DEPTH_8U, channel1)
     cv.SetData(image, image1.tostring(),image1.dtype.itemsize * channel1 * (width1))
     tesseract.SetCvImage(image,api)
     text=api.GetUTF8Text()
     conf=api.MeanTextConf()
     image=None
     # Single-argument print(...) behaves the same on Python 2 and also
     # parses on Python 3.
     print("...............")
     print("Ocred Text: %s"%text)
     engine.say(text)
     engine.runAndWait()
     print("Confidence Level: %d %%"%conf)
     cv2.waitKey(0)
 finally:
     api.End()
     cv2.destroyWindow("Test")
     cv2.destroyWindow("Main")
	#by PradiptaSaha999

	import tesseract
	import cv2
	import cv2.cv as cv
	import numpy as np
	import pyttsx
	# Text-to-speech engine (pyttsx); used at the end of the script to read the
	# recognised text aloud.  The 'rate' property is set to 100.
	engine = pyttsx.init()
	engine.setProperty('rate', 100)

	# Parameters passed to both cv2.Sobel calls below.
	scale = 1
	delta = 0
	ddepth = cv2.CV_16S # 16-bit signed output depth; converted back to uint8 later

	# cv2.imread signals a missing or unreadable file by returning None rather
	# than raising, so check explicitly and fail with a clear message instead of
	# an obscure error from imshow or from the slicing below.
	gray=cv2.imread("Untitled.png")
	if gray is None:
		raise IOError("Could not read input image 'Untitled.png'")
	cv2.namedWindow("Main")
	cv2.imshow("Main", gray)
	### trim the edges
	cut_offset=23
	# Trimming removes cut_offset pixels from each of the four sides; an image
	# that is not larger than 2*cut_offset in both dimensions would be left empty.
	if min(gray.shape[:2]) <= 2 * cut_offset:
		raise ValueError("Input image is too small to trim %d pixels from each edge" % cut_offset)
	gray=gray[cut_offset:-cut_offset,cut_offset:-cut_offset]

	### convert to gray color
	gray = cv2.cvtColor(gray,cv2.COLOR_BGR2GRAY)

	### edge enhancing by Sobeling
	# Gradient-X (first derivative along x, 3x3 kernel)
	grad_x = cv2.Sobel(gray,ddepth,1,0,ksize = 3, scale = scale, delta = delta,borderType = cv2.BORDER_DEFAULT)
	#grad_x = cv2.Scharr(gray,ddepth,1,0)

	# Gradient-Y (first derivative along y, 3x3 kernel)
	grad_y = cv2.Sobel(gray,ddepth,0,1,ksize = 3, scale = scale, delta = delta, borderType = cv2.BORDER_DEFAULT)
	#grad_y = cv2.Scharr(gray,ddepth,0,1)

	abs_grad_x = cv2.convertScaleAbs(grad_x) # converting back to uint8
	abs_grad_y = cv2.convertScaleAbs(grad_y)
	# Blend the two absolute gradients with weight 0.4 each; from here on
	# 'gray' holds the edge map rather than the original intensities.
	gray = cv2.addWeighted(abs_grad_x,0.4,abs_grad_y,0.4,0)

	### Smooth the edge map, then reduce it to pure black / white
	image1 = cv2.medianBlur(gray, 5)
	# Pixels with an edge response below 50 are pushed to white.
	weak_response = image1 < 50
	image1[weak_response] = 255
	image1 = cv2.GaussianBlur(image1, (31, 13), 0)
	color_offset = 220
	# Everything at or above color_offset becomes white, the rest black.
	at_or_above = image1 >= color_offset
	image1[at_or_above] = 255
	image1[~at_or_above] = 0

	#### Surround the result with a white frame of 'offset' pixels per side
	offset = 30
	height, width = image1.shape
	image1 = cv2.copyMakeBorder(
		image1,
		offset, offset, offset, offset,
		cv2.BORDER_CONSTANT,
		value=(255, 255, 255))
	# Preview the preprocessed image and keep a copy on disk.
	cv2.namedWindow("Test")
	cv2.imshow("Test", image1)
	cv2.imwrite("an91cut_decoded.jpg", image1)

	### tesseract OCR
	# Run Tesseract on the preprocessed image, print and speak the recognised
	# text, then wait for a key press.  The try/finally guarantees that the
	# Tesseract API is released and the preview windows are closed even when
	# one of the OCR or speech steps raises.
	api = tesseract.TessBaseAPI()
	try:
		# First argument is "." -- presumably the tessdata location is resolved
		# relative to the current directory; confirm for your installation.
		api.Init(".","eng",tesseract.OEM_DEFAULT)
		api.SetPageSegMode(tesseract.PSM_AUTO)
		#as suggested by zdenko podobny <[email protected]>,
		#using PSM_SINGLE_BLOCK will be more reliable for ocr-ing a line of word.
		#api.SetPageSegMode(tesseract.PSM_SINGLE_BLOCK)
		height1,width1 = image1.shape
		channel1=1
		# Wrap the numpy buffer in a legacy cv image header for SetCvImage;
		# the last SetData argument is the number of bytes per image row.
		image = cv.CreateImageHeader((width1,height1), cv.IPL_DEPTH_8U, channel1)
		cv.SetData(image, image1.tostring(),image1.dtype.itemsize * channel1 * (width1))
		tesseract.SetCvImage(image,api)
		text=api.GetUTF8Text()
		conf=api.MeanTextConf()
		image=None
		# Single-argument print(...) behaves the same on Python 2 and also
		# parses on Python 3.
		print("...............")
		print("Ocred Text: %s"%text)
		engine.say(text)
		engine.runAndWait()
		print("Confidence Level: %d %%"%conf)
		cv2.waitKey(0)
	finally:
		api.End()
		cv2.destroyWindow("Test")
		cv2.destroyWindow("Main")