TimSC · June 19, 2013 00:12
diff --git a/fast_hog.pyx b/fast_hog.pyx
 # cython: profile=True
 # cython: cdivision=True
 # cython: boundscheck=False
 # cython: wraparound=False

 import cmath, math
 cimport numpy as np
 import numpy as np
 '''
 Based on _hog.py from https://github.com/scikit-image/scikit-image

 Copyright (C) 2011, the scikit-image team
 (C) 2013 Tim Sheerman-Chase
 All rights reserved.

 Redistribution and use in source and binary forms, with or without
 modification, are permitted provided that the following conditions are
 met:

 1. Redistributions of source code must retain the above copyright
 	notice, this list of conditions and the following disclaimer.
 2. Redistributions in binary form must reproduce the above copyright
 	notice, this list of conditions and the following disclaimer in
 	the documentation and/or other materials provided with the
 	distribution.
 3. Neither the name of skimage nor the names of its contributors may be
 	used to endorse or promote products derived from this software without
 	specific prior written permission.

 THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
 IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
 INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
 SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
 STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
 IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 POSSIBILITY OF SUCH DAMAGE.
 '''

 import numpy as np
 from scipy import sqrt, pi, arctan2, cos, sin

 cdef float CellHog(np.ndarray[np.float64_t, ndim=2] magnitude, 
 	np.ndarray[np.float64_t, ndim=2] orientation,
 	float ori1, float ori2,
 	int cx, int cy, int xi, int yi, int sx, int sy):
 	cdef int cx1, cy1

 	cdef float total = 0.
 	for cy1 in range(-cy/2, cy/2):
 		for cx1 in range(-cx/2, cx/2):
 			if yi + cy1 < 0: continue
 			if yi + cy1 >= sy: continue
 			if xi + cx1 < 0: continue
 			if xi + cx1 >= sx: continue
 			if orientation[yi + cy1, xi + cx1] >= ori1: continue
 			if orientation[yi + cy1, xi + cx1] < ori2: continue

 			total += magnitude[yi + cy1, xi + cx1]

 	return total

 cdef HogThirdStage(np.ndarray[np.float64_t, ndim=2] gx, \
 	np.ndarray[np.float64_t, ndim=2] gy, 
 	int cx, int cy, #Pixels per cell
 	int bx, int by, 
 	int sx, int sy, #Image size
 	int n_cellsx, int n_cellsy, 
 	int visualise, int orientations, 
 	np.ndarray[np.float64_t, ndim=3] orientation_histogram):

 	"""
 	The third stage aims to produce an encoding that is sensitive to
 	local image content while remaining resistant to small changes in
 	pose or appearance. The adopted method pools gradient orientation
 	information locally in the same way as the SIFT [Lowe 2004]
 	feature. The image window is divided into small spatial regions,
 	called "cells". For each cell we accumulate a local 1-D histogram
 	of gradient or edge orientations over all the pixels in the
 	cell. This combined cell-level 1-D histogram forms the basic
 	"orientation histogram" representation. Each orientation histogram
 	divides the gradient angle range into a fixed number of
 	predetermined bins. The gradient magnitudes of the pixels in the
 	cell are used to vote into the orientation histogram.
 	"""

 	cdef np.ndarray[np.float64_t, ndim=2] magnitude = sqrt(gx**2 + gy**2)
 	cdef np.ndarray[np.float64_t, ndim=2] orientation = arctan2(gy, gx) * (180 / pi) % 180
 	cdef int i, x, y, o, yi, xi, cy1, cy2, cx1, cx2
 	cdef float ori1, ori2

 	# compute orientations integral images

 	for i in range(orientations):
 		# isolate orientations in this range

 		ori1 = 180. / orientations * (i + 1)
 		ori2 = 180. / orientations * i

 		y = cy / 2
 		cy2 = cy * n_cellsy
 		x = cx / 2
 		cx2 = cx * n_cellsx
 		yi = 0
 		xi = 0

 		while y < cy2:
 			xi = 0
 			x = cx / 2

 			while x < cx2:
 				orientation_histogram[yi, xi, i] = CellHog(magnitude, orientation, ori1, ori2, cx, cy, x, y, sx, sy)
 				xi += 1
 				x += cx

 			yi += 1
 			y += cy


 cdef VisualiseHistograms(int cx, int cy, 
 	int n_cellsx, int n_cellsy, 
 	int orientations, 
 	np.ndarray[np.float64_t, ndim=3] orientation_histogram, 
 	np.ndarray[np.float64_t, ndim=2] hog_image):

 	# now for each cell, compute the histogram
 	from skimage import draw

 	radius = min(cx, cy) // 2 - 1
 	for x in range(n_cellsx):
 		for y in range(n_cellsy):
 			for o in range(orientations):
 				centre = tuple([y * cy + cy // 2, x * cx + cx // 2])
 				dx = radius * cos(float(o) / orientations * np.pi)
 				dy = radius * sin(float(o) / orientations * np.pi)
 				rr, cc = draw.line(int(centre[0] - dx),
 								   int(centre[1] - dy),
 								   int(centre[0] + dx),
 								   int(centre[1] + dy))
 				hog_image[rr, cc] += orientation_histogram[y, x, o]



 def hog(np.ndarray[np.float64_t, ndim=2] image, 
 		int orientations=9, 
 		pixels_per_cell=(8, 8),
 		cells_per_block=(3, 3), 
 		int visualise=0, int normalise=0):
 	"""Extract Histogram of Oriented Gradients (HOG) for a given image.

 	Compute a Histogram of Oriented Gradients (HOG) by

 		1. (optional) global image normalisation
 		2. computing the gradient image in x and y
 		3. computing gradient histograms
 		4. normalising across blocks
 		5. flattening into a feature vector

 	Parameters
 	----------
 	image : (M, N) ndarray
 		Input image (greyscale).
 	orientations : int
 		Number of orientation bins.
 	pixels_per_cell : 2 tuple (int, int)
 		Size (in pixels) of a cell.
 	cells_per_block  : 2 tuple (int,int)
 		Number of cells in each block.
 	visualise : bool, optional
 		Also return an image of the HOG.
 	normalise : bool, optional
 		Apply power law compression to normalise the image before
 		processing.

 	Returns
 	-------
 	newarr : ndarray
 		HOG for the image as a 1D (flattened) array.
 	hog_image : ndarray (if visualise=True)
 		A visualisation of the HOG image.

 	References
 	----------
 	* http://en.wikipedia.org/wiki/Histogram_of_oriented_gradients

 	* Dalal, N and Triggs, B, Histograms of Oriented Gradients for
 	  Human Detection, IEEE Computer Society Conference on Computer
 	  Vision and Pattern Recognition 2005 San Diego, CA, USA

 	"""

 	"""
 	The first stage applies an optional global image normalisation
 	equalisation that is designed to reduce the influence of illumination
 	effects. In practice we use gamma (power law) compression, either
 	computing the square root or the log of each colour channel.
 	Image texture strength is typically proportional to the local surface
 	illumination so this compression helps to reduce the effects of local
 	shadowing and illumination variations.
 	"""

 	if normalise:
 		image = sqrt(image)

 	"""
 	The second stage computes first order image gradients. These capture
 	contour, silhouette and some texture information, while providing
 	further resistance to illumination variations. The locally dominant
 	colour channel is used, which provides colour invariance to a large
 	extent. Variant methods may also include second order image derivatives,
 	which act as primitive bar detectors - a useful feature for capturing,
 	e.g. bar like structures in bicycles and limbs in humans.
 	"""

 	cdef int sy = image.shape[0]
 	cdef int sx = image.shape[1]
 	cdef np.ndarray[np.float64_t, ndim=2] gx = np.zeros((sy,sx))
 	cdef np.ndarray[np.float64_t, ndim=2] gy = np.zeros((sy,sx))
 	gx[:, :-1] = np.diff(image, n=1, axis=1)
 	gy[:-1, :] = np.diff(image, n=1, axis=0)

 	cdef int cx = pixels_per_cell[0]
 	cdef int cy = pixels_per_cell[1]
 	cdef int bx = cells_per_block[0]
 	cdef int by = cells_per_block[1]
 	
 	cdef int n_cellsx = int(np.floor(sx // cx))  # number of cells in x
 	cdef int n_cellsy = int(np.floor(sy // cy))  # number of cells in y

 	cdef np.ndarray[np.float64_t, ndim=3] orientation_histogram = np.zeros((n_cellsy, n_cellsx, orientations))
 	HogThirdStage(gx, gy, cx, cy, bx, by, sx, sy, n_cellsx, n_cellsy, 
 		visualise, orientations, orientation_histogram)

 	cdef np.ndarray[np.float64_t, ndim=2] hog_image
 	if visualise:
 		hog_image = np.zeros((sy, sx), dtype=float)
 		VisualiseHistograms(cx, cy, n_cellsx, n_cellsy, 
 			orientations, orientation_histogram, hog_image)

 	"""
 	The fourth stage computes normalisation, which takes local groups of
 	cells and contrast normalises their overall responses before passing
 	to next stage. Normalisation introduces better invariance to illumination,
 	shadowing, and edge contrast. It is performed by accumulating a measure
 	of local histogram "energy" over local groups of cells that we call
 	"blocks". The result is used to normalise each cell in the block.
 	Typically each individual cell is shared between several blocks, but
 	its normalisations are block dependent and thus different. The cell
 	thus appears several times in the final output vector with different
 	normalisations. This may seem redundant but it improves the performance.
 	We refer to the normalised block descriptors as Histogram of Oriented
 	Gradient (HOG) descriptors.
 	"""

 	cdef int n_blocksx = (n_cellsx - bx) + 1
 	cdef int n_blocksy = (n_cellsy - by) + 1
 	normalised_blocks = np.zeros((n_blocksy, n_blocksx,
 								  by, bx, orientations))

 	for x in range(n_blocksx):
 		for y in range(n_blocksy):
 			block = orientation_histogram[y:y + by, x:x + bx, :]
 			eps = 1e-5
 			normalised_blocks[y, x, :] = block / sqrt(block.sum()**2 + eps)

 	"""
 	The final step collects the HOG descriptors from all blocks of a dense
 	overlapping grid of blocks covering the detection window into a combined
 	feature vector for use in the window classifier.
 	"""

 	if visualise:
 		return normalised_blocks.ravel(), hog_image
 	else:
 		return normalised_blocks.ravel()
	# cython: profile=True
	# cython: cdivision=True
	# cython: boundscheck=False
	# cython: wraparound=False

	import cmath, math
	cimport numpy as np
	import numpy as np
	'''
	Based on _hog.py from https://github.com/scikit-image/scikit-image

	Copyright (C) 2011, the scikit-image team
	(C) 2013 Tim Sheerman-Chase
	All rights reserved.

	Redistribution and use in source and binary forms, with or without
	modification, are permitted provided that the following conditions are
	met:

	1. Redistributions of source code must retain the above copyright
	notice, this list of conditions and the following disclaimer.
	2. Redistributions in binary form must reproduce the above copyright
	notice, this list of conditions and the following disclaimer in
	the documentation and/or other materials provided with the
	distribution.
	3. Neither the name of skimage nor the names of its contributors may be
	used to endorse or promote products derived from this software without
	specific prior written permission.

	THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
	IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
	WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
	DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
	INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
	(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
	SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
	HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
	STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
	IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
	POSSIBILITY OF SUCH DAMAGE.
	'''

	import numpy as np
	from scipy import sqrt, pi, arctan2, cos, sin

	cdef float CellHog(np.ndarray[np.float64_t, ndim=2] magnitude,
	np.ndarray[np.float64_t, ndim=2] orientation,
	float ori1, float ori2,
	int cx, int cy, int xi, int yi, int sx, int sy):
	cdef int cx1, cy1

	cdef float total = 0.
	for cy1 in range(-cy/2, cy/2):
	for cx1 in range(-cx/2, cx/2):
	if yi + cy1 < 0: continue
	if yi + cy1 >= sy: continue
	if xi + cx1 < 0: continue
	if xi + cx1 >= sx: continue
	if orientation[yi + cy1, xi + cx1] >= ori1: continue
	if orientation[yi + cy1, xi + cx1] < ori2: continue

	total += magnitude[yi + cy1, xi + cx1]

	return total

	cdef HogThirdStage(np.ndarray[np.float64_t, ndim=2] gx, \
	np.ndarray[np.float64_t, ndim=2] gy,
	int cx, int cy, #Pixels per cell
	int bx, int by,
	int sx, int sy, #Image size
	int n_cellsx, int n_cellsy,
	int visualise, int orientations,
	np.ndarray[np.float64_t, ndim=3] orientation_histogram):

	"""
	The third stage aims to produce an encoding that is sensitive to
	local image content while remaining resistant to small changes in
	pose or appearance. The adopted method pools gradient orientation
	information locally in the same way as the SIFT [Lowe 2004]
	feature. The image window is divided into small spatial regions,
	called "cells". For each cell we accumulate a local 1-D histogram
	of gradient or edge orientations over all the pixels in the
	cell. This combined cell-level 1-D histogram forms the basic
	"orientation histogram" representation. Each orientation histogram
	divides the gradient angle range into a fixed number of
	predetermined bins. The gradient magnitudes of the pixels in the
	cell are used to vote into the orientation histogram.
	"""

	cdef np.ndarray[np.float64_t, ndim=2] magnitude = sqrt(gx2 + gy2)
	cdef np.ndarray[np.float64_t, ndim=2] orientation = arctan2(gy, gx) * (180 / pi) % 180
	cdef int i, x, y, o, yi, xi, cy1, cy2, cx1, cx2
	cdef float ori1, ori2

	# compute orientations integral images

	for i in range(orientations):
	# isolate orientations in this range

	ori1 = 180. / orientations * (i + 1)
	ori2 = 180. / orientations * i

	y = cy / 2
	cy2 = cy * n_cellsy
	x = cx / 2
	cx2 = cx * n_cellsx
	yi = 0
	xi = 0

	while y < cy2:
	xi = 0
	x = cx / 2

	while x < cx2:
	orientation_histogram[yi, xi, i] = CellHog(magnitude, orientation, ori1, ori2, cx, cy, x, y, sx, sy)
	xi += 1
	x += cx

	yi += 1
	y += cy


	cdef VisualiseHistograms(int cx, int cy,
	int n_cellsx, int n_cellsy,
	int orientations,
	np.ndarray[np.float64_t, ndim=3] orientation_histogram,
	np.ndarray[np.float64_t, ndim=2] hog_image):

	# now for each cell, compute the histogram
	from skimage import draw

	radius = min(cx, cy) // 2 - 1
	for x in range(n_cellsx):
	for y in range(n_cellsy):
	for o in range(orientations):
	centre = tuple([y * cy + cy // 2, x * cx + cx // 2])
	dx = radius * cos(float(o) / orientations * np.pi)
	dy = radius * sin(float(o) / orientations * np.pi)
	rr, cc = draw.line(int(centre[0] - dx),
	int(centre[1] - dy),
	int(centre[0] + dx),
	int(centre[1] + dy))
	hog_image[rr, cc] += orientation_histogram[y, x, o]



	def hog(np.ndarray[np.float64_t, ndim=2] image,
	int orientations=9,
	pixels_per_cell=(8, 8),
	cells_per_block=(3, 3),
	int visualise=0, int normalise=0):
	"""Extract Histogram of Oriented Gradients (HOG) for a given image.

	Compute a Histogram of Oriented Gradients (HOG) by

	1. (optional) global image normalisation
	2. computing the gradient image in x and y
	3. computing gradient histograms
	4. normalising across blocks
	5. flattening into a feature vector

	Parameters
	----------
	image : (M, N) ndarray
	Input image (greyscale).
	orientations : int
	Number of orientation bins.
	pixels_per_cell : 2 tuple (int, int)
	Size (in pixels) of a cell.
	cells_per_block : 2 tuple (int,int)
	Number of cells in each block.
	visualise : bool, optional
	Also return an image of the HOG.
	normalise : bool, optional
	Apply power law compression to normalise the image before
	processing.

	Returns
	-------
	newarr : ndarray
	HOG for the image as a 1D (flattened) array.
	hog_image : ndarray (if visualise=True)
	A visualisation of the HOG image.

	References
	----------
	* http://en.wikipedia.org/wiki/Histogram_of_oriented_gradients

	* Dalal, N and Triggs, B, Histograms of Oriented Gradients for
	Human Detection, IEEE Computer Society Conference on Computer
	Vision and Pattern Recognition 2005 San Diego, CA, USA

	"""

	"""
	The first stage applies an optional global image normalisation
	equalisation that is designed to reduce the influence of illumination
	effects. In practice we use gamma (power law) compression, either
	computing the square root or the log of each colour channel.
	Image texture strength is typically proportional to the local surface
	illumination so this compression helps to reduce the effects of local
	shadowing and illumination variations.
	"""

	if normalise:
	image = sqrt(image)

	"""
	The second stage computes first order image gradients. These capture
	contour, silhouette and some texture information, while providing
	further resistance to illumination variations. The locally dominant
	colour channel is used, which provides colour invariance to a large
	extent. Variant methods may also include second order image derivatives,
	which act as primitive bar detectors - a useful feature for capturing,
	e.g. bar like structures in bicycles and limbs in humans.
	"""

	cdef int sy = image.shape[0]
	cdef int sx = image.shape[1]
	cdef np.ndarray[np.float64_t, ndim=2] gx = np.zeros((sy,sx))
	cdef np.ndarray[np.float64_t, ndim=2] gy = np.zeros((sy,sx))
	gx[:, :-1] = np.diff(image, n=1, axis=1)
	gy[:-1, :] = np.diff(image, n=1, axis=0)

	cdef int cx = pixels_per_cell[0]
	cdef int cy = pixels_per_cell[1]
	cdef int bx = cells_per_block[0]
	cdef int by = cells_per_block[1]

	cdef int n_cellsx = int(np.floor(sx // cx)) # number of cells in x
	cdef int n_cellsy = int(np.floor(sy // cy)) # number of cells in y

	cdef np.ndarray[np.float64_t, ndim=3] orientation_histogram = np.zeros((n_cellsy, n_cellsx, orientations))
	HogThirdStage(gx, gy, cx, cy, bx, by, sx, sy, n_cellsx, n_cellsy,
	visualise, orientations, orientation_histogram)

	cdef np.ndarray[np.float64_t, ndim=2] hog_image
	if visualise:
	hog_image = np.zeros((sy, sx), dtype=float)
	VisualiseHistograms(cx, cy, n_cellsx, n_cellsy,
	orientations, orientation_histogram, hog_image)

	"""
	The fourth stage computes normalisation, which takes local groups of
	cells and contrast normalises their overall responses before passing
	to next stage. Normalisation introduces better invariance to illumination,
	shadowing, and edge contrast. It is performed by accumulating a measure
	of local histogram "energy" over local groups of cells that we call
	"blocks". The result is used to normalise each cell in the block.
	Typically each individual cell is shared between several blocks, but
	its normalisations are block dependent and thus different. The cell
	thus appears several times in the final output vector with different
	normalisations. This may seem redundant but it improves the performance.
	We refer to the normalised block descriptors as Histogram of Oriented
	Gradient (HOG) descriptors.
	"""

	cdef int n_blocksx = (n_cellsx - bx) + 1
	cdef int n_blocksy = (n_cellsy - by) + 1
	normalised_blocks = np.zeros((n_blocksy, n_blocksx,
	by, bx, orientations))

	for x in range(n_blocksx):
	for y in range(n_blocksy):
	block = orientation_histogram[y:y + by, x:x + bx, :]
	eps = 1e-5
	normalised_blocks[y, x, :] = block / sqrt(block.sum()**2 + eps)

	"""
	The final step collects the HOG descriptors from all blocks of a dense
	overlapping grid of blocks covering the detection window into a combined
	feature vector for use in the window classifier.
	"""

	if visualise:
	return normalised_blocks.ravel(), hog_image
	else:
	return normalised_blocks.ravel()