Created May 26, 2015 19:58
A tutorial example of a vectorized neural network implementation in Python #neural #Python
# Source: https://getpocket.com/a/read/932998243
import copy
import numpy as np
class network:
    # layers - list, e.g. [5, 10, 10, 5]: 5 inputs, 2 hidden
    # layers (10 neurons each), 5 outputs
    def create(self, layers):
        theta = [0]  # placeholder so that theta[i] matches layer i
        # for each layer from the first (skip the zero layer!)
        for i in range(1, len(layers)):
            # create an N x (M + 1) matrix (+1 column for the bias!)
            # with random floats in the range [-1; 1]
            theta.append(
                np.mat(np.random.uniform(-1, 1, (layers[i], layers[i - 1] + 1))))
        nn = {'theta': theta, 'structure': layers}
        return nn
    def runAll(self, nn, X):
        z = [0]
        m = len(X)
        a = [copy.deepcopy(X)]  # a[0] equals the input values
        logFunc = self.logisticFunctionVectorize()
        # for each layer except the input
        for i in range(1, len(nn['structure'])):
            # add a bias column to the previous layer's activation matrix
            a[i - 1] = np.c_[np.ones(m), a[i - 1]]
            # for every neuron in the current layer, multiply the
            # corresponding neurons in the previous layer by the
            # appropriate weights and sum the products
            z.append(a[i - 1] * nn['theta'][i].T)
            # apply the activation function to each value
            a.append(logFunc(z[i]))
        nn['z'] = z
        nn['a'] = a
        return a[len(nn['structure']) - 1]
    def run(self, inputs):
        z = [0]
        a = []
        a.append(copy.deepcopy(inputs))
        a[0] = np.matrix(a[0]).T  # n x 1 column vector
        logFunc = self.logisticFunctionVectorize()
        for i in range(1, len(nn['structure'])):
            a[i - 1] = np.vstack(([1], a[i - 1]))  # prepend the bias unit
            z.append(nn['theta'][i] * a[i - 1])
            a.append(logFunc(z[i]))
        nn['z'] = z
        nn['a'] = a
        return a[len(nn['structure']) - 1]
    def logisticFunction(self, x):
        a = 1 / (1 + np.exp(-x))
        # clip the result away from exactly 0 and 1 so that the cost
        # function never takes log(0)
        if a == 1:
            a = 0.99999  # smallest step towards zero
        elif a == 0:
            # np.nextafter(0, 1) would give the smallest step towards
            # one, but sometimes that step is too small and other
            # algorithms fail :)
            a = 0.00001
        return a
    def logisticFunctionVectorize(self):
        return np.vectorize(self.logisticFunction)
    def costTotal(self, theta, nn, X, y, lamb):
        m = len(X)
        # the following lines are needed for fmin_cg computation
        if type(theta) == np.ndarray:
            nn['theta'] = self.roll(theta, nn['structure'])
        y = np.matrix(copy.deepcopy(y))
        # feed forward to obtain the output of the neural network
        hAll = self.runAll(nn, X)
        cost = self.cost(hAll, y)
        # apply regularization
        return cost / m + (lamb / (2 * m)) * self.regul(nn['theta'])
    def cost(self, h, y):
        logH = np.log(h)
        log1H = np.log(1 - h)
        # transpose y for matrix multiplication
        cost = -1 * y.T * logH - (1 - y.T) * log1H
        # sum the matrix of costs over all output neurons and input vectors
        return cost.sum(axis=0).sum(axis=1)
    def regul(self, theta):
        reg = 0
        thetaLocal = copy.deepcopy(theta)
        for i in range(1, len(thetaLocal)):
            # delete the bias connections
            thetaLocal[i] = np.delete(thetaLocal[i], 0, 1)
            # square the values because they can be negative
            thetaLocal[i] = np.power(thetaLocal[i], 2)
            # sum over rows first, then over columns
            reg += thetaLocal[i].sum(axis=0).sum(axis=1)
        return reg
    def backpropagation(self, theta, nn, X, y, lamb):
        layersNumb = len(nn['structure'])
        thetaDelta = [0] * layersNumb
        m = len(X)
        # as in costTotal: roll the flat vector from fmin_cg back into
        # matrices so the gradient is evaluated at the requested point
        if type(theta) == np.ndarray:
            nn['theta'] = self.roll(theta, nn['structure'])
        # calculate the matrix of output values for all input vectors X
        hLoc = copy.deepcopy(self.runAll(nn, X))
        yLoc = np.matrix(y)
        thetaLoc = copy.deepcopy(nn['theta'])
        # derivative of the logistic function: s(x) * (1 - s(x))
        derFunct = np.vectorize(
            lambda x: (1 / (1 + np.exp(-x))) * (1 - (1 / (1 + np.exp(-x)))))
        zLoc = copy.deepcopy(nn['z'])
        aLoc = copy.deepcopy(nn['a'])
        for n in range(0, len(X)):
            delta = [0] * (layersNumb + 1)  # fill the list with zeros
            # calculate the delta of the error at the output layer
            delta[len(delta) - 1] = (hLoc[n].T - yLoc[n].T)
            for i in range(layersNumb - 1, 0, -1):
                # we cannot calculate delta[0] because we have no theta[0]
                # (and we don't need it anyway)
                if i > 1:
                    z = zLoc[i - 1][n]
                    # prepend a one for correct matrix multiplication
                    z = np.c_[[[1]], z]
                    delta[i] = np.multiply(
                        thetaLoc[i].T * delta[i + 1], derFunct(z).T)
                    delta[i] = delta[i][1:]  # drop the bias component
                thetaDelta[i] = thetaDelta[i] + delta[i + 1] * aLoc[i - 1][n]
        for i in range(1, len(thetaDelta)):
            thetaDelta[i] = thetaDelta[i] / m
            thetaDelta[i][:, 1:] = thetaDelta[i][:, 1:] + \
                thetaLoc[i][:, 1:] * (lamb / m)  # regularization
        if type(theta) == np.ndarray:
            # unroll to a flat array so fmin_cg can consume the gradient
            return np.asarray(self.unroll(thetaDelta)).reshape(-1)
        return thetaDelta
    # create a 1-D array from a list of matrices like theta
    def unroll(self, arr):
        for i in range(0, len(arr)):
            arr[i] = np.matrix(arr[i])
            if i == 0:
                res = (arr[i]).ravel().T
            else:
                res = np.vstack((res, (arr[i]).ravel().T))
        res.shape = (1, len(res))
        return res
    # roll the 1-D array back into a list of matrices according to the
    # given structure
    def roll(self, arr, structure):
        rolled = [arr[0]]  # keep the placeholder at index 0
        shift = 1
        for i in range(1, len(structure)):
            temparr = copy.deepcopy(
                arr[shift:shift + structure[i] * (structure[i - 1] + 1)])
            temparr.shape = (structure[i], structure[i - 1] + 1)
            rolled.append(np.matrix(temparr))
            shift += structure[i] * (structure[i - 1] + 1)
        return rolled
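
The gist itself never shows how the pieces fit together, so here is a minimal usage sketch (not part of the original file): it trains the network on the XOR truth table with scipy.optimize.fmin_cg, using costTotal as the objective and backpropagation as its gradient. The layer sizes, maxiter value, and the float() wrapper (fmin_cg expects a scalar while costTotal returns a 1x1 matrix) are illustrative choices, not part of the original code.

from scipy import optimize

net = network()
nn = net.create([2, 5, 1])  # 2 inputs, one hidden layer of 5 neurons, 1 output
X = np.matrix([[0, 0], [0, 1], [1, 0], [1, 1]])  # XOR inputs
y = np.matrix([[0], [1], [1], [0]])              # XOR outputs
lamb = 0.0  # no regularization for this toy problem

# flatten the initial weights into the 1-D vector that fmin_cg expects
theta0 = np.asarray(net.unroll(copy.deepcopy(nn['theta']))).reshape(-1)
cost = lambda t: float(net.costTotal(t, nn, X, y, lamb))
grad = lambda t: net.backpropagation(t, nn, X, y, lamb)
thetaOpt = optimize.fmin_cg(cost, theta0, fprime=grad, maxiter=200)

nn['theta'] = net.roll(thetaOpt, nn['structure'])
print(net.runAll(nn, X))  # the outputs should approach [0, 1, 1, 0]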
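A quick way to validate the backpropagation implementation is to compare its analytic gradient against central finite differences of costTotal. The helper below is a sketch reusing net, nn, X, y and lamb from the example above; gradient_check and the step eps are hypothetical names and values, not part of the gist.

def gradient_check(net, nn, X, y, lamb, eps=1e-4):
    # flat parameter vector; index 0 is the unused placeholder
    theta0 = np.asarray(net.unroll(copy.deepcopy(nn['theta']))).reshape(-1)
    analytic = net.backpropagation(theta0, nn, X, y, lamb)
    numeric = np.zeros_like(theta0)
    for j in range(1, len(theta0)):  # skip the placeholder
        e = np.zeros_like(theta0)
        e[j] = eps
        # central difference: (J(t + e) - J(t - e)) / (2 * eps)
        numeric[j] = float(net.costTotal(theta0 + e, nn, X, y, lamb)
                           - net.costTotal(theta0 - e, nn, X, y, lamb)) / (2 * eps)
    return np.max(np.abs(analytic[1:] - numeric[1:]))

print(gradient_check(net, nn, X, y, lamb))  # should be very close to zero

If the returned difference is not tiny (say, below 1e-6), the gradient and the cost disagree, which usually points at a bug in the deltas or in the regularization terms.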