tolleiv · September 28, 2012 08:51
diff --git a/gistfile1.txt b/gistfile1.txt
 # origin: http://sifter.org/~simon/journal/20061211.html
 # further resource to get the context: http://www.stat.osu.edu/~dmsl/Koren_2009.pdf

 samples = [[1,1,5.0], [1,2,3.0], [1,3,2.5],
           [2,1,2.0], [2,2,2.5], [2,3,5.0], [2,4,2.0],
 	   [3,1,2.5], [3,4,4.0], [3,5,4.5], [3,7,5.0],
 	   [4,1,5.0], [4,3,3.0], [4,4,4.5], [4,6,4.0],
 	   [5,1,4.0], [5,1,3.0], [5,1,2.0], [5,4,4.0], [5,5,3.5], [5,6,4.0]]

 # avoid overfitting	   
 lambda=0.02
 # primary learning rate - in addition learning has to converge to gamma^2
 gamma=0.005
 # amount of features - 2 works fine / 5 seems to be the maximum
 features = 3
 # initialize features - value is not really important
 init = Array.new(features, 0.1)
 u = Array.new(5).fill { init.clone }
 uB = Array.new(5, 0)
 i = Array.new(7).fill { init.clone }
 iB = Array.new(7, 0)

 def dot_product l1, l2
    sum = 0
    for i in 0...l1.size
        sum += l1[i] * l2[i]
    end
    sum
 end

 def predict uX,iX,u,i,uB,iB
     iB[iX] + uB[uX] + dot_product(i[iX],u[uX])
 end

 # training
 features.times do |feat|
    old = 0; uN = 0; iN = 0; x = 0
    begin
 	old = uN.abs+iN.abs
        samples.each do |s|
            uX = s[0]-1; iX = s[1]-1
            err = s[2] - (iB[iX] + uB[uX] + dot_product(i[iX],u[uX]))
 	    uN = u[uX][feat] + gamma * (err*i[iX][feat]-lambda*u[uX][feat])
 	    iN = i[iX][feat] + gamma * (err*u[uX][feat]-lambda*i[iX][feat])
 	    uBn = uB[uX] + gamma * (err-lambda*uB[uX])
 	    iBn = iB[iX] + gamma * (err-lambda*iB[iX])
 	    u[uX][feat] = uN
 	    i[iX][feat] = iN
 	    uB[uX] = uBn
 	    iB[iX] = iBn
 	end
 	x+=1
    end while (old+gamma**2 < uN.abs+iN.abs)
    puts "learning feature #{feat} took #{x} iterations"
 end

 # let's see what we got:
 puts "User:"
 u.each { |uR| uR.each {|v| print " %.2f" % v }; puts "" }
 puts uB.inspect
 puts "Items:"
 i.each { |iR| iR.each {|v| print " %.2f" % v }; puts "" }
 puts iB.inspect
 # And here's a prediction
 puts "User 1 - Item 4: %.2f (should be close to 4)" % predict(0,3,u,i,uB,iB)
	# origin: http://sifter.org/~simon/journal/20061211.html
	# further resource to get the context: http://www.stat.osu.edu/~dmsl/Koren_2009.pdf

	samples = [[1,1,5.0], [1,2,3.0], [1,3,2.5],
	[2,1,2.0], [2,2,2.5], [2,3,5.0], [2,4,2.0],
	[3,1,2.5], [3,4,4.0], [3,5,4.5], [3,7,5.0],
	[4,1,5.0], [4,3,3.0], [4,4,4.5], [4,6,4.0],
	[5,1,4.0], [5,1,3.0], [5,1,2.0], [5,4,4.0], [5,5,3.5], [5,6,4.0]]

	# avoid overfitting
	lambda=0.02
	# primary learning rate - in addition learning has to converge to gamma^2
	gamma=0.005
	# amount of features - 2 works fine / 5 seems to be the maximum
	features = 3
	# initialize features - value is not really important
	init = Array.new(features, 0.1)
	u = Array.new(5).fill { init.clone }
	uB = Array.new(5, 0)
	i = Array.new(7).fill { init.clone }
	iB = Array.new(7, 0)

	def dot_product l1, l2
	sum = 0
	for i in 0...l1.size
	sum += l1[i] * l2[i]
	end
	sum
	end

	def predict uX,iX,u,i,uB,iB
	iB[iX] + uB[uX] + dot_product(i[iX],u[uX])
	end

	# training
	features.times do \|feat\|
	old = 0; uN = 0; iN = 0; x = 0
	begin
	old = uN.abs+iN.abs
	samples.each do \|s\|
	uX = s[0]-1; iX = s[1]-1
	err = s[2] - (iB[iX] + uB[uX] + dot_product(i[iX],u[uX]))
	uN = u[uX][feat] + gamma * (erri[iX][feat]-lambdau[uX][feat])
	iN = i[iX][feat] + gamma * (erru[uX][feat]-lambdai[iX][feat])
	uBn = uB[uX] + gamma * (err-lambda*uB[uX])
	iBn = iB[iX] + gamma * (err-lambda*iB[iX])
	u[uX][feat] = uN
	i[iX][feat] = iN
	uB[uX] = uBn
	iB[iX] = iBn
	end
	x+=1
	end while (old+gamma**2 < uN.abs+iN.abs)
	puts "learning feature #{feat} took #{x} iterations"
	end

	# let's see what we got:
	puts "User:"
	u.each { \|uR\| uR.each {\|v\| print " %.2f" % v }; puts "" }
	puts uB.inspect
	puts "Items:"
	i.each { \|iR\| iR.each {\|v\| print " %.2f" % v }; puts "" }
	puts iB.inspect
	# And here's a prediction
	puts "User 1 - Item 4: %.2f (should be close to 4)" % predict(0,3,u,i,uB,iB)