EnsekiTT · January 23, 2017 15:22
diff --git a/simple_sample.lua b/simple_sample.lua
 require 'torch'

 torch.manualSeed(114514)

 -- choose a dimension
 N = 5

 -- create a random NxN matrix
 A = torch.rand(N, N)

 -- make it symmetric positive
 A = A*A:t()

 -- make it definite
 A:add(0.001, torch.eye(N))

 -- add a linear term
 b = torch.rand(N)

 -- create the quadratic form
 function J(x)
   return 0.5*x:dot(A*x)-b:dot(x)
 end

 print(J(torch.rand(N)))

 -- 2. Find the exact minimum
 xs = torch.inverse(A)*b
 print(string.format('J(x^*) = %g', J(xs)))


 -- 3. Search the minimum by gradient descent
 function dJ(x)
  return A*x-b
 end

 x = torch.rand(N)

 lr = 0.01
 for i=1,20000 do
  x = x - dJ(x)*lr
  -- we print the value of the objective function at each iteration
  print(string.format('at iter %d J(x) = %f', i, J(x)))
 end

 -- 4. Using the optim package
 local A = torch.rand(N, N)

 do
   local A = torch.rand(N, N)
   print(A)
 end
 print(A)

 do
   local neval = 0
   function JdJ(x)
      local Jx = J(x)
      neval = neval + 1
      print(string.format('after %d evaluations J(x) = %f', neval, Jx))
      return Jx, dJ(x)
   end
 end

 require 'optim'

 state = {
   verbose = true,
   maxIter = 100
 }

 x = torch.rand(N)
 optim.cg(JdJ, x, state)

 -- 5. Plot

 -- CG
 evaluations = {}
 time = {}
 timer = torch.Timer()
 neval = 0
 function JdJ(x)
   local Jx = J(x)
   neval = neval + 1
   print(string.format('after %d evaluations, J(x) = %f', neval, Jx))
   table.insert(evaluations, Jx)
   table.insert(time, timer:time().real)
   return Jx, dJ(x)
 end

 state = {
   verbose = true,
   maxIter = 100
 }

 x0 = torch.rand(N)
 cgx = x0:clone() -- make a copy of x0
 timer:reset()
 optim.cg(JdJ, cgx, state)

 -- we convert the evaluations and time tables to tensors for plotting:
 cgtime = torch.Tensor(time)
 cgevaluations = torch.Tensor(evaluations)


 -- sgd
 evaluations = {}
 time = {}
 neval = 0
 state = {
  lr = 0.1
 }

 -- we start from the same starting point than for CG
 x = x0:clone()

 -- reset the timer!
 timer:reset()

 -- note that SGD optimizer requires us to do the loop
 for i=1,1000 do
  optim.sgd(JdJ, x, state)
  table.insert(evaluations, Jx)
 end

 sgdtime = torch.Tensor(time)
 sgdevaluations = torch.Tensor(evaluations)

 require 'gnuplot'

 gnuplot.figure(1)
 gnuplot.title('CG loss minimisation over time')
 gnuplot.plot(cgtime, cgevaluations)

 gnuplot.figure(2)
 gnuplot.title('SGD loss minimisation over time')
 gnuplot.plot(sgdtime, sgdevaluations)

 gnuplot.pngfigure('myplot.png')
 gnuplot.plot(
   {'CG',  cgtime,  cgevaluations,  '-'},
   {'SGD', sgdtime, sgdevaluations, '-'})
 gnuplot.xlabel('time (s)')
 gnuplot.ylabel('J(x)')
 gnuplot.plotflush()
	require 'torch'

	torch.manualSeed(114514)

	-- choose a dimension
	N = 5

	-- create a random NxN matrix
	A = torch.rand(N, N)

	-- make it symmetric positive
	A = A*A:t()

	-- make it definite
	A:add(0.001, torch.eye(N))

	-- add a linear term
	b = torch.rand(N)

	-- create the quadratic form
	function J(x)
	return 0.5x:dot(Ax)-b:dot(x)
	end

	print(J(torch.rand(N)))

	-- 2. Find the exact minimum
	xs = torch.inverse(A)*b
	print(string.format('J(x^*) = %g', J(xs)))


	-- 3. Search the minimum by gradient descent
	function dJ(x)
	return A*x-b
	end

	x = torch.rand(N)

	lr = 0.01
	for i=1,20000 do
	x = x - dJ(x)*lr
	-- we print the value of the objective function at each iteration
	print(string.format('at iter %d J(x) = %f', i, J(x)))
	end

	-- 4. Using the optim package
	local A = torch.rand(N, N)

	do
	local A = torch.rand(N, N)
	print(A)
	end
	print(A)

	do
	local neval = 0
	function JdJ(x)
	local Jx = J(x)
	neval = neval + 1
	print(string.format('after %d evaluations J(x) = %f', neval, Jx))
	return Jx, dJ(x)
	end
	end

	require 'optim'

	state = {
	verbose = true,
	maxIter = 100
	}

	x = torch.rand(N)
	optim.cg(JdJ, x, state)

	-- 5. Plot

	-- CG
	evaluations = {}
	time = {}
	timer = torch.Timer()
	neval = 0
	function JdJ(x)
	local Jx = J(x)
	neval = neval + 1
	print(string.format('after %d evaluations, J(x) = %f', neval, Jx))
	table.insert(evaluations, Jx)
	table.insert(time, timer:time().real)
	return Jx, dJ(x)
	end

	state = {
	verbose = true,
	maxIter = 100
	}

	x0 = torch.rand(N)
	cgx = x0:clone() -- make a copy of x0
	timer:reset()
	optim.cg(JdJ, cgx, state)

	-- we convert the evaluations and time tables to tensors for plotting:
	cgtime = torch.Tensor(time)
	cgevaluations = torch.Tensor(evaluations)


	-- sgd
	evaluations = {}
	time = {}
	neval = 0
	state = {
	lr = 0.1
	}

	-- we start from the same starting point than for CG
	x = x0:clone()

	-- reset the timer!
	timer:reset()

	-- note that SGD optimizer requires us to do the loop
	for i=1,1000 do
	optim.sgd(JdJ, x, state)
	table.insert(evaluations, Jx)
	end

	sgdtime = torch.Tensor(time)
	sgdevaluations = torch.Tensor(evaluations)

	require 'gnuplot'

	gnuplot.figure(1)
	gnuplot.title('CG loss minimisation over time')
	gnuplot.plot(cgtime, cgevaluations)

	gnuplot.figure(2)
	gnuplot.title('SGD loss minimisation over time')
	gnuplot.plot(sgdtime, sgdevaluations)

	gnuplot.pngfigure('myplot.png')
	gnuplot.plot(
	{'CG', cgtime, cgevaluations, '-'},
	{'SGD', sgdtime, sgdevaluations, '-'})
	gnuplot.xlabel('time (s)')
	gnuplot.ylabel('J(x)')
	gnuplot.plotflush()