diff options
author | Clement Farabet <clement.farabet@gmail.com> | 2012-09-28 21:52:18 +0400 |
---|---|---|
committer | Clement Farabet <clement.farabet@gmail.com> | 2012-09-28 21:52:18 +0400 |
commit | c12e430a890092c83ed950683704b68831a64e6e (patch) | |
tree | 3b289ce0aedbec8a5ba657f8fc682c1a6b23aca5 | |
parent | f16142686048d6e2b17a4ccac192753135d3072f (diff) |
Updated info / help.
-rw-r--r-- | README.md | 45 | ||||
-rw-r--r-- | asgd.lua | 2 | ||||
-rw-r--r-- | cg.lua | 54 | ||||
-rw-r--r-- | sgd.lua | 2 |
4 files changed, 70 insertions, 33 deletions
@@ -1,16 +1,30 @@ -# optim: an optimization package for Torch7 +Optim: an optimization package for Torch7 +========================================= -## Requirements +Requirements +------------ * Torch7 (www.torch.ch) -## Installation +Installation +------------ * Install Torch7 (refer to its own documentation). -* clone this project into dev directory of Torch7. -* Rebuild torch, it will include new projects too. +* Use `torch-pkg` to install optim: -## Info +``` +torch-pkg install optim +``` + +or from these sources: + +``` +cd optim; +torch-pkg deploy +``` + +Info +---- This package contains several optimization routines for Torch7. @@ -26,3 +40,22 @@ with: * x* : the new parameter vector that minimizes f, x* = argmin_x f(x) * {f} : a table of all f values, in the order they've been evaluated (for some simple algorithms, like SGD, #f == 1) + +Important Note: the state table is used to hold the state of the algorithm. +It's usually initialized once, by the user, and then passed to the optim function +as a black box. Example: + +```lua +state = { + learningRate = 1e-3, + momentum = 0.5 +} + +for i,sample in ipairs(training_samples) do + local func = function(x) + -- define eval function + return f,df_dx + end + optim.sgd(func,x,state) +end +``` @@ -26,6 +26,8 @@ -- f(x) : the function, evaluated before the update -- ax : the averaged x vector -- +-- (Clement Farabet, 2012) +-- function optim.asgd(opfunc, x, state) -- (0) get/update state local state = state or {} @@ -11,11 +11,11 @@ -- ARGS: -- opfunc : a function that takes a single input, the point of evaluation. -- x : the initial point --- params : a table of parameters and temporary allocations. 
--- params.maxEval : max number of function evaluations --- params.maxIter : max number of iterations --- params.df[0,1,2,3] : if you pass torch.Tensor they will be used for temp storage --- params.[s,x0] : if you pass torch.Tensor they will be used for temp storage +-- state : a table of parameters and temporary allocations. +-- state.maxEval : max number of function evaluations +-- state.maxIter : max number of iterations +-- state.df[0,1,2,3] : if you pass torch.Tensor they will be used for temp storage +-- state.[s,x0] : if you pass torch.Tensor they will be used for temp storage -- -- RETURN: -- x* : the new x vector, at the optimal point @@ -25,19 +25,19 @@ -- -- (Koray Kavukcuoglu, 2012) -- -function optim.cg(opfunc, x, params) +function optim.cg(opfunc, x, state) -- parameters - local params = params or {} - local rho = params.rho or 0.01 - local sig = params.sig or 0.5 - local int = params.int or 0.1 - local ext = params.ext or 3.0 - local maxIter = params.maxIter or 20 - local ratio = params.ratio or 100 - local maxEval = params.maxEval or maxIter*1.25 + local state = state or {} + local rho = state.rho or 0.01 + local sig = state.sig or 0.5 + local int = state.int or 0.1 + local ext = state.ext or 3.0 + local maxIter = state.maxIter or 20 + local ratio = state.ratio or 100 + local maxEval = state.maxEval or maxIter*1.25 local red = 1 - local verbose = params.verbose or 0 + local verbose = state.verbose or 0 local i = 0 local ls_failed = 0 @@ -48,9 +48,9 @@ function optim.cg(opfunc, x, params) local d1,d2,d3 = 0,0,0 local f1,f2,f3 = 0,0,0 - local df1 = params.df1 or torch.Tensor() - local df2 = params.df2 or torch.Tensor() - local df3 = params.df3 or torch.Tensor() + local df1 = state.df1 or torch.Tensor() + local df2 = state.df2 or torch.Tensor() + local df3 = state.df3 or torch.Tensor() local tdf df1:resizeAs(x) @@ -58,13 +58,13 @@ function optim.cg(opfunc, x, params) df3:resizeAs(x) -- search direction - local s = params.s or torch.Tensor() + local s = 
state.s or torch.Tensor() s:resizeAs(x) -- we need a temp storage for X - local x0 = params.x0 or torch.Tensor() + local x0 = state.x0 or torch.Tensor() local f0 = 0 - local df0 = params.df0 or torch.Tensor() + local df0 = state.df0 or torch.Tensor() x0:resizeAs(x) df0:resizeAs(x) @@ -192,11 +192,11 @@ function optim.cg(opfunc, x, params) ls_failed = 1 end end - params.df0 = df0 - params.df1 = df1 - params.df2 = df2 - params.df3 = df3 - params.x0 = x0 - params.s = s + state.df0 = df0 + state.df1 = df1 + state.df2 = df2 + state.df3 = df3 + state.x0 = x0 + state.s = s return x,fx,i end @@ -17,6 +17,8 @@ -- x : the new x vector -- f(x) : the function, evaluated before the update -- +-- (Clement Farabet, 2012) +-- function optim.sgd(opfunc, x, state) -- (0) get/update state local state = state or {} |