Now handles the case where a module whose input is a table has multiple successors.

[dagnn.git] / test-dagnn.lua
diff --git a/test-dagnn.lua b/test-dagnn.lua

index 1df04e2..f7de819 100755 (executable)
--- a/test-dagnn.lua
+++ b/test-dagnn.lua
@@ -23,9 +23,8 @@ require 'torch'
  require 'nn'
  require 'dagnn'
  
  require 'nn'
  require 'dagnn'
  
--- torch.setnumthreads(params.nbThreads)
  torch.setdefaulttensortype('torch.DoubleTensor')
  torch.setdefaulttensortype('torch.DoubleTensor')
-torch.manualSeed(2)
+torch.manualSeed(1)
  
  function checkGrad(model, criterion, input, target)
     local params, gradParams = model:getParameters()
  
  function checkGrad(model, criterion, input, target)
     local params, gradParams = model:getParameters()
@@ -39,6 +38,8 @@ function checkGrad(model, criterion, input, target)
     model:backward(input, gradOutput)
     local analyticalGradParam = gradParams:clone()
  
     model:backward(input, gradOutput)
     local analyticalGradParam = gradParams:clone()
  
+   local err = 0
+
     for i = 1, params:size(1) do
        local x = params[i]
  
     for i = 1, params:size(1) do
        local x = params[i]
  
@@ -54,23 +55,13 @@ function checkGrad(model, criterion, input, target)
  
        local ana = analyticalGradParam[i]
        local num = (loss1 - loss0) / (2 * epsilon)
  
        local ana = analyticalGradParam[i]
        local num = (loss1 - loss0) / (2 * epsilon)
-      local err
  
  
-      if num == ana then
-         err = 0
-      else
-         err = torch.abs(num - ana) / torch.abs(num)
+      if num ~= ana then
+         err = math.max(err, torch.abs(num - ana) / torch.abs(num))
        end
        end
-
-      print(
-         'CHECK '
-            .. err
-            .. ' checkGrad ' .. i
-            .. ' analytical ' .. ana
-            .. ' numerical ' .. num
-      )
     end
  
     end
  
+   return err
  end
  
  function printTensorTable(t)
  end
  
  function printTensorTable(t)
@@ -84,39 +75,41 @@ function printTensorTable(t)
     end
  end
  
     end
  end
  
---                     +--> c ----> e --+
---                    /            /     \
---                   /            /       \
---  input --> a --> b ---> d ----+         g --> output
---                          \             /
---                           \           /
---                            +--> f ---+
+--               +-- Linear(10, 15) --> ReLU --> d -->
+--              /                               /
+--             /                               /
+--  --> a --> b -----------> c ---------------+
+--                            \
+--                             \
+--                              +--------------- e -->
+
+dag = nn.DAG()
  
  a = nn.Linear(50, 10)
  b = nn.ReLU()
  c = nn.Linear(10, 15)
  
  a = nn.Linear(50, 10)
  b = nn.ReLU()
  c = nn.Linear(10, 15)
-d = nn.Linear(10, 15)
-e = nn.CMulTable()
-f = nn.Linear(15, 15)
-g = nn.CAddTable()
+d = nn.CMulTable()
+e = nn.Mul(-1)
  
  
-model = nn.DAG()
+dag:connect(a, b, c)
+dag:connect(b, nn.Linear(10, 15), nn.ReLU(), d)
+dag:connect(c, d)
+dag:connect(c, e)
  
  
-model:addEdge(a, b)
-model:addEdge(b, c)
-model:addEdge(b, d)
-model:addEdge(c, e)
-model:addEdge(d, e)
-model:addEdge(d, f)
-model:addEdge(e, g)
-model:addEdge(f, g)
+dag:setInput(a)
+dag:setOutput({ d, e })
  
  
-model:setInput(a)
-model:setOutput(g)
+-- We check that it works when it is put into an nn.Sequential
+model = nn.Sequential()
+   :add(nn.Linear(50, 50))
+   :add(dag)
+   :add(nn.CAddTable())
  
  local input = torch.Tensor(30, 50):uniform()
  local output = model:updateOutput(input):clone()
  
  local input = torch.Tensor(30, 50):uniform()
  local output = model:updateOutput(input):clone()
-
  output:uniform()
  
  output:uniform()
  
-checkGrad(model, nn.MSECriterion(), input, output)
+print('Gradient estimate error ' .. checkGrad(model, nn.MSECriterion(), input, output))
+
+print('Writing /tmp/graph.dot')
+dag:saveDot('/tmp/graph.dot')