
Commit

Fix zero gradient for subtensor assignment.
The variable being assigned has its gradient correctly computed (g[k]), but later, when the gradient of the variable being assigned to is computed, g[k] is set to 0. That gives the correct gradient for the variable being assigned to, but because the two gradients share the same storage, it also incorrectly overwrites the earlier gradient with zeros. This commit fixes that by cloning the gradient slice before returning it.
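
A minimal sketch of the aliasing problem in plain Torch, outside of autograd (the tensors and names below are illustrative, not the library's internals):

local torch = require 'torch'

-- g stands in for the incoming gradient in the reverse pass.
local g = torch.ones(3, 4)

-- The gradient w.r.t. the assigned value is the slice g[k]; indexing a
-- tensor returns a view that shares storage with g.
local grad_v = g[2]

-- Later, the gradient w.r.t. the tensor being assigned to zeroes that slice,
-- which silently clobbers the gradient returned above:
g[2] = 0
print(grad_v:sum())   -- 0

-- Cloning the slice first, as this commit does, breaks the aliasing:
local g2 = torch.ones(3, 4)
local grad_v2 = g2[2]:clone()
g2[2] = 0
print(grad_v2:sum())  -- 4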
bartvm committed May 27, 2016
1 parent ff0057f commit 0d31b91
Showing 2 changed files with 11 additions and 1 deletion.
7 changes: 6 additions & 1 deletion src/gradfuns.lua
@@ -152,7 +152,12 @@ functions.set = {
       return nil
    end,
    function(g, ans, x, k, v)
-      return g[k]
+      local gk = getValue(g[k])
+      if type(gk) == 'number' then
+         return gk
+      else
+         return torch.clone(gk)
+      end
    end,
 }
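Note on the number branch above: Lua numbers are copied by value, so when the selected gradient element is a scalar it cannot alias g and can be returned directly; only when g[k] is a tensor does it share storage with g and need to be cloned.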

5 changes: 5 additions & 0 deletions test/test.lua
@@ -1687,6 +1687,11 @@ local tests = {
          return torch.sum(xc)
       end
       tester:assert(gradcheck(f4,{x=torch.randn(10,10),y=torch.randn(3)}), "Incorrect gradient")
+      local f5 = function(params)
+         params.x[2] = params.y*2.0
+         return torch.sum(params.x)
+      end
+      tester:assert(gradcheck(f5,{x=torch.randn(10,10),y=torch.randn(10)}), "Incorrect gradient")
    end,
 
    ScalarSigmoid = function()
