remove retain_graph in Tensor.backward [pr] (#8835)

retain_graph was not used; gradient accumulation works directly without it
chenyu
2025-01-31 13:41:26 -05:00
committed by GitHub
parent 0a59db936a
commit 1f730ae8f8
3 changed files with 10 additions and 12 deletions

@@ -63,17 +63,16 @@ class TestTinygrad(unittest.TestCase):
       np.testing.assert_allclose(x, y, atol=1e-5)
   # A simple test is to check that we can accumulate gradients (run backward twice or more times)
-  # This will only work if retain_graph works.
-  def test_retain_graph(self):
+  def test_accumulate_gradients(self):
     x = Tensor(x_init, requires_grad=True)
     W = Tensor(W_init, requires_grad=True)
     m = Tensor(m_init)
     out = x.dot(W).relu()
     out = out.log_softmax()
     out = out.mul(m).add(m).sum()
-    out.backward(retain_graph=True)
+    out.backward()
     xgrad,wgrad = x.grad, W.grad
-    out.backward(retain_graph=True)
+    out.backward()
     xgrad2,wgrad2 = x.grad, W.grad
     out.backward() # no need to retain again since we will not re-run backward
     xgrad3,wgrad3 = x.grad, W.grad
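
For context, below is a minimal sketch (not part of this commit) of the behavior the renamed test checks: with retain_graph gone, calling Tensor.backward() repeatedly simply accumulates into .grad. The shapes, the random inputs, and the 3x check are illustrative assumptions rather than values from the real test, which uses x_init/W_init/m_init.

# Sketch only: gradients accumulate across repeated backward() calls,
# assuming a tinygrad version with this PR merged.
import numpy as np
from tinygrad import Tensor

np.random.seed(0)
x = Tensor(np.random.randn(3, 3).astype(np.float32), requires_grad=True)
W = Tensor(np.random.randn(3, 3).astype(np.float32), requires_grad=True)

out = x.dot(W).relu().sum()
out.backward()            # first pass populates x.grad and W.grad
g1 = W.grad.numpy()       # materialize a copy of the single-pass gradient
out.backward()            # second pass: no retain_graph flag, grads just add up
out.backward()            # third pass
# after three passes the accumulated gradient should be ~3x the single-pass one
np.testing.assert_allclose(W.grad.numpy(), 3 * g1, atol=1e-5)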