lower schedule (#2559)

* lower schedule

* remove RAND, and don't put load in the JIT yet

* better fix for that test
This commit is contained in:
George Hotz
2023-12-01 19:17:46 -08:00
committed by GitHub
parent 077567f62d
commit 6733425095
9 changed files with 105 additions and 93 deletions

View File

@@ -88,8 +88,9 @@ class TestInferenceMinKernels(unittest.TestCase):
args_tiny = {"dim": 512, "hidden_dim": 1024, "n_heads": 8, "n_layers": 4, "norm_eps": 1e-05, "vocab_size": 1000}
model = Transformer(**args_tiny)
for p in get_parameters(model): p.assign(np.zeros(p.shape, dtype=p.dtype.np))
+ inp = Tensor([[1,2,3,4]])
  with CLCache(100):
- model(Tensor([[1,2,3,4]]), 0).realize()
+ model(inp, 0).realize()
@unittest.skipUnless(Device.DEFAULT == "GPU", "Not Implemented")
class TestOptBinOp(unittest.TestCase):