Disable logging in early compile2 and lower kernel counts (#2090)

* Revert "Revert "openpilot kernel fix from 209 to 207 (#2006)" (#2065)" This reverts commit 924ecc4d6a. * gate behind OPT >= 4 * disable_logging in schedule * simple * from master * more images * revert that * 206 kernels
2026-01-08 22:48:25 -05:00 · 2023-10-16 20:15:24 -07:00
parent 442a27db8a
commit 5a4a62ecae
5 changed files with 19 additions and 10 deletions
--- a/test/external/external_test_opt.py
+++ b/test/external/external_test_opt.py
@@ -64,7 +64,7 @@ class TestInferenceMinKernels(unittest.TestCase):
    for p in get_parameters(model): p.assign(np.zeros(p.shape, dtype=p.dtype.np))
    img = Tensor.randn(1, 3, 224, 224)
    # TODO: this seems very high
-    with CLCache(116):
+    with CLCache(115):
      model.forward(img).realize()

  def test_resnet(self):
@@ -78,7 +78,7 @@ class TestInferenceMinKernels(unittest.TestCase):
    model = ViT(embed_dim=192, num_heads=3)
    for p in get_parameters(model): p.assign(np.zeros(p.shape, dtype=p.dtype.np))
    img = Tensor.randn(1, 3, 224, 224)
-    with CLCache(223): # NOTE: this is way too high
+    with CLCache(222): # NOTE: this is way too high
      out = model.forward(img)
      assert len(CacheCollector.cache) == 0, "ViT prerealized?"
      out.realize()
@@ -88,7 +88,7 @@ class TestInferenceMinKernels(unittest.TestCase):
    args_tiny = {"dim": 512, "multiple_of": 256, "n_heads": 8, "n_layers": 4, "norm_eps": 1e-05, "vocab_size": 1000}
    model = Transformer(**args_tiny)
    for p in get_parameters(model): p.assign(np.zeros(p.shape, dtype=p.dtype.np))
-    with CLCache(94):
+    with CLCache(85):
      model(Tensor([[1,2,3,4]]), 0).realize()

@unittest.skipUnless(Device.DEFAULT == "GPU", "Not Implemented")