coder.py can write and run code (#2439)

* wip mistral

* coder

* touchups

* cleanups

* mistral cleanups

* clean up cache create

* download the weights, fix tests

* fix llama loading

* global fixup

* clean up all

* move llama model

* cleanups

* Revert "cleanups"

This reverts commit a71c5d59eb.

* fine, leave it

Author: George Hotz
Date: 2023-11-25 12:27:54 -08:00
Committed by: GitHub
Parent: df41a57e09
Commit: 7170a9a057
10 changed files with 334 additions and 167 deletions


@@ -86,7 +86,7 @@ class TestInferenceMinKernels(unittest.TestCase):
   def test_llama(self):
     from examples.llama import Transformer
     from tinygrad.shape.symbolic import Variable
-    args_tiny = {"dim": 512, "multiple_of": 256, "n_heads": 8, "n_layers": 4, "norm_eps": 1e-05, "vocab_size": 1000}
+    args_tiny = {"dim": 512, "hidden_dim": 1024, "n_heads": 8, "n_layers": 4, "norm_eps": 1e-05, "vocab_size": 1000}
     model = Transformer(**args_tiny)
     for p in get_parameters(model): p.assign(np.zeros(p.shape, dtype=p.dtype.np))
     with CLCache(100):
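
The changed line swaps the multiple_of key for an explicit hidden_dim in the tiny test config, so the feed-forward width is passed directly instead of being derived. For context, here is a minimal sketch of how LLaMA-style code conventionally computes the FFN hidden dimension from dim and multiple_of; this is an assumption about the usual formula, not code taken from this commit.

# Sketch (assumption): the conventional LLaMA feed-forward sizing rule, shown
# only to illustrate what passing hidden_dim directly replaces in this test.
def ffn_hidden_dim(dim: int, multiple_of: int) -> int:
  hidden = 4 * dim               # expand the model dim by 4x
  hidden = int(2 * hidden / 3)   # SwiGLU keeps roughly two thirds of that
  # round up to the nearest multiple of `multiple_of`
  return multiple_of * ((hidden + multiple_of - 1) // multiple_of)

print(ffn_hidden_dim(512, 256))  # -> 1536 under the old args; the new args pin hidden_dim=1024 explicitly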