From 12b04efd691e247a82aba2bc61e11aa61bc0198f Mon Sep 17 00:00:00 2001
From: chenyu <chenyu@fastmail.com>
Date: Sat, 12 Jul 2025 10:16:56 -0400
Subject: [PATCH] remove a TODO prod(k.full_shape[k.first_upcast:]) (#11191)

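IMAGE=2 test/test_ops.py now passes without the extra
prod(k.full_shape[k.first_upcast:]) factor in the masked-axis upcast
check, so the factor and the TODO describing the bug are removed.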
---
 tinygrad/opt/heuristic.py | 5 +----
 1 file changed, 1 insertion(+), 4 deletions(-)

diff --git a/tinygrad/opt/heuristic.py b/tinygrad/opt/heuristic.py
index 73a8611531..2b6a90df8f 100644
--- a/tinygrad/opt/heuristic.py
+++ b/tinygrad/opt/heuristic.py
@@ -53,9 +53,6 @@ def hand_coded_optimizations(k:Kernel) -> list[Opt]:
 
   # **** below this line need to be optional and benchmarked ****
 
-  # TODO: doing extra upcasts with images doesn't work for some reason (maybe has to do with to_image_idx)
-  # to trigger the above bug, remove prod(k.full_shape[k.first_upcast:]) from the below
-  # expression and run test/test_ops.py with IMAGE=2
   # if there are small dims with lots of valid masks, upcast them (they might be from Tensor.stack)
   # this can be made much smarter
   to_upcast: list[int] = []
@@ -64,7 +61,7 @@ def hand_coded_optimizations(k:Kernel) -> list[Opt]:
     # we might want to be able to split axes that are masked, or refuse to merge them in simplify_merge_adjacent
     # for now skip upcasting here if there is a symbolic axis
     if isinstance(k.full_shape[axis], int) and k.full_shape[axis] <= 7 and any(st.axis_is_masked(axis) for st in k.sts) and \
-      prod(k.full_shape[k.first_upcast:]) * prod(k.full_shape[j] for j in to_upcast) * k.full_shape[axis] <= 7 * 7:
+      prod(k.full_shape[j] for j in to_upcast) * k.full_shape[axis] <= 7 * 7:
       if DEBUG >= 4: print(f"upcasting masked axis : {axis}")
       to_upcast.append(axis)
   for axis in to_upcast[::-1]: k.apply_opt(Opt(OptOps.UPCAST, axis, 0))