diff --git a/tinygrad/runtime/ops_cuda.py b/tinygrad/runtime/ops_cuda.py index 7f8fc265ba..2c3d9e8781 100644 --- a/tinygrad/runtime/ops_cuda.py +++ b/tinygrad/runtime/ops_cuda.py @@ -24,7 +24,7 @@ class CUDAProgram: global_size = global_size + [1] * (3 - len(global_size)) assert all(x%y == 0 for x,y in zip(global_size, local_size)), f"local:{local_size} must divide global:{global_size}" global_size = [x//y for x,y in zip(global_size, local_size)] - self.prg(*args, block=tuple(local_size), grid=tuple(global_size)) + self.prg(*[x._cl for x in args], block=tuple(local_size), grid=tuple(global_size)) class CUDACodegen(GPUCodegen): lang = GPULanguage(