diff --git a/tinygrad/engine/realize.py b/tinygrad/engine/realize.py index 0fbbe7cd40..a621b6cdb8 100644 --- a/tinygrad/engine/realize.py +++ b/tinygrad/engine/realize.py @@ -41,7 +41,7 @@ class CompiledRunner(Runner): if DEBUG >= 4: print(p.src) self.p:ProgramSpec = p self.lib:bytes = precompiled if precompiled is not None else Device[p.device].compiler.compile_cached(p.src) - if DEBUG >= 6: Device[p.device].compiler.disassemble(self.lib) + if DEBUG >= 7: Device[p.device].compiler.disassemble(self.lib) self._prg = Device[p.device].runtime(p.function_name, self.lib) super().__init__(p.name, p.device, p.estimates) diff --git a/tinygrad/runtime/ops_cuda.py b/tinygrad/runtime/ops_cuda.py index 0f4988412e..c39ab667e3 100644 --- a/tinygrad/runtime/ops_cuda.py +++ b/tinygrad/runtime/ops_cuda.py @@ -34,7 +34,7 @@ class CUDAProgram: def __init__(self, dev:CUDADevice, name:str, lib:bytes, smem:int=0): self.dev, self.name, self.lib, self.smem = dev, name, lib, smem if DEBUG >= 5: print("\n".join([f"{i+1:>3} {line}" for i, line in enumerate(pretty_ptx(lib.decode('utf-8')).split("\n"))])) - if DEBUG >= 6: cuda_disassemble(lib, dev.arch) + if DEBUG >= 7: cuda_disassemble(lib, dev.arch) check(cuda.cuCtxSetCurrent(self.dev.context)) self.module = cuda.CUmodule()