[FRONTEND] Expose the register usage and spill information through CompiledKernel (#1296)

This commit is contained in:
shunting314
2023-03-07 17:30:31 -08:00
committed by GitHub
parent 773c29cfaa
commit f5c9f9b4b5

View File

@@ -1725,6 +1725,8 @@ class CompiledKernel:
if self.shared > max_shared:
raise OutOfResources(self.shared, max_shared, "shared memory")
mod, func, n_regs, n_spills = cuda_utils.load_binary(self.metadata["name"], self.asm["cubin"], self.shared, device)
self.n_spills = n_spills
self.n_regs = n_regs
self.cu_module = mod
self.cu_function = func