mirror of
https://github.com/tinygrad/tinygrad.git
synced 2026-04-29 03:00:14 -04:00
* start new rdna4 * work * plus works * more pass * rdna4 * assembly/amd: fix RDNA4 emulator for float16 and VOP3 clamp * stale * rev * rr * rdna4 emu tests * cleanup * cleanup * simp * works * better factorization * hacks * fix mockgpu * guard both * cleaner * gate * bug fix and a few tests * all test_tiny
45 lines
2.2 KiB
Python
45 lines
2.2 KiB
Python
import ctypes, ctypes.util
|
|
from tinygrad.helpers import getenv
|
|
|
|
def _try_dlopen_gpuocelot():
|
|
GPUOCELOT_PATHS = [ctypes.util.find_library("gpuocelot")] if ctypes.util.find_library("gpuocelot") is not None else []
|
|
GPUOCELOT_PATHS += ["libgpuocelot.so", "/usr/local/lib/libgpuocelot.so",
|
|
"libgpuocelot.dylib", "/usr/local/lib/libgpuocelot.dylib", "/opt/homebrew/lib/libgpuocelot.dylib"]
|
|
for path in GPUOCELOT_PATHS:
|
|
try:
|
|
gpuocelot_lib = ctypes.CDLL(path)
|
|
gpuocelot_lib.ptx_run.argtypes = [ctypes.c_char_p, ctypes.c_int, ctypes.POINTER(ctypes.c_void_p), ctypes.c_int, ctypes.c_int,
|
|
ctypes.c_int, ctypes.c_int, ctypes.c_int, ctypes.c_int, ctypes.c_int]
|
|
except OSError: pass
|
|
else: return gpuocelot_lib
|
|
print("Could not find libgpuocelot.so")
|
|
return None
|
|
|
|
class PythonRemu:
  """Drop-in stand-in for libremu.so backed by the Python RDNA3/RDNA4 emulator.

  It exposes a ``run_asm`` method so it can be used in place of the ctypes handle
  returned for the native library. The settings below are class-level defaults;
  assigning to them on an instance overrides them for that instance only.
  """
  # Not read by any method in this class. NOTE(review): presumably assigned by the
  # caller before run_asm is invoked - confirm against the users of this object.
  valid_mem_ranges: set[tuple[int, int]] = set()
  # Default: USER_SGPR_COUNT=14, enable X and Y workgroup IDs
  rsrc2: int = 0x19c
  # private_segment_fixed_size from kernel descriptor
  scratch_size: int = 0
  # Architecture: rdna3 or rdna4
  arch: str = "rdna3"

  def run_asm(self, lib: int, lib_sz: int, gx: int, gy: int, gz: int, lx: int, ly: int, lz: int, args_ptr: int) -> int:
    """Forward a launch to ``extra.assembly.amd.emu.run_asm`` and return its result.

    The nine call arguments are passed through unchanged and in order, followed by
    this object's ``rsrc2``, ``scratch_size`` and ``arch``.
    """
    # The emulator module is imported on first use rather than at module import time.
    from extra.assembly.amd.emu import run_asm as emu_run_asm
    return emu_run_asm(
      lib, lib_sz,
      gx, gy, gz,
      lx, ly, lz,
      args_ptr,
      self.rsrc2, self.scratch_size, self.arch,
    )
|
|
|
|
def _try_dlopen_remu():
  """Return an emulator backend: the Python wrapper or a dlopen'ed libremu.

  ``PYTHON_REMU`` is read with a default of ``"1"``, so a ``PythonRemu`` instance is
  returned unless the variable is set to a value whose integer form is 0. Only then
  are the native library locations below probed in order; the first one that loads
  has its ``run_asm`` return and argument types declared and is returned.

  Returns:
    A ``PythonRemu`` instance, a configured ``ctypes.CDLL`` handle, or ``None``
    (after printing a message) when the native library could not be loaded.
  """
  use_python_emulator = int(getenv("PYTHON_REMU", "1"))
  if use_python_emulator: return PythonRemu()

  so_candidates = ["extra/remu/target/release/libremu.so", "libremu.so", "/usr/local/lib/libremu.so"]
  dylib_candidates = ["extra/remu/target/release/libremu.dylib", "libremu.dylib", "/usr/local/lib/libremu.dylib",
                      "/opt/homebrew/lib/libremu.dylib"]
  for candidate in so_candidates + dylib_candidates:
    try:
      native = ctypes.CDLL(candidate)
      native.run_asm.restype = ctypes.c_int32
      # one pointer, seven 32-bit unsigned values, one trailing pointer
      native.run_asm.argtypes = [ctypes.c_void_p] + [ctypes.c_uint32] * 7 + [ctypes.c_void_p]
    except OSError:
      continue  # not loadable from this location; try the next one
    return native

  print("Could not find libremu.so")
  return None
|