Skip to content

Commit 9b9c1e1

Browse files
authored
Late MTLCompiler load (tinygrad#8963)
Moved loading MTLCompiler (and trying to load normal llvm before it) to MetalCompiler, like in CPUProgram with helper
1 parent a3c78d4 commit 9b9c1e1

File tree

1 file changed

+11
-11
lines changed

1 file changed

+11
-11
lines changed

tinygrad/runtime/ops_metal.py

+11-11
Original file line numberDiff line numberDiff line change
@@ -4,13 +4,6 @@
44
from tinygrad.device import Compiled, Compiler, CompileError, LRUAllocator, cpu_profile, ProfileDeviceEvent, ProfileRangeEvent
55
from tinygrad.renderer.cstyle import MetalRenderer
66

7-
# Opening METAL after LLVM doesn't fail because ctypes.CDLL opens with RTLD_LOCAL but MTLCompiler opens it's own llvm with RTLD_GLOBAL
8-
# This means that MTLCompiler's llvm will create it's own instances of global state because RTLD_LOCAL doesn't export symbols, but if RTLD_GLOBAL
9-
# library is loaded first then RTLD_LOCAL library will just use it's symbols. On linux there is RTLD_DEEPBIND to prevent that, but on macos there
10-
# doesn't seem to be anything we can do.
11-
with contextlib.suppress(FileNotFoundError):
12-
import tinygrad.runtime.autogen.llvm # noqa: F401
13-
147
class objc_id(ctypes.c_void_p): # This prevents ctypes from converting response to plain int, and dict.fromkeys() can use it to dedup
158
def __hash__(self): return hash(self.value)
169
def __eq__(self, other): return self.value == other.value
@@ -34,14 +27,12 @@ class MTLPipelineOption:
3427

3528
libobjc = ctypes.CDLL("/usr/lib/libobjc.dylib")
3629
libmetal = ctypes.CDLL("/System/Library/Frameworks/Metal.framework/Metal")
37-
compiler = ctypes.CDLL("/System/Library/PrivateFrameworks/MTLCompiler.framework/MTLCompiler")
3830
# Must be loaded for default Metal Device: https://developer.apple.com/documentation/metal/1433401-mtlcreatesystemdefaultdevice?language=objc
3931
ctypes.CDLL("/System/Library/Frameworks/CoreGraphics.framework/CoreGraphics")
4032
libdispatch = ctypes.CDLL("/usr/lib/libSystem.dylib") # libdispatch is part of libSystem on mac
4133
libobjc.objc_getClass.restype = objc_id
4234
libobjc.sel_registerName.restype = objc_id
4335
libmetal.MTLCreateSystemDefaultDevice.restype = objc_instance
44-
compiler.MTLCodeGenServiceCreate.restype = ctypes.c_void_p
4536
libdispatch.dispatch_data_create.restype = objc_instance
4637

4738
@functools.lru_cache(None)
@@ -102,8 +93,17 @@ def metal_src_to_library(device:MetalDevice, src:str) -> objc_instance:
10293
return library
10394

10495
class MetalCompiler(Compiler):
96+
# Opening METAL after LLVM doesn't fail because ctypes.CDLL opens with RTLD_LOCAL but MTLCompiler opens it's own llvm with RTLD_GLOBAL
97+
# This means that MTLCompiler's llvm will create it's own instances of global state because RTLD_LOCAL doesn't export symbols, but if RTLD_GLOBAL
98+
# library is loaded first then RTLD_LOCAL library will just use it's symbols. On linux there is RTLD_DEEPBIND to prevent that, but on macos there
99+
# doesn't seem to be anything we can do.
100+
with contextlib.suppress(FileNotFoundError):
101+
import tinygrad.runtime.autogen.llvm # noqa: F401
102+
support = ctypes.CDLL("/System/Library/PrivateFrameworks/MTLCompiler.framework/MTLCompiler")
103+
support.MTLCodeGenServiceCreate.restype = ctypes.c_void_p
104+
105105
def __init__(self):
106-
self.cgs = ctypes.c_void_p(compiler.MTLCodeGenServiceCreate(b"tinygrad"))
106+
self.cgs = ctypes.c_void_p(MetalCompiler.support.MTLCodeGenServiceCreate(b"tinygrad"))
107107
super().__init__("compile_metal_direct")
108108
def __reduce__(self): return (MetalCompiler,()) # force pickle to create new instance for each multiprocessing fork
109109
def compile(self, src:str) -> bytes:
@@ -127,7 +127,7 @@ def callback(blockptr, error, dataPtr, dataLen, errorMessage):
127127
# See https://clang.llvm.org/docs/Block-ABI-Apple.html#high-level for struct layout.
128128
# Fields other than invoke are unused in this case so we can just use ctypes.byref with negative offset to invoke field, add blockptr as a first
129129
# argument and pretend it's a normal callback
130-
compiler.MTLCodeGenServiceBuildRequest(self.cgs, None, REQUEST_TYPE_COMPILE, request, len(request), ctypes.byref(callback, -0x10))
130+
MetalCompiler.support.MTLCodeGenServiceBuildRequest(self.cgs, None, REQUEST_TYPE_COMPILE, request, len(request), ctypes.byref(callback, -0x10))
131131
if isinstance(ret, Exception): raise ret
132132
assert ret[:4] == b"MTLB" and ret[-4:] == b"ENDT", f"Invalid Metal library. {ret!r}"
133133
return ret

0 commit comments

Comments
 (0)