Skip to content

Commit

Permalink
JITModule: rework/fix __udivdi3 handling
Browse files Browse the repository at this point in the history
The original workaround is very partial,
and was not really working in my experience,
even after making it non-GCC specific.

Instead:
1. Ensure that the library that actually provides that symbol
   (as per the compiler used!) is actually linked into.
   This was not enough still.
2. Replace `HalideJITMemoryManager` hack with a more direct approach
   of actually telling the JIT the address of the symbol.
3. While there, move the symbol's forward definition to outside
   of namespaces. It's a global symbol, it makes sense to place it there.

This makes python binding tests pass on i386,
and i'm really happy about that.

Refs. llvm/llvm-project#61289
Inspired by root-project/root#13286

Forwarded: #8389

Gbp-Pq: Name 0010-JITModule-rework-fix-__udivdi3-handling.patch
  • Loading branch information
LebedevRI committed Aug 11, 2024
1 parent 3cdeb53 commit 9e1b50b
Show file tree
Hide file tree
Showing 2 changed files with 37 additions and 23 deletions.
13 changes: 13 additions & 0 deletions src/CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -550,6 +550,19 @@ if (WITH_SERIALIZATION_JIT_ROUNDTRIP_TESTING)
target_compile_definitions(Halide PRIVATE WITH_SERIALIZATION_JIT_ROUNDTRIP_TESTING)
endif ()

if (NOT DEFINED Halide_COMPILER_BUILTIN_LIBRARY)
execute_process(
COMMAND ${CMAKE_CXX_COMPILER} "--print-libgcc-file-name"
OUTPUT_VARIABLE Halide_COMPILER_BUILTIN_LIBRARY
OUTPUT_STRIP_TRAILING_WHITESPACE
)
endif ()

set(Halide_COMPILER_BUILTIN_LIBRARY "${Halide_COMPILER_BUILTIN_LIBRARY}"
CACHE FILEPATH "Library containing __udivdi3 symbol, either “libgcc.a” or “libclang_rt.builtins.*.a”.")

target_link_libraries(Halide PRIVATE "${Halide_COMPILER_BUILTIN_LIBRARY}")

# Note that we (deliberately) redeclare these versions here, even though the macros
# with identical versions are expected to be defined in source; this allows us to
# ensure that the versions defined between all build systems are identical.
Expand Down
47 changes: 24 additions & 23 deletions src/JITModule.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -23,15 +23,13 @@
#include "Pipeline.h"
#include "WasmExecutor.h"

extern "C" unsigned long __udivdi3(unsigned long a, unsigned long b);

namespace Halide {
namespace Internal {

using std::string;

#if defined(__GNUC__) && defined(__i386__)
extern "C" unsigned long __udivdi3(unsigned long a, unsigned long b);
#endif

#ifdef _WIN32
void *get_symbol_address(const char *s) {
return (void *)GetProcAddress(GetModuleHandle(nullptr), s);
Expand Down Expand Up @@ -135,6 +133,26 @@ void load_webgpu() {
<< "(Try setting the env var HL_WEBGPU_NATIVE_LIB to an explicit path to fix this.)\n";
}

llvm::orc::SymbolMap GetListOfAdditionalSymbols(const llvm::orc::LLJIT &Jit) {
// Inject a number of symbols that may be in libgcc.a where they are
// not found automatically. See also the upstream issue:
// https://github.com/llvm/llvm-project/issues/61289.

static const std::pair<const char *, const void *> NamePtrList[] = {
// NOTE: at least libgcc does not provide this symbol on 64-bit x86_64, only on 32-bit i386.
{"__udivdi3", (((CHAR_BIT * sizeof(void *)) == 32) ? ((void *)&__udivdi3) : nullptr)},
};

llvm::orc::SymbolMap AdditionalSymbols;
for (const auto &NamePtr : NamePtrList) {
auto Addr = static_cast<llvm::orc::ExecutorAddr>(
reinterpret_cast<uintptr_t>(NamePtr.second));
AdditionalSymbols[Jit.mangleAndIntern(NamePtr.first)] =
llvm::orc::ExecutorSymbolDef(Addr, llvm::JITSymbolFlags::Exported);
}
return AdditionalSymbols;
}

} // namespace

using namespace llvm;
Expand Down Expand Up @@ -216,25 +234,6 @@ class HalideJITMemoryManager : public SectionMemoryManager {
}
}
uint64_t result = SectionMemoryManager::getSymbolAddress(name);
#if defined(__GNUC__) && defined(__i386__)
// This is a workaround for an odd corner case (cross-compiling + testing
// Python bindings x86-32 on an x86-64 system): __udivdi3 is a helper function
// that GCC uses to do u64/u64 division on 32-bit systems; it's usually included
// by the linker on these systems as needed. When we JIT, LLVM will include references
// to this call; MCJIT fixes up these references by doing (roughly) dlopen(NULL)
// to look up the symbol. For normal JIT tests, this works fine, as dlopen(NULL)
// finds the test executable, which has the right lookups to locate it inside libHalide.so.
// If, however, we are running a JIT-via-Python test, dlopen(NULL) returns the
// CPython executable... which apparently *doesn't* include this as an exported
// function, so the lookup fails and crashiness ensues. So our workaround here is
// a bit icky, but expedient: check for this name if we can't find it elsewhere,
// and if so, return the one we know should be present. (Obviously, if other runtime
// helper functions of this sort crop up in the future, this should be expanded
// into a "builtins map".)
if (result == 0 && name == "__udivdi3") {
result = (uint64_t)&__udivdi3;
}
#endif
internal_assert(result != 0)
<< "HalideJITMemoryManager: unable to find address for " << name << "\n";
return result;
Expand Down Expand Up @@ -350,6 +349,8 @@ void JITModule::compile_module(std::unique_ptr<llvm::Module> m, const string &fu
internal_assert(gen) << llvm::toString(gen.takeError()) << "\n";
JIT->getMainJITDylib().addGenerator(std::move(gen.get()));

cantFail(JIT->getMainJITDylib().define(absoluteSymbols(GetListOfAdditionalSymbols(*JIT))));

llvm::orc::ThreadSafeModule tsm(std::move(m), std::move(jit_module->context));
auto err = JIT->addIRModule(std::move(tsm));
internal_assert(!err) << llvm::toString(std::move(err)) << "\n";
Expand Down

0 comments on commit 9e1b50b

Please sign in to comment.