xenocara/lib/mesa/src/amd/llvm/ac_llvm_helper.cpp

/*
 * Copyright 2014 Advanced Micro Devices, Inc.
 *
 * SPDX-License-Identifier: MIT
 */

#include <llvm-c/Core.h>
#include <llvm/Analysis/TargetLibraryInfo.h>
#include <llvm/IR/IRBuilder.h>
#include <llvm/IR/LegacyPassManager.h>
#include <llvm/IR/Verifier.h>
#include <llvm/Target/TargetMachine.h>
#include <llvm/MC/MCSubtargetInfo.h>
#include <llvm/Support/CommandLine.h>
#include <llvm/Transforms/IPO.h>
#include <llvm/Transforms/Scalar.h>
#include <llvm/Transforms/Utils.h>
#include <llvm/CodeGen/Passes.h>
#include <llvm/Transforms/IPO/AlwaysInliner.h>
#include <llvm/Transforms/InstCombine/InstCombine.h>
#include <llvm/Transforms/IPO/SCCP.h>
#include "llvm/CodeGen/SelectionDAGNodes.h"

#include <cstring>

/* DO NOT REORDER THE HEADERS
 * The LLVM headers need to all be included before any Mesa header,
 * as they use the `restrict` keyword in ways that are incompatible
 * with our #define in include/c99_compat.h
 */

#include "ac_binary.h"
#include "ac_llvm_util.h"
#include "ac_llvm_build.h"
#include "util/macros.h"

using namespace llvm;

class RunAtExitForStaticDestructors : public SDNode
{
public:
   /* getSDVTList (protected) calls getValueTypeList (private), which contains static variables. */
   RunAtExitForStaticDestructors(): SDNode(0, 0, DebugLoc(), getSDVTList(MVT::Other))
   {
   }
};

void ac_llvm_run_atexit_for_destructors(void)
{
   /* LLVM >= 16 registers static variable destructors on the first compile, which gcc
    * implements by calling atexit there. Before that, u_queue registers its atexit
    * handler to kill all threads. Since exit() runs atexit handlers in the reverse order,
    * the LLVM destructors are called first while shader compiler threads may still be
    * running, which crashes in LLVM in SelectionDAG.cpp.
    *
    * The solution is to run the code that declares the LLVM static variables first,
    * so that atexit for LLVM is registered first and u_queue is registered after that,
    * which ensures that all u_queue threads are terminated before LLVM destructors are
    * called.
    *
    * This just executes the code that declares static variables.
    */
   RunAtExitForStaticDestructors();
}

bool ac_is_llvm_processor_supported(LLVMTargetMachineRef tm, const char *processor)
{
   TargetMachine *TM = reinterpret_cast<TargetMachine *>(tm);
   return TM->getMCSubtargetInfo()->isCPUStringValid(processor);
}

void ac_reset_llvm_all_options_occurrences()
{
   cl::ResetAllOptionOccurrences();
}

void ac_add_attr_dereferenceable(LLVMValueRef val, uint64_t bytes)
{
   Argument *A = unwrap<Argument>(val);
   A->addAttr(Attribute::getWithDereferenceableBytes(A->getContext(), bytes));
}

void ac_add_attr_alignment(LLVMValueRef val, uint64_t bytes)
{
   Argument *A = unwrap<Argument>(val);
   A->addAttr(Attribute::getWithAlignment(A->getContext(), Align(bytes)));
}

bool ac_is_sgpr_param(LLVMValueRef arg)
{
   Argument *A = unwrap<Argument>(arg);
   AttributeList AS = A->getParent()->getAttributes();
   unsigned ArgNo = A->getArgNo();
   return AS.hasParamAttr(ArgNo, Attribute::InReg);
}

LLVMModuleRef ac_create_module(LLVMTargetMachineRef tm, LLVMContextRef ctx)
{
   TargetMachine *TM = reinterpret_cast<TargetMachine *>(tm);
   LLVMModuleRef module = LLVMModuleCreateWithNameInContext("mesa-shader", ctx);

   unwrap(module)->setTargetTriple(TM->getTargetTriple().getTriple());
   unwrap(module)->setDataLayout(TM->createDataLayout());
   return module;
}

LLVMBuilderRef ac_create_builder(LLVMContextRef ctx, enum ac_float_mode float_mode)
{
   LLVMBuilderRef builder = LLVMCreateBuilderInContext(ctx);

   FastMathFlags flags;

   switch (float_mode) {
   case AC_FLOAT_MODE_DEFAULT:
   case AC_FLOAT_MODE_DENORM_FLUSH_TO_ZERO:
      break;

   case AC_FLOAT_MODE_DEFAULT_OPENGL:
      /* Allow optimizations to treat the sign of a zero argument or
       * result as insignificant.
       */
      flags.setNoSignedZeros(); /* nsz */

      /* Allow optimizations to use the reciprocal of an argument
       * rather than perform division.
       */
      flags.setAllowReciprocal(); /* arcp */

      unwrap(builder)->setFastMathFlags(flags);
      break;
   }

   return builder;
}

void ac_enable_signed_zeros(struct ac_llvm_context *ctx)
{
   if (ctx->float_mode == AC_FLOAT_MODE_DEFAULT_OPENGL) {
      auto *b = unwrap(ctx->builder);
      FastMathFlags flags = b->getFastMathFlags();

      /* This disables the optimization of (x + 0), which is used
       * to convert negative zero to positive zero.
       */
      flags.setNoSignedZeros(false);
      b->setFastMathFlags(flags);
   }
}

void ac_disable_signed_zeros(struct ac_llvm_context *ctx)
{
   if (ctx->float_mode == AC_FLOAT_MODE_DEFAULT_OPENGL) {
      auto *b = unwrap(ctx->builder);
      FastMathFlags flags = b->getFastMathFlags();

      flags.setNoSignedZeros();
      b->setFastMathFlags(flags);
   }
}

LLVMTargetLibraryInfoRef ac_create_target_library_info(const char *triple)
{
   return reinterpret_cast<LLVMTargetLibraryInfoRef>(
      new TargetLibraryInfoImpl(Triple(triple)));
}

void ac_dispose_target_library_info(LLVMTargetLibraryInfoRef library_info)
{
   delete reinterpret_cast<TargetLibraryInfoImpl *>(library_info);
}

/* Implementation of raw_pwrite_stream that works on malloc()ed memory for
 * better compatibility with C code. */
struct raw_memory_ostream : public raw_pwrite_stream {
   char *buffer;
   size_t written;
   size_t bufsize;

   raw_memory_ostream()
   {
      buffer = NULL;
      written = 0;
      bufsize = 0;
      SetUnbuffered();
   }

   ~raw_memory_ostream()
   {
      free(buffer);
   }

   void clear()
   {
      written = 0;
   }

   void take(char *&out_buffer, size_t &out_size)
   {
      out_buffer = buffer;
      out_size = written;
      buffer = NULL;
      written = 0;
      bufsize = 0;
   }

   void flush() = delete;

   void write_impl(const char *ptr, size_t size) override
   {
      if (unlikely(written + size < written))
         abort();
      if (written + size > bufsize) {
         bufsize = MAX3(1024, written + size, bufsize / 3 * 4);
         buffer = (char *)realloc(buffer, bufsize);
         if (!buffer) {
            fprintf(stderr, "amd: out of memory allocating ELF buffer\n");
            abort();
         }
      }
      memcpy(buffer + written, ptr, size);
      written += size;
   }

   void pwrite_impl(const char *ptr, size_t size, uint64_t offset) override
   {
      assert(offset == (size_t)offset && offset + size >= offset && offset + size <= written);
      memcpy(buffer + offset, ptr, size);
   }

   uint64_t current_pos() const override
   {
      return written;
   }
};

/* The LLVM compiler is represented as a pass manager containing passes for
 * optimizations, instruction selection, and code generation.
 */
struct ac_compiler_passes {
   raw_memory_ostream ostream;        /* ELF shader binary stream */
   legacy::PassManager passmgr; /* list of passes */
};

struct ac_compiler_passes *ac_create_llvm_passes(LLVMTargetMachineRef tm)
{
   struct ac_compiler_passes *p = new ac_compiler_passes();
   if (!p)
      return NULL;

   TargetMachine *TM = reinterpret_cast<TargetMachine *>(tm);

   if (TM->addPassesToEmitFile(p->passmgr, p->ostream, nullptr,
#if LLVM_VERSION_MAJOR >= 18
                               CodeGenFileType::ObjectFile)) {
#else
                               CGFT_ObjectFile)) {
#endif
      fprintf(stderr, "amd: TargetMachine can't emit a file of this type!\n");
      delete p;
      return NULL;
   }
   return p;
}

void ac_destroy_llvm_passes(struct ac_compiler_passes *p)
{
   delete p;
}

/* This returns false on failure. */
bool ac_compile_module_to_elf(struct ac_compiler_passes *p, LLVMModuleRef module,
                              char **pelf_buffer, size_t *pelf_size)
{
   p->passmgr.run(*unwrap(module));
   p->ostream.take(*pelf_buffer, *pelf_size);
   return true;
}

LLVMPassManagerRef ac_create_passmgr(LLVMTargetLibraryInfoRef target_library_info,
                                     bool check_ir)
{
   LLVMPassManagerRef passmgr = LLVMCreatePassManager();
   if (!passmgr)
      return NULL;

   if (target_library_info)
      LLVMAddTargetLibraryInfo(target_library_info, passmgr);

   if (check_ir)
      unwrap(passmgr)->add(createVerifierPass());

   unwrap(passmgr)->add(createAlwaysInlinerLegacyPass());

   /* Normally, the pass manager runs all passes on one function before
    * moving onto another. Adding a barrier no-op pass forces the pass
    * manager to run the inliner on all functions first, which makes sure
    * that the following passes are only run on the remaining non-inline
    * function, so it removes useless work done on dead inline functions.
    */
   unwrap(passmgr)->add(createBarrierNoopPass());

   #if LLVM_VERSION_MAJOR >= 16
   unwrap(passmgr)->add(createSROAPass(true));
   #else
   unwrap(passmgr)->add(createSROAPass());
   #endif
   /* TODO: restore IPSCCP */
   unwrap(passmgr)->add(createLICMPass());
   unwrap(passmgr)->add(createCFGSimplificationPass());
   /* This is recommended by the instruction combining pass. */
   unwrap(passmgr)->add(createEarlyCSEPass(true));
   unwrap(passmgr)->add(createInstructionCombiningPass());
   return passmgr;
}

LLVMValueRef ac_build_atomic_rmw(struct ac_llvm_context *ctx, LLVMAtomicRMWBinOp op,
                                 LLVMValueRef ptr, LLVMValueRef val, const char *sync_scope)
{
   AtomicRMWInst::BinOp binop;
   switch (op) {
   case LLVMAtomicRMWBinOpXchg:
      binop = AtomicRMWInst::Xchg;
      break;
   case LLVMAtomicRMWBinOpAdd:
      binop = AtomicRMWInst::Add;
      break;
   case LLVMAtomicRMWBinOpSub:
      binop = AtomicRMWInst::Sub;
      break;
   case LLVMAtomicRMWBinOpAnd:
      binop = AtomicRMWInst::And;
      break;
   case LLVMAtomicRMWBinOpNand:
      binop = AtomicRMWInst::Nand;
      break;
   case LLVMAtomicRMWBinOpOr:
      binop = AtomicRMWInst::Or;
      break;
   case LLVMAtomicRMWBinOpXor:
      binop = AtomicRMWInst::Xor;
      break;
   case LLVMAtomicRMWBinOpMax:
      binop = AtomicRMWInst::Max;
      break;
   case LLVMAtomicRMWBinOpMin:
      binop = AtomicRMWInst::Min;
      break;
   case LLVMAtomicRMWBinOpUMax:
      binop = AtomicRMWInst::UMax;
      break;
   case LLVMAtomicRMWBinOpUMin:
      binop = AtomicRMWInst::UMin;
      break;
   case LLVMAtomicRMWBinOpFAdd:
      binop = AtomicRMWInst::FAdd;
      break;
   default:
      unreachable("invalid LLVMAtomicRMWBinOp");
      break;
   }
   unsigned SSID = unwrap(ctx->context)->getOrInsertSyncScopeID(sync_scope);
   return wrap(unwrap(ctx->builder)
                        ->CreateAtomicRMW(binop, unwrap(ptr), unwrap(val),
                                          MaybeAlign(0),
                                          AtomicOrdering::SequentiallyConsistent, SSID));
}

LLVMValueRef ac_build_atomic_cmp_xchg(struct ac_llvm_context *ctx, LLVMValueRef ptr,
                                      LLVMValueRef cmp, LLVMValueRef val, const char *sync_scope)
{
   unsigned SSID = unwrap(ctx->context)->getOrInsertSyncScopeID(sync_scope);
   return wrap(unwrap(ctx->builder)
                        ->CreateAtomicCmpXchg(unwrap(ptr), unwrap(cmp),
                                              unwrap(val),
                                              MaybeAlign(0),
                                              AtomicOrdering::SequentiallyConsistent,
                                              AtomicOrdering::SequentiallyConsistent, SSID));
}
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`/*`
			`* Copyright 2014 Advanced Micro Devices, Inc.`
			`*`
sync with OpenBSD -current 2024-04-29 00:35:41 +00:00			`* SPDX-License-Identifier: MIT`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`*/`

			`#include <llvm-c/Core.h>`
			`#include <llvm/Analysis/TargetLibraryInfo.h>`
			`#include <llvm/IR/IRBuilder.h>`
			`#include <llvm/IR/LegacyPassManager.h>`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`#include <llvm/IR/Verifier.h>`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`#include <llvm/Target/TargetMachine.h>`
			`#include <llvm/MC/MCSubtargetInfo.h>`
			`#include <llvm/Support/CommandLine.h>`
			`#include <llvm/Transforms/IPO.h>`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`#include <llvm/Transforms/Scalar.h>`
			`#include <llvm/Transforms/Utils.h>`
			`#include <llvm/CodeGen/Passes.h>`
			`#include <llvm/Transforms/IPO/AlwaysInliner.h>`
			`#include <llvm/Transforms/InstCombine/InstCombine.h>`
			`#include <llvm/Transforms/IPO/SCCP.h>`
			`#include "llvm/CodeGen/SelectionDAGNodes.h"`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00
			`#include <cstring>`

			`/* DO NOT REORDER THE HEADERS`
			`* The LLVM headers need to all be included before any Mesa header,`
			* as they use the `restrict` keyword in ways that are incompatible
			`* with our #define in include/c99_compat.h`
			`*/`

			`#include "ac_binary.h"`
			`#include "ac_llvm_util.h"`
			`#include "ac_llvm_build.h"`
			`#include "util/macros.h"`

sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`using namespace llvm;`

			`class RunAtExitForStaticDestructors : public SDNode`
			`{`
			`public:`
			`/* getSDVTList (protected) calls getValueTypeList (private), which contains static variables. */`
			`RunAtExitForStaticDestructors(): SDNode(0, 0, DebugLoc(), getSDVTList(MVT::Other))`
			`{`
			`}`
			`};`

			`void ac_llvm_run_atexit_for_destructors(void)`
			`{`
			`/* LLVM >= 16 registers static variable destructors on the first compile, which gcc`
			`* implements by calling atexit there. Before that, u_queue registers its atexit`
			`* handler to kill all threads. Since exit() runs atexit handlers in the reverse order,`
			`* the LLVM destructors are called first while shader compiler threads may still be`
			`* running, which crashes in LLVM in SelectionDAG.cpp.`
			`*`
			`* The solution is to run the code that declares the LLVM static variables first,`
			`* so that atexit for LLVM is registered first and u_queue is registered after that,`
			`* which ensures that all u_queue threads are terminated before LLVM destructors are`
			`* called.`
			`*`
			`* This just executes the code that declares static variables.`
			`*/`
			`RunAtExitForStaticDestructors();`
			`}`

sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`bool ac_is_llvm_processor_supported(LLVMTargetMachineRef tm, const char *processor)`
			`{`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`TargetMachine TM = reinterpret_cast<TargetMachine >(tm);`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`return TM->getMCSubtargetInfo()->isCPUStringValid(processor);`
			`}`

sync with OpenBSD -current 2024-04-29 00:35:41 +00:00			`void ac_reset_llvm_all_options_occurrences()`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`{`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`cl::ResetAllOptionOccurrences();`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`}`

			`void ac_add_attr_dereferenceable(LLVMValueRef val, uint64_t bytes)`
			`{`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`Argument *A = unwrap<Argument>(val);`
			`A->addAttr(Attribute::getWithDereferenceableBytes(A->getContext(), bytes));`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`}`

			`void ac_add_attr_alignment(LLVMValueRef val, uint64_t bytes)`
			`{`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`Argument *A = unwrap<Argument>(val);`
			`A->addAttr(Attribute::getWithAlignment(A->getContext(), Align(bytes)));`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`}`

			`bool ac_is_sgpr_param(LLVMValueRef arg)`
			`{`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`Argument *A = unwrap<Argument>(arg);`
			`AttributeList AS = A->getParent()->getAttributes();`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`unsigned ArgNo = A->getArgNo();`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`return AS.hasParamAttr(ArgNo, Attribute::InReg);`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`}`

			`LLVMModuleRef ac_create_module(LLVMTargetMachineRef tm, LLVMContextRef ctx)`
			`{`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`TargetMachine TM = reinterpret_cast<TargetMachine >(tm);`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`LLVMModuleRef module = LLVMModuleCreateWithNameInContext("mesa-shader", ctx);`

sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`unwrap(module)->setTargetTriple(TM->getTargetTriple().getTriple());`
			`unwrap(module)->setDataLayout(TM->createDataLayout());`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`return module;`
			`}`

			`LLVMBuilderRef ac_create_builder(LLVMContextRef ctx, enum ac_float_mode float_mode)`
			`{`
			`LLVMBuilderRef builder = LLVMCreateBuilderInContext(ctx);`

sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`FastMathFlags flags;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00
			`switch (float_mode) {`
			`case AC_FLOAT_MODE_DEFAULT:`
			`case AC_FLOAT_MODE_DENORM_FLUSH_TO_ZERO:`
			`break;`

			`case AC_FLOAT_MODE_DEFAULT_OPENGL:`
			`/* Allow optimizations to treat the sign of a zero argument or`
			`* result as insignificant.`
			`*/`
			`flags.setNoSignedZeros(); /* nsz */`

			`/* Allow optimizations to use the reciprocal of an argument`
			`* rather than perform division.`
			`*/`
			`flags.setAllowReciprocal(); /* arcp */`

sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`unwrap(builder)->setFastMathFlags(flags);`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`break;`
			`}`

			`return builder;`
			`}`

			`void ac_enable_signed_zeros(struct ac_llvm_context *ctx)`
			`{`
			`if (ctx->float_mode == AC_FLOAT_MODE_DEFAULT_OPENGL) {`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`auto *b = unwrap(ctx->builder);`
			`FastMathFlags flags = b->getFastMathFlags();`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00
			`/* This disables the optimization of (x + 0), which is used`
			`* to convert negative zero to positive zero.`
			`*/`
			`flags.setNoSignedZeros(false);`
			`b->setFastMathFlags(flags);`
			`}`
			`}`

			`void ac_disable_signed_zeros(struct ac_llvm_context *ctx)`
			`{`
			`if (ctx->float_mode == AC_FLOAT_MODE_DEFAULT_OPENGL) {`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`auto *b = unwrap(ctx->builder);`
			`FastMathFlags flags = b->getFastMathFlags();`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00
			`flags.setNoSignedZeros();`
			`b->setFastMathFlags(flags);`
			`}`
			`}`

			`LLVMTargetLibraryInfoRef ac_create_target_library_info(const char *triple)`
			`{`
			`return reinterpret_cast<LLVMTargetLibraryInfoRef>(`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`new TargetLibraryInfoImpl(Triple(triple)));`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`}`

			`void ac_dispose_target_library_info(LLVMTargetLibraryInfoRef library_info)`
			`{`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`delete reinterpret_cast<TargetLibraryInfoImpl *>(library_info);`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`}`

			`/* Implementation of raw_pwrite_stream that works on malloc()ed memory for`
			`* better compatibility with C code. */`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`struct raw_memory_ostream : public raw_pwrite_stream {`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`char *buffer;`
			`size_t written;`
			`size_t bufsize;`

			`raw_memory_ostream()`
			`{`
			`buffer = NULL;`
			`written = 0;`
			`bufsize = 0;`
			`SetUnbuffered();`
			`}`

			`~raw_memory_ostream()`
			`{`
			`free(buffer);`
			`}`

			`void clear()`
			`{`
			`written = 0;`
			`}`

			`void take(char *&out_buffer, size_t &out_size)`
			`{`
			`out_buffer = buffer;`
			`out_size = written;`
			`buffer = NULL;`
			`written = 0;`
			`bufsize = 0;`
			`}`

			`void flush() = delete;`

			`void write_impl(const char *ptr, size_t size) override`
			`{`
			`if (unlikely(written + size < written))`
			`abort();`
			`if (written + size > bufsize) {`
			`bufsize = MAX3(1024, written + size, bufsize / 3 * 4);`
			`buffer = (char *)realloc(buffer, bufsize);`
			`if (!buffer) {`
			`fprintf(stderr, "amd: out of memory allocating ELF buffer\n");`
			`abort();`
			`}`
			`}`
			`memcpy(buffer + written, ptr, size);`
			`written += size;`
			`}`

			`void pwrite_impl(const char *ptr, size_t size, uint64_t offset) override`
			`{`
			`assert(offset == (size_t)offset && offset + size >= offset && offset + size <= written);`
			`memcpy(buffer + offset, ptr, size);`
			`}`

			`uint64_t current_pos() const override`
			`{`
			`return written;`
			`}`
			`};`

			`/* The LLVM compiler is represented as a pass manager containing passes for`
			`* optimizations, instruction selection, and code generation.`
			`*/`
			`struct ac_compiler_passes {`
			`raw_memory_ostream ostream; /* ELF shader binary stream */`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`legacy::PassManager passmgr; /* list of passes */`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`};`

			`struct ac_compiler_passes *ac_create_llvm_passes(LLVMTargetMachineRef tm)`
			`{`
			`struct ac_compiler_passes *p = new ac_compiler_passes();`
			`if (!p)`
			`return NULL;`

sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`TargetMachine TM = reinterpret_cast<TargetMachine >(tm);`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00
			`if (TM->addPassesToEmitFile(p->passmgr, p->ostream, nullptr,`
sync with OpenBSD -current 2024-04-29 00:35:41 +00:00			`#if LLVM_VERSION_MAJOR >= 18`
			`CodeGenFileType::ObjectFile)) {`
			`#else`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`CGFT_ObjectFile)) {`
sync with OpenBSD -current 2024-04-29 00:35:41 +00:00			`#endif`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`fprintf(stderr, "amd: TargetMachine can't emit a file of this type!\n");`
			`delete p;`
			`return NULL;`
			`}`
			`return p;`
			`}`

			`void ac_destroy_llvm_passes(struct ac_compiler_passes *p)`
			`{`
			`delete p;`
			`}`

			`/* This returns false on failure. */`
			`bool ac_compile_module_to_elf(struct ac_compiler_passes *p, LLVMModuleRef module,`
			`char *pelf_buffer, size_t pelf_size)`
			`{`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`p->passmgr.run(*unwrap(module));`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`p->ostream.take(pelf_buffer, pelf_size);`
			`return true;`
			`}`

sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`LLVMPassManagerRef ac_create_passmgr(LLVMTargetLibraryInfoRef target_library_info,`
			`bool check_ir)`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`{`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`LLVMPassManagerRef passmgr = LLVMCreatePassManager();`
			`if (!passmgr)`
			`return NULL;`

			`if (target_library_info)`
			`LLVMAddTargetLibraryInfo(target_library_info, passmgr);`

			`if (check_ir)`
			`unwrap(passmgr)->add(createVerifierPass());`

			`unwrap(passmgr)->add(createAlwaysInlinerLegacyPass());`

			`/* Normally, the pass manager runs all passes on one function before`
			`* moving onto another. Adding a barrier no-op pass forces the pass`
			`* manager to run the inliner on all functions first, which makes sure`
			`* that the following passes are only run on the remaining non-inline`
			`* function, so it removes useless work done on dead inline functions.`
			`*/`
			`unwrap(passmgr)->add(createBarrierNoopPass());`

			`#if LLVM_VERSION_MAJOR >= 16`
			`unwrap(passmgr)->add(createSROAPass(true));`
			`#else`
			`unwrap(passmgr)->add(createSROAPass());`
			`#endif`
			`/* TODO: restore IPSCCP */`
			`unwrap(passmgr)->add(createLICMPass());`
			`unwrap(passmgr)->add(createCFGSimplificationPass());`
			`/* This is recommended by the instruction combining pass. */`
			`unwrap(passmgr)->add(createEarlyCSEPass(true));`
			`unwrap(passmgr)->add(createInstructionCombiningPass());`
			`return passmgr;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`}`

			`LLVMValueRef ac_build_atomic_rmw(struct ac_llvm_context *ctx, LLVMAtomicRMWBinOp op,`
			`LLVMValueRef ptr, LLVMValueRef val, const char *sync_scope)`
			`{`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`AtomicRMWInst::BinOp binop;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`switch (op) {`
			`case LLVMAtomicRMWBinOpXchg:`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`binop = AtomicRMWInst::Xchg;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`break;`
			`case LLVMAtomicRMWBinOpAdd:`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`binop = AtomicRMWInst::Add;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`break;`
			`case LLVMAtomicRMWBinOpSub:`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`binop = AtomicRMWInst::Sub;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`break;`
			`case LLVMAtomicRMWBinOpAnd:`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`binop = AtomicRMWInst::And;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`break;`
			`case LLVMAtomicRMWBinOpNand:`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`binop = AtomicRMWInst::Nand;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`break;`
			`case LLVMAtomicRMWBinOpOr:`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`binop = AtomicRMWInst::Or;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`break;`
			`case LLVMAtomicRMWBinOpXor:`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`binop = AtomicRMWInst::Xor;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`break;`
			`case LLVMAtomicRMWBinOpMax:`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`binop = AtomicRMWInst::Max;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`break;`
			`case LLVMAtomicRMWBinOpMin:`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`binop = AtomicRMWInst::Min;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`break;`
			`case LLVMAtomicRMWBinOpUMax:`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`binop = AtomicRMWInst::UMax;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`break;`
			`case LLVMAtomicRMWBinOpUMin:`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`binop = AtomicRMWInst::UMin;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`break;`
			`case LLVMAtomicRMWBinOpFAdd:`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`binop = AtomicRMWInst::FAdd;`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`break;`
			`default:`
			`unreachable("invalid LLVMAtomicRMWBinOp");`
			`break;`
			`}`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`unsigned SSID = unwrap(ctx->context)->getOrInsertSyncScopeID(sync_scope);`
			`return wrap(unwrap(ctx->builder)`
			`->CreateAtomicRMW(binop, unwrap(ptr), unwrap(val),`
			`MaybeAlign(0),`
			`AtomicOrdering::SequentiallyConsistent, SSID));`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`}`

			`LLVMValueRef ac_build_atomic_cmp_xchg(struct ac_llvm_context *ctx, LLVMValueRef ptr,`
			`LLVMValueRef cmp, LLVMValueRef val, const char *sync_scope)`
			`{`
sync code with last improvements from OpenBSD 2023-11-11 18:37:37 +00:00			`unsigned SSID = unwrap(ctx->context)->getOrInsertSyncScopeID(sync_scope);`
			`return wrap(unwrap(ctx->builder)`
			`->CreateAtomicCmpXchg(unwrap(ptr), unwrap(cmp),`
			`unwrap(val),`
			`MaybeAlign(0),`
			`AtomicOrdering::SequentiallyConsistent,`
			`AtomicOrdering::SequentiallyConsistent, SSID));`
sync code with last improvements from OpenBSD 2023-08-28 05:57:34 +00:00			`}`