[llvm] IR2Builder tool for converting LLVM IR files into C++ IRBuilder API (PR #117129)
Jason Eckhardt via llvm-commits
llvm-commits at lists.llvm.org
Thu Nov 21 12:10:46 PST 2024
================
@@ -0,0 +1,1702 @@
+//===-- ir2builder.cpp - Transpiler from IR to builder API ------*- C++ -*-===//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+//===----------------------------------------------------------------------===//
+//
+// This file defines a pass, which converts LLVM IR into llvm::IRBuilder
+// API in textual form.
+//
+// This tool can be used to simplify IR construction using IRBuilder by
+// writing the IR by hand and then converting it using this pass.
+//
+//===----------------------------------------------------------------------===//
+
+#include "llvm/ADT/APFloat.h"
+#include "llvm/ADT/APInt.h"
+#include "llvm/ADT/PostOrderIterator.h"
+#include "llvm/ADT/StringExtras.h"
+#include "llvm/ADT/StringMap.h"
+#include "llvm/AsmParser/Parser.h"
+#include "llvm/IR/CallingConv.h"
+#include "llvm/IR/Constants.h"
+#include "llvm/IR/InlineAsm.h"
+#include "llvm/IR/Instructions.h"
+#include "llvm/IR/LLVMContext.h"
+#include "llvm/IR/Module.h"
+#include "llvm/IR/ModuleSummaryIndex.h"
+#include "llvm/Support/AtomicOrdering.h"
+#include "llvm/Support/CommandLine.h"
+#include "llvm/Support/FileSystem.h"
+#include "llvm/Support/InitLLVM.h"
+#include "llvm/Support/SourceMgr.h"
+#include "llvm/Support/ToolOutputFile.h"
+#include "llvm/Support/raw_ostream.h"
+#include <algorithm>
+#include <cctype>
+#include <cmath>
+#include <cstdint>
+#include <sstream>
+
+using namespace llvm;
+
+cl::OptionCategory Ir2BCat("ir2builder Options");
+
+/** LLVM IR to convert */
+static cl::opt<std::string>
+ InputFilename(cl::Positional, cl::desc("<input .ll file>"), cl::init("-"));
+
+/**
+ * Output file for the generated C++ code.
+ * If not set then stdout will be used.
+ */
+static cl::opt<std::string> OutputFilename("o",
+ cl::desc("Override output filename"),
+ cl::value_desc("filename"),
+ cl::cat(Ir2BCat));
+
+/** Set this when you don't use `using namespace llvm` (don't forget :: at the
+ * end) */
+static cl::opt<std::string> ScopePrefix(
+ "scope-prefix",
+ cl::desc(
+ "All generated calls to LLVM API will be prefixed with this scope. The "
+ "scope has to end with '::' (e.g.: '-scope-prefix=llvm::')"),
+ cl::cat(Ir2BCat), cl::init(""));
+
+/** Set this to your variable name for IRBuilder instance */
+static cl::opt<std::string> BuilderName(
+ "builder-name",
+ cl::desc("IRBuilder variable name that will be used in generated code"),
+ cl::cat(Ir2BCat), cl::init("Builder"));
+
+/** Set this to your LLVMContext variable name */
+static cl::opt<std::string> ContextName(
+ "context-name",
+ cl::desc("Context variable name that will be used in generated code"),
+ cl::cat(Ir2BCat), cl::init("Ctx"));
+
+/** Set this to your llvm::Module * name */
+static cl::opt<std::string> ModuleName(
+ "module-name",
+ cl::desc("Module variable name that will be used in generated code"),
+ cl::cat(Ir2BCat), cl::init("Mod"));
+
+/** Set this if you want custom data layout */
+static cl::opt<std::string> ClDataLayout("data-layout",
+ cl::desc("data layout string to use"),
+ cl::value_desc("layout-string"),
+ cl::init(""), cl::cat(Ir2BCat));
+
+/**
+ * This will generate fully compilable C++ program with main, which will
+ * use generated calls to create the original LLVM IR.
+ * Main purpose of this is to use it for testing and verification that
+ * generated program is correct and compilable.
+ * For example you can generate the code, run this program and then use
+ * llvm-diff to see if it matches the original:
+ * ```
+ * ./ir2builder code.ll --runnable > main.cpp &&
+ * g++ main.cpp `./llvm-conf --cxxflags --ldflags --system-libs --libs core`
+ * -I /llvm/include/ -o main &&
+ * ./main > generated.ll &&
+ * ./llvm-diff code.ll generated.ll
+ * ```
+ */
+static cl::opt<bool> GenerateRunnable(
+ "runnable", cl::desc("Generates whole cpp compilable program with main"),
+ cl::init(false), cl::cat(Ir2BCat));
+
+/**
+ * Disables verification of loaded llvm IR.
+ * Keep in mind that this will most likely result in C++ error as it probably
+ * won't be possible to create Builder calls for this.
+ */
+static cl::opt<bool>
+ DisableVerify("disable-verify", cl::Hidden,
+ cl::desc("Do not run verifier on input LLVM (dangerous!)"),
+ cl::cat(Ir2BCat));
+
+/**
+ * Sets the order of traversal for the LLVM IR.
+ * When enabled the traversal will be in reverse post order, which can handle
+ * when values are defined after (text-wise) their use.
+ * On the other hand using just linear traversal will also include parts that
+ * are outside of the graph (dead blocks).
+ */
+static cl::opt<bool>
+ UseRPO("use-rpo",
+ cl::desc("Traverses IR in reverse post order. This can help with "
+ "\"was not declared\" errors"),
+ cl::init(true), cl::cat(Ir2BCat));
+
+/**
+ * @brief Transpiler from LLVM IR into IRBuilder API calls
+ * The main purpose for this class is to hold variable counter and variable
+ * names for needed resources, such as LLVMContext.
+ */
+class IR2Builder {
+private:
+ unsigned long varI = 0;
+ std::string llvmPrefix;
+ std::string builder;
+ std::string ctx;
+ std::string modName;
+
+ std::vector<std::string> phiIncomings;
+
+ inline bool hasName(const Value *op) {
+ return !isa<Constant>(op) && !isa<InlineAsm>(op);
+ }
+
+ void outputAttr(Attribute att, raw_ostream &OS);
+
+ std::string getNextVar();
+ std::string getLinkage(GlobalValue &gv);
+ std::string getThreadLocalMode(GlobalValue::ThreadLocalMode tlm);
+ std::string getCmpPredicate(CmpInst::Predicate p);
+ std::string getAtomicRMWOp(AtomicRMWInst::BinOp op);
+ std::string getAtomicOrdering(AtomicOrdering ao);
+ std::string getSyncScopeID(SyncScope::ID sys);
+ std::string getCallingConv(CallingConv::ID cc);
+ std::string getConstantRange(ConstantRange &cr);
+
+ std::string getVal(const Value *op);
+ std::string getConst(const Constant *op);
+ std::string getType(const Type *t);
+ std::string getInlineAsm(const InlineAsm *op);
+ std::string getMetadata(const Metadata *op);
+
+public:
+ IR2Builder()
+ : llvmPrefix(ScopePrefix), builder(BuilderName), ctx(ContextName),
+ modName(ModuleName) {}
+
+ /**
+ * Calls convert for all the functions in passed in module
+ * @param M Module to call convert over
+ * @param OS Stream to which output the builder calls
+ */
+ void convert(Module &M, raw_ostream &OS);
+
+ /**
+ * Converts a function into IRBuilder API calls
+ * @param F Function to convert
+ * @param OS Stream to which output the builder calls
+ */
+ void convert(Function &F, raw_ostream &OS);
+
+ /**
+ * Converts an instruction into IRBuilder API calls
+ * @param I Instruction to convert
+ * @param OS Stream to which output the builder calls
+ * @note Unsupported instructions or their operands should result
+ * in a TODO comment.
+ */
+ void convert(const Instruction *I, raw_ostream &OS);
+};
+
+std::string IR2Builder::getNextVar() {
+ return "v0" + std::to_string(varI++);
+}
+
+static std::string to_str(bool b) { return b ? "true" : "false"; }
+
+static std::string escape(std::string str) {
+ std::stringstream ss;
+ for (unsigned char C : str) {
+ if (C == '\\')
+ ss << '\\' << C;
+ else if (isPrint(C) && C != '"')
+ ss << C;
+ else
+ ss << '\\' << hexdigit(C >> 4) << hexdigit(C & 0x0F);
+ }
+ return ss.str();
+}
+
+static std::string sanitize(std::string s) {
+ std::stringstream ss;
+ for (size_t i = 0; i < s.size(); ++i) {
+ if (!std::isalnum(s[i])) {
+ ss << "_" << static_cast<unsigned>(s[i]) << "_";
+ } else {
+ ss << s[i];
+ }
+ }
+ return ss.str();
+}
+
+std::string IR2Builder::getLinkage(llvm::GlobalValue &gv) {
+ std::string link = llvmPrefix + "GlobalValue::";
+
+ if (gv.hasExternalLinkage()) {
+ return link + "ExternalLinkage";
+ }
+ if (gv.hasAvailableExternallyLinkage()) {
+ return link + "AvailableExternallyLinkage";
+ }
+ if (gv.hasLinkOnceAnyLinkage()) {
+ return link + "LinkOnceAnyLinkage";
+ }
+ if (gv.hasLinkOnceODRLinkage()) {
+ return link + "LinkOnceODRLinkage";
+ }
+ if (gv.hasWeakAnyLinkage()) {
+ return link + "WeakAnyLinkage";
+ }
+ if (gv.hasWeakODRLinkage()) {
+ return link + "WeakODRLinkage";
+ }
+ if (gv.hasAppendingLinkage()) {
+ return link + "AppendingLinkage";
+ }
+ if (gv.hasInternalLinkage()) {
+ return link + "InternalLinkage";
+ }
+ if (gv.hasPrivateLinkage()) {
+ return link + "PrivateLinkage";
+ }
+ if (gv.hasExternalWeakLinkage()) {
+ return link + "ExternalWeakLinkage";
+ }
+ if (gv.hasCommonLinkage()) {
+ return link + "CommonLinkage";
+ }
+
+ return "/* Unknown linkage */";
+}
+
+std::string IR2Builder::getAtomicRMWOp(AtomicRMWInst::BinOp op) {
+ switch (op) {
+ case AtomicRMWInst::BinOp::Xchg:
+ return llvmPrefix + "AtomicRMWInst::BinOp::Xchg";
+ case AtomicRMWInst::BinOp::Add:
+ return llvmPrefix + "AtomicRMWInst::BinOp::Add";
+ case AtomicRMWInst::BinOp::Sub:
+ return llvmPrefix + "AtomicRMWInst::BinOp::Sub";
+ case AtomicRMWInst::BinOp::And:
+ return llvmPrefix + "AtomicRMWInst::BinOp::And";
+ case AtomicRMWInst::BinOp::Nand:
+ return llvmPrefix + "AtomicRMWInst::BinOp::Nand";
+ case AtomicRMWInst::BinOp::Or:
+ return llvmPrefix + "AtomicRMWInst::BinOp::Or";
+ case AtomicRMWInst::BinOp::Xor:
+ return llvmPrefix + "AtomicRMWInst::BinOp::Xor";
+ case AtomicRMWInst::BinOp::Max:
+ return llvmPrefix + "AtomicRMWInst::BinOp::Max";
+ case AtomicRMWInst::BinOp::Min:
+ return llvmPrefix + "AtomicRMWInst::BinOp::Min";
+ case AtomicRMWInst::BinOp::UMax:
+ return llvmPrefix + "AtomicRMWInst::BinOp::UMax";
+ case AtomicRMWInst::BinOp::UMin:
+ return llvmPrefix + "AtomicRMWInst::BinOp::UMin";
+ case AtomicRMWInst::BinOp::FAdd:
+ return llvmPrefix + "AtomicRMWInst::BinOp::FAdd";
+ case AtomicRMWInst::BinOp::FSub:
+ return llvmPrefix + "AtomicRMWInst::BinOp::FSub";
+ case AtomicRMWInst::BinOp::FMax:
+ return llvmPrefix + "AtomicRMWInst::BinOp::FMax";
+ case AtomicRMWInst::BinOp::FMin:
+ return llvmPrefix + "AtomicRMWInst::BinOp::FMin";
+ case AtomicRMWInst::BinOp::UIncWrap:
+ return llvmPrefix + "AtomicRMWInst::BinOp::UIncWrap";
+ case AtomicRMWInst::BinOp::UDecWrap:
+ return llvmPrefix + "AtomicRMWInst::BinOp::UDecWrap";
+ default:
+ return "/* TODO: Unknown AtomicRMW operator (using value) */ " +
+ std::to_string(op);
+ }
+}
+
+std::string IR2Builder::getAtomicOrdering(AtomicOrdering ao) {
+ switch (ao) {
+ case AtomicOrdering::NotAtomic:
+ return llvmPrefix + "AtomicOrdering::NotAtomic";
+ case AtomicOrdering::Unordered:
+ return llvmPrefix + "AtomicOrdering::Unordered";
+ case AtomicOrdering::Monotonic:
+ return llvmPrefix + "AtomicOrdering::Monotonic";
+ case AtomicOrdering::Acquire:
+ return llvmPrefix + "AtomicOrdering::Acquire";
+ case AtomicOrdering::Release:
+ return llvmPrefix + "AtomicOrdering::Release";
+ case AtomicOrdering::AcquireRelease:
+ return llvmPrefix + "AtomicOrdering::AcquireRelease";
+ case AtomicOrdering::SequentiallyConsistent:
+ return llvmPrefix + "AtomicOrdering::SequentiallyConsistent";
+ default:
+ return "/* TODO: Unknown atomic ordering */";
+ }
+}
+
+std::string IR2Builder::getCmpPredicate(CmpInst::Predicate p) {
+ switch (p) {
+ case CmpInst::Predicate::FCMP_FALSE:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_FALSE";
+ case CmpInst::Predicate::FCMP_OEQ:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_OEQ";
+ case CmpInst::Predicate::FCMP_OGT:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_OGT";
+ case CmpInst::Predicate::FCMP_OGE:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_OGE";
+ case CmpInst::Predicate::FCMP_OLT:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_OLT";
+ case CmpInst::Predicate::FCMP_OLE:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_OLE";
+ case CmpInst::Predicate::FCMP_ONE:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_ONE";
+ case CmpInst::Predicate::FCMP_ORD:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_ORD";
+ case CmpInst::Predicate::FCMP_UNO:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_UNO";
+ case CmpInst::Predicate::FCMP_UEQ:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_UEQ";
+ case CmpInst::Predicate::FCMP_UGT:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_UGT";
+ case CmpInst::Predicate::FCMP_UGE:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_UGE";
+ case CmpInst::Predicate::FCMP_ULT:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_ULT";
+ case CmpInst::Predicate::FCMP_ULE:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_ULE";
+ case CmpInst::Predicate::FCMP_UNE:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_UNE";
+ case CmpInst::Predicate::FCMP_TRUE:
+ return llvmPrefix + "CmpInst::Predicate::FCMP_TRUE";
+ case CmpInst::Predicate::ICMP_EQ:
+ return llvmPrefix + "CmpInst::Predicate::ICMP_EQ";
+ case CmpInst::Predicate::ICMP_NE:
+ return llvmPrefix + "CmpInst::Predicate::ICMP_NE";
+ case CmpInst::Predicate::ICMP_UGT:
+ return llvmPrefix + "CmpInst::Predicate::ICMP_UGT";
+ case CmpInst::Predicate::ICMP_UGE:
+ return llvmPrefix + "CmpInst::Predicate::ICMP_UGE";
+ case CmpInst::Predicate::ICMP_ULT:
+ return llvmPrefix + "CmpInst::Predicate::ICMP_ULT";
+ case CmpInst::Predicate::ICMP_ULE:
+ return llvmPrefix + "CmpInst::Predicate::ICMP_ULE";
+ case CmpInst::Predicate::ICMP_SGT:
+ return llvmPrefix + "CmpInst::Predicate::ICMP_SGT";
+ case CmpInst::Predicate::ICMP_SGE:
+ return llvmPrefix + "CmpInst::Predicate::ICMP_SGE";
+ case CmpInst::Predicate::ICMP_SLT:
+ return llvmPrefix + "CmpInst::Predicate::ICMP_SLT";
+ case CmpInst::Predicate::ICMP_SLE:
+ return llvmPrefix + "CmpInst::Predicate::ICMP_SLE";
+ default:
+ return "/* TODO: Unknown CMP predicate (using value) */ " +
+ std::to_string(p);
+ }
+}
+
+std::string IR2Builder::getSyncScopeID(SyncScope::ID sys) {
+ if (sys == SyncScope::System)
+ return llvmPrefix + "SyncScope::System";
+ else if (sys == SyncScope::SingleThread)
+ return llvmPrefix + "SyncScope::SingleThread";
+ else
+ return "/* TODO: Unknown SyncScope ID (using value) */ " +
+ std::to_string(sys);
+}
+
+std::string IR2Builder::getThreadLocalMode(GlobalValue::ThreadLocalMode tlm) {
+ switch (tlm) {
+ case GlobalValue::ThreadLocalMode::NotThreadLocal:
+ return llvmPrefix + "GlobalValue::ThreadLocalMode::NotThreadLocal";
+ case GlobalValue::ThreadLocalMode::GeneralDynamicTLSModel:
+ return llvmPrefix + "GlobalValue::ThreadLocalMode::GeneralDynamicTLSModel";
+ case GlobalValue::ThreadLocalMode::LocalDynamicTLSModel:
+ return llvmPrefix + "GlobalValue::ThreadLocalMode::LocalDynamicTLSModel";
+ case GlobalValue::ThreadLocalMode::InitialExecTLSModel:
+ return llvmPrefix + "GlobalValue::ThreadLocalMode::InitialExecTLSModel";
+ case GlobalValue::ThreadLocalMode::LocalExecTLSModel:
+ return llvmPrefix + "GlobalValue::ThreadLocalMode::LocalExecTLSModel";
+ default:
+ return "/* TODO: Unknown ThreadLocalMode (using value) */ " +
+ std::to_string(tlm);
+ }
+}
+
+std::string IR2Builder::getCallingConv(CallingConv::ID cc) {
+ switch (cc) {
+ case CallingConv::C:
+ return llvmPrefix + "CallingConv::C";
+ case CallingConv::Fast:
+ return llvmPrefix + "CallingConv::Fast";
+ case CallingConv::Cold:
+ return llvmPrefix + "CallingConv::Cold";
+ case CallingConv::GHC:
+ return llvmPrefix + "CallingConv::GHC";
+ case CallingConv::HiPE:
+ return llvmPrefix + "CallingConv::HiPE";
+ case CallingConv::AnyReg:
+ return llvmPrefix + "CallingConv::AnyReg";
+ case CallingConv::PreserveMost:
+ return llvmPrefix + "CallingConv::PreserveMost";
+ case CallingConv::PreserveAll:
+ return llvmPrefix + "CallingConv::PreserveAll";
+ case CallingConv::Swift:
+ return llvmPrefix + "CallingConv::Swift";
+ case CallingConv::CXX_FAST_TLS:
+ return llvmPrefix + "CallingConv::CXX_FAST_TLS";
+ case CallingConv::Tail:
+ return llvmPrefix + "CallingConv::Tail";
+ case CallingConv::CFGuard_Check:
+ return llvmPrefix + "CallingConv::CFGuard_Check";
+ case CallingConv::SwiftTail:
+ return llvmPrefix + "CallingConv::SwiftTail";
+ case CallingConv::PreserveNone:
+ return llvmPrefix + "CallingConv::PreserveNone";
+ case CallingConv::FirstTargetCC:
+ return llvmPrefix + "CallingConv::FirstTargetCC";
+ // CallingConv::X86_StdCall is the same as FirstTargetCC
+ case CallingConv::X86_FastCall:
+ return llvmPrefix + "CallingConv::X86_FastCall";
+ case CallingConv::ARM_APCS:
+ return llvmPrefix + "CallingConv::ARM_APCS";
+ case CallingConv::ARM_AAPCS:
+ return llvmPrefix + "CallingConv::ARM_AAPCS";
+ case CallingConv::ARM_AAPCS_VFP:
+ return llvmPrefix + "CallingConv::ARM_AAPCS_VFP";
+ case CallingConv::MSP430_INTR:
+ return llvmPrefix + "CallingConv::MSP430_INTR";
+ case CallingConv::X86_ThisCall:
+ return llvmPrefix + "CallingConv::X86_ThisCall";
+ case CallingConv::PTX_Kernel:
+ return llvmPrefix + "CallingConv::PTX_Kernel";
+ case CallingConv::PTX_Device:
+ return llvmPrefix + "CallingConv::PTX_Device";
+ case CallingConv::SPIR_FUNC:
+ return llvmPrefix + "CallingConv::SPIR_FUNC";
+ case CallingConv::SPIR_KERNEL:
+ return llvmPrefix + "CallingConv::SPIR_KERNEL";
+ case CallingConv::Intel_OCL_BI:
+ return llvmPrefix + "CallingConv::Intel_OCL_BI";
+ case CallingConv::X86_64_SysV:
+ return llvmPrefix + "CallingConv::X86_64_SysV";
+ case CallingConv::Win64:
+ return llvmPrefix + "CallingConv::Win64";
+ case CallingConv::X86_VectorCall:
+ return llvmPrefix + "CallingConv::X86_VectorCall";
+ case CallingConv::DUMMY_HHVM:
+ return llvmPrefix + "CallingConv::DUMMY_HHVM";
+ case CallingConv::DUMMY_HHVM_C:
+ return llvmPrefix + "CallingConv::DUMMY_HHVM_C";
+ case CallingConv::X86_INTR:
+ return llvmPrefix + "CallingConv::X86_INTR";
+ case CallingConv::AVR_INTR:
+ return llvmPrefix + "CallingConv::AVR_INTR";
+ case CallingConv::AVR_SIGNAL:
+ return llvmPrefix + "CallingConv::AVR_SIGNAL";
+ case CallingConv::AVR_BUILTIN:
+ return llvmPrefix + "CallingConv::AVR_BUILTIN";
+ case CallingConv::AMDGPU_VS:
+ return llvmPrefix + "CallingConv::AMDGPU_VS";
+ case CallingConv::AMDGPU_GS:
+ return llvmPrefix + "CallingConv::AMDGPU_GS";
+ case CallingConv::AMDGPU_PS:
+ return llvmPrefix + "CallingConv::AMDGPU_PS";
+ case CallingConv::AMDGPU_CS:
+ return llvmPrefix + "CallingConv::AMDGPU_CS";
+ case CallingConv::AMDGPU_KERNEL:
+ return llvmPrefix + "CallingConv::AMDGPU_KERNEL";
+ case CallingConv::X86_RegCall:
+ return llvmPrefix + "CallingConv::X86_RegCall";
+ case CallingConv::AMDGPU_HS:
+ return llvmPrefix + "CallingConv::AMDGPU_HS";
+ case CallingConv::MSP430_BUILTIN:
+ return llvmPrefix + "CallingConv::MSP430_BUILTIN";
+ case CallingConv::AMDGPU_LS:
+ return llvmPrefix + "CallingConv::AMDGPU_LS";
+ case CallingConv::AMDGPU_ES:
+ return llvmPrefix + "CallingConv::AMDGPU_ES";
+ case CallingConv::AArch64_VectorCall:
+ return llvmPrefix + "CallingConv::AArch64_VectorCall";
+ case CallingConv::AArch64_SVE_VectorCall:
+ return llvmPrefix + "CallingConv::AArch64_SVE_VectorCall";
+ case CallingConv::WASM_EmscriptenInvoke:
+ return llvmPrefix + "CallingConv::WASM_EmscriptenInvoke";
+ case CallingConv::AMDGPU_Gfx:
+ return llvmPrefix + "CallingConv::AMDGPU_Gfx";
+ case CallingConv::M68k_INTR:
+ return llvmPrefix + "CallingConv::M68k_INTR";
+ case CallingConv::AArch64_SME_ABI_Support_Routines_PreserveMost_From_X0:
+ return llvmPrefix +
+ "CallingConv::AArch64_SME_ABI_Support_Routines_PreserveMost_From_X0";
+ case CallingConv::AArch64_SME_ABI_Support_Routines_PreserveMost_From_X2:
+ return llvmPrefix +
+ "CallingConv::AArch64_SME_ABI_Support_Routines_PreserveMost_From_X2";
+ case CallingConv::AMDGPU_CS_Chain:
+ return llvmPrefix + "CallingConv::AMDGPU_CS_Chain";
+ case CallingConv::AMDGPU_CS_ChainPreserve:
+ return llvmPrefix + "CallingConv::AMDGPU_CS_ChainPreserve";
+ case CallingConv::M68k_RTD:
+ return llvmPrefix + "CallingConv::M68k_RTD";
+ case CallingConv::GRAAL:
+ return llvmPrefix + "CallingConv::GRAAL";
+ case CallingConv::ARM64EC_Thunk_X64:
+ return llvmPrefix + "CallingConv::ARM64EC_Thunk_X64";
+ case CallingConv::ARM64EC_Thunk_Native:
+ return llvmPrefix + "CallingConv::ARM64EC_Thunk_Native";
+ default:
+ return "/* Custom CC */" + std::to_string(cc);
+ }
+}
+
+std::string IR2Builder::getType(const Type *t) {
+ std::string tcall;
+ if (auto tt = dyn_cast<IntegerType>(t)) {
+ switch (tt->getBitWidth()) {
+ case 8:
+ tcall = "getInt8Ty()";
+ break;
+ case 16:
+ tcall = "getInt16Ty()";
+ break;
+ case 32:
+ tcall = "getInt32Ty()";
+ break;
+ case 64:
+ tcall = "getInt64Ty()";
+ break;
+ default:
+ tcall = "getIntNTy(" + std::to_string(tt->getBitWidth()) + ")";
+ break;
+ }
+ } else if (t->isVoidTy())
+ tcall = "getVoidTy()";
+ else if (t->isFloatTy())
+ tcall = "getFloatTy()";
+ else if (t->isDoubleTy())
+ tcall = "getDoubleTy()";
+ else if (auto st = dyn_cast<StructType>(t)) {
+ std::string elements = llvmPrefix + "ArrayRef<Type *>(";
+ if (st->getNumElements() > 1)
+ elements += "{";
+ bool first = true;
+ for (auto e : st->elements()) {
+ if (!first)
+ elements += ", ";
+ elements += getType(e);
+ first = false;
+ }
+ if (st->getNumElements() > 1)
+ elements += "}";
+ elements += ")";
+ return llvmPrefix + "StructType::create(" + ctx + ", " + elements + ")";
+ } else if (auto at = dyn_cast<ArrayType>(t)) {
+ return llvmPrefix + "ArrayType::get(" + getType(at->getElementType()) +
+ ", " + std::to_string(at->getArrayNumElements()) + ")";
+ } else if (t->isBFloatTy())
+ tcall = "getBFloatTy()";
+ else if (auto vt = dyn_cast<VectorType>(t)) {
+ std::string elemCount =
+ llvmPrefix + "ElementCount::get(" +
+ std::to_string(vt->getElementCount().getKnownMinValue()) + ", " +
+ to_str(vt->getElementCount().isScalable()) + ")";
+ return llvmPrefix + "VectorType::get(" + getType(vt->getElementType()) +
+ ", " + elemCount + ")";
+ } else if (auto ft = dyn_cast<FunctionType>(t)) {
+ tcall = llvmPrefix + "FunctionType::get(" + getType(ft->getReturnType()) +
+ ", {";
+
+ bool isFirst = true;
+ for (auto a : ft->params()) {
+ if (!isFirst)
+ tcall += ", ";
+ tcall += getType(a);
+ isFirst = false;
+ }
+ tcall += "}, " + to_str(ft->isVarArg()) + ")";
+ return tcall;
+ } else if (t->isPointerTy())
+ tcall = "getPtrTy()";
+ else if (t->isHalfTy()) {
+ return llvmPrefix + "Type::getHalfTy(" + ctx + ")";
+ } else if (t->isBFloatTy()) {
+ return llvmPrefix + "Type::getBFloatTy(" + ctx + ")";
+ } else if (t->isX86_FP80Ty()) {
+ return llvmPrefix + "Type::getX86_FP80Ty(" + ctx + ")";
+ } else if (t->isFP128Ty()) {
+ return llvmPrefix + "Type::getFP128Ty(" + ctx + ")";
+ } else if (t->isPPC_FP128Ty()) {
+ return llvmPrefix + "Type::getPPC_FP128Ty(" + ctx + ")";
+ } else if (t->isX86_AMXTy()) {
+ return llvmPrefix + "Type::getX86_AMXTy(" + ctx + ")";
+ } else if (t->isLabelTy()) {
+ return llvmPrefix + "Type::getLabelTy(" + ctx + ")";
+ } else if (t->isMetadataTy()) {
+ return llvmPrefix + "Type::getMetadataTy(" + ctx + ")";
+ } else if (t->isTokenTy()) {
+ return llvmPrefix + "Type::getTokenTy(" + ctx + ")";
+ } else {
+ return "/* TODO: Unknown type */";
+ }
+
+ return builder + "." + tcall;
+}
+
+std::string IR2Builder::getConst(const Constant *c) {
+ if (auto ci = dyn_cast<ConstantInt>(c)) {
+ // TODO: Sign has to be determined
+ auto cval = ci->getValue();
+ return llvmPrefix + "ConstantInt::get(" + getType(c->getType()) + ", " +
+ std::to_string(cval.getSExtValue()) + ")";
+ } else if (auto cf = dyn_cast<ConstantFP>(c)) {
+ auto cval = cf->getValue();
+ double dval = cval.convertToDouble();
+ std::string val = std::to_string(dval);
+ if (std::isnan(dval) || std::isinf(dval))
+ val = "\"" + val + "\"";
+ // TODO: Handle double to string conversion to include all digits
+ return llvmPrefix + "ConstantFP::get(" + getType(c->getType()) + ", " +
+ val + ")";
+ } else if (auto at = dyn_cast<ConstantAggregate>(c)) {
+ std::string values;
+ bool first = true;
+ for (unsigned i = 0; i < at->getNumOperands(); ++i) {
+ if (!first)
+ values += ", ";
+ values += getVal(at->getOperand(i));
+ first = false;
+ }
+
+ std::string className;
+ if (isa<ConstantArray>(c)) {
+ className = "ConstantArray";
+ values = llvmPrefix + "ArrayRef<" + llvmPrefix + "Constant *>(" +
+ (at->getNumOperands() > 1 ? std::string("{") : std::string("")) +
+ values +
+ (at->getNumOperands() > 1 ? std::string("}") : std::string("")) +
+ ")";
+ } else if (isa<ConstantStruct>(c))
+ className = "ConstantStruct";
+ else if (isa<ConstantVector>(c)) {
+ values = "{" + values + "}";
+ // ConstantVector does not take type as 1st arg
+ return llvmPrefix + "ConstantVector::get(" + values + ")";
+ } else
+ return "/* TODO: Unknown aggregate constant */";
+
+ return llvmPrefix + className + "::get(" + getType(c->getType()) + ", " +
+ values + ")";
+ } else if (auto cds = dyn_cast<ConstantDataSequential>(c)) {
+ std::string values;
+ std::string className;
+ std::string elemTy = "/* TODO */";
+ if (isa<ConstantDataArray>(c))
+ className = "ConstantDataArray";
+ else if (isa<ConstantDataVector>(c))
+ className = "ConstantDataVector";
+ else
+ return "/* TODO: Unknown data sequential constant */";
+ if (cds->isString()) {
+ values = "";
+ bool first = true;
+ for (auto a : cds->getAsString().str()) {
+ if (first) {
+ values += std::to_string(static_cast<uint8_t>(a));
+ first = false;
+ } else {
+ values += ", " + std::to_string(static_cast<uint8_t>(a));
+ }
+ }
+ return llvmPrefix + className + "::get(" + ctx + ", " + llvmPrefix +
+ "ArrayRef<uint8_t>({" + values + "}))";
+ } else if (cds->isCString()) {
+ values = "";
+ bool first = true;
+ for (auto a : cds->getAsCString().str()) {
+ if (first) {
+ values += std::to_string(static_cast<uint8_t>(a));
+ first = false;
+ } else {
+ values += ", " + std::to_string(static_cast<uint8_t>(a));
+ }
+ }
+ return llvmPrefix + className + "::get(" + ctx + ", " + llvmPrefix +
+ "ArrayRef<uint8_t>({" + values + "}))";
+ } else {
+ Type *elemT = cds->getElementType();
+ if (elemT->isIntegerTy()) {
+ // There can be only 8, 16, 32 or 64 ints in ConstantDataVector
+ elemTy = "uint" + std::to_string(elemT->getIntegerBitWidth()) + "_t";
+ } else if (elemT->isDoubleTy()) {
+ elemTy = "double";
+ } else if (elemT->isFloatTy()) {
+ elemTy = "float";
+ }
+ values = llvmPrefix + "ArrayRef<" + elemTy + ">(";
+ if (cds->getNumElements() > 1)
+ values += "{";
+ bool first = true;
+ for (unsigned i = 0; i < cds->getNumElements(); ++i) {
+ if (!first)
+ values += ", ";
+ if (elemT->isIntegerTy()) {
+ values += std::to_string(cds->getElementAsInteger(i));
+ } else if (elemT->isDoubleTy()) {
+ values += std::to_string(cds->getElementAsDouble(i));
+ } else if (elemT->isFloatTy()) {
+ values += std::to_string(cds->getElementAsFloat(i));
+ } else
+ return "/* Unknown type in data sequential constant */";
+ first = false;
+ }
+ if (cds->getNumElements() > 1)
+ values += "}";
+ values += ")";
+ }
+
+ return llvmPrefix + className + "::get(" + ctx + ", " + values + ")";
+ } else if (isa<ConstantAggregateZero>(c)) {
+ return llvmPrefix + "ConstantAggregateZero::get(" + getType(c->getType()) +
+ ")";
+ } else if (isa<PoisonValue>(c)) {
+ return llvmPrefix + "PoisonValue::get(" + getType(c->getType()) + ")";
+ } else if (isa<UndefValue>(c)) {
+ return llvmPrefix + "UndefValue::get(" + getType(c->getType()) + ")";
+ } else if (auto ba = dyn_cast<BlockAddress>(c)) {
+ return llvmPrefix + "BlockAddress::get(" + getVal(ba->getFunction()) +
+ ", " + getVal(ba->getBasicBlock()) + ")";
+ } else if (isa<ConstantPointerNull>(c)) {
+ return llvmPrefix + "ConstantPointerNull::get(" + getType(c->getType()) +
+ ")";
+ } else if (auto ctn = dyn_cast<ConstantTargetNone>(c)) {
+ auto tetType = ctn->getType();
+
+ std::string typeStr = "{";
+ bool first = true;
+ for (unsigned i = 0; i < tetType->getNumTypeParameters(); ++i) {
+ if (!first)
+ typeStr += ", ";
+ typeStr += getType(tetType->getTypeParameter(i));
+ first = false;
+ }
+ typeStr += "}";
+
+ std::string intsStr = "{";
+ first = true;
+ for (unsigned i = 0; i < tetType->getNumIntParameters(); ++i) {
+ if (!first)
+ intsStr += ", ";
+ intsStr += std::to_string(tetType->getIntParameter(i));
+ first = false;
+ }
+ intsStr += "}";
+
+ std::string tetName = "\"" + escape(tetType->getName().str()) + "\"";
+ std::string tet = llvmPrefix + "TargetExtType::get(" + ctx + ", " +
+ tetName + ", " + typeStr + ", " + intsStr + ")";
+
+ return llvmPrefix + "ConstantTargetNone::get(" + tet + ")";
+ } else if (isa<ConstantTokenNone>(c)) {
+ return llvmPrefix + "ConstantTokenNone::get(" + ctx + ")";
+ } else if (auto ce = dyn_cast<ConstantExpr>(c)) {
+ (void)ce;
+ return "/* TODO: ConstantExpr creation */";
+ // TODO: Dunno how to create this... Fails either on out of range or
+ // even on incorrect opcode
+ // return llvmPrefix + "ConstantExpr::get(" +
+ // std::to_string(ce->getOpcode()) + ", " +
+ // getVal(ce->getOperand(0)) + ", " + getVal(ce->getOperand(1)) + ")";
+ } else if (auto ce = dyn_cast<ConstantPtrAuth>(c)) {
+ (void)ce;
+ return "/* TODO: ConstantPtrAuth value creation */";
+ } else if (auto ce = dyn_cast<DSOLocalEquivalent>(c)) {
+ (void)ce;
+ return "/* TODO: DSOLocalEquivalent value creation */";
+ } else if (auto ce = dyn_cast<NoCFIValue>(c)) {
+ (void)ce;
+ return "/* TODO: NoCFIValue value creation */";
+ } else if (auto ce = dyn_cast<GlobalValue>(c)) {
+ // This should not really happen as getVal should be always called
+ return getVal(ce);
+ }
+
+ return "/* TODO: Constant creation */";
+}
+
+std::string IR2Builder::getInlineAsm(const InlineAsm *op) {
+ auto getAsmDialect = [llvmPrefix = llvmPrefix](InlineAsm::AsmDialect d) {
+ switch (d) {
+ case InlineAsm::AsmDialect::AD_ATT:
+ return llvmPrefix + "InlineAsm::AsmDialect::AD_ATT";
+ case InlineAsm::AsmDialect::AD_Intel:
+ return llvmPrefix + "InlineAsm::AsmDialect::AD_Intel";
+ default:
+ return "/* TODO: Unknown AsmDialect (using value) */" + std::to_string(d);
+ }
+ };
+
+ return llvmPrefix + "InlineAsm::get(" + getType(op->getFunctionType()) +
+ ", " + "\"" + escape(op->getAsmString()) + "\", " + "\"" +
+ escape(op->getConstraintString()) + "\", " +
+ to_str(op->hasSideEffects()) + ", " + to_str(op->isAlignStack()) +
+ ", " + getAsmDialect(op->getDialect()) + ", " +
+ to_str(op->canThrow()) + ")";
+}
+
+std::string IR2Builder::getMetadata(const Metadata *op) {
+ if (auto mdn = dyn_cast<MDNode>(op)) {
+ std::string args = "{";
+ bool first = true;
+ for (unsigned i = 0; i < mdn->getNumOperands(); ++i) {
+ if (!first)
+ args += ", ";
+ args += getMetadata(mdn->getOperand(i));
+ first = false;
+ }
+ args += "}";
+ return llvmPrefix + "MDNode::get(" + ctx + ", " + args + ")";
+ } else if (auto vam = dyn_cast<ValueAsMetadata>(op)) {
+ return llvmPrefix + "ValueAsMetadata::get(" + getVal(vam->getValue()) + ")";
+ } else if (auto mds = dyn_cast<MDString>(op)) {
+ return llvmPrefix + "MDString::get(" + ctx + ", \"" +
+ escape(mds->getString().str()) + "\")";
+ } else {
+ return "/* TODO: Metadata creation */";
+ }
+}
+
+// This is a DEBUG function in Value, so lets copy it here for NDEBUG as well
+static std::string getNameOrAsOperand(const Value *v) {
+ if (!v->getName().empty())
+ return std::string(v->getName());
+
+ std::string BBName;
+ raw_string_ostream OS(BBName);
+ v->printAsOperand(OS, false);
+ return OS.str();
+}
+
+std::string IR2Builder::getVal(const Value *op) {
+ if (!op)
+ return "nullptr";
+ if (isa<Constant>(op) && !isa<GlobalValue>(op)) {
+ return getConst(dyn_cast<Constant>(op));
+ } else if (auto ina = dyn_cast<InlineAsm>(op)) {
+ return getInlineAsm(ina);
+ } else if (auto mtd = dyn_cast<MetadataAsValue>(op)) {
+ return llvmPrefix + "MetadataAsValue::get(" + ctx + ", " +
+ getMetadata(mtd->getMetadata()) + ")";
+ }
+ std::string opName = getNameOrAsOperand(op);
+ if (opName[0] == '%')
+ opName.erase(opName.begin());
+ std::string pref = "v_";
+ if (isa<GlobalValue>(op))
+ pref = "g_";
+ return pref + sanitize(opName);
+}
+
+std::string getBinArithOp(std::string name, std::string op1, std::string op2,
+ const Instruction *I) {
+ return "Create" + name + "(" + op1 + ", " + op2 + ", \"\", " +
+ to_str(I->hasNoUnsignedWrap()) + ", " + to_str(I->hasNoSignedWrap()) +
+ ")";
+}
+
+std::string getFPBinArithOp(std::string name, std::string op1, std::string op2,
+ const Instruction *I) {
+ return "Create" + name + "(" + op1 + ", " + op2 + ")";
+ // TODO: Handle FPMathTag
+}
+
+std::string IR2Builder::getConstantRange(ConstantRange &cr) {
+ std::stringstream ss;
+ unsigned NumWords = divideCeil(cr.getBitWidth(), 64);
+ auto numWordsStr = std::to_string(NumWords);
+ auto numBitsStr = std::to_string(cr.getBitWidth());
+ auto lower = std::to_string(cr.getLower().getLimitedValue());
+ auto upper = std::to_string(cr.getUpper().getLimitedValue());
+ ss << llvmPrefix << "ConstantRange(APInt(" << numBitsStr << ", " << lower
+ << ", true), "
+ << "APInt(" << numBitsStr << ", " << upper << ", true))";
+ return ss.str();
+}
+
+void IR2Builder::outputAttr(Attribute att, raw_ostream &OS) {
+ // TODO: Handle special cases detected using "has" methods
+ // see Attribute::getAsString(bool InAttrGrp)
+ if (att.isStringAttribute()) {
+ OS << llvmPrefix << "Attribute::get(" << ctx << ", \""
+ << att.getKindAsString() << "\"";
+ auto val = att.getValueAsString();
+ if (val.empty()) {
+ OS << ")";
+ } else {
+ OS << ", \"";
+ printEscapedString(val, OS);
+ OS << "\")";
+ }
+ } else if (att.isIntAttribute()) {
+ OS << llvmPrefix << "Attribute::get(" << ctx << ", (" << llvmPrefix
+ << "Attribute::AttrKind)" << std::to_string(att.getKindAsEnum())
+ << ", static_cast<uint64_t>(" << att.getValueAsInt() << "))";
+ } else if (att.isEnumAttribute()) {
+ OS << llvmPrefix << "Attribute::get(" << ctx << ", \""
+ << att.getNameFromAttrKind(att.getKindAsEnum()) << "\")";
+ } else if (att.isTypeAttribute()) {
+ OS << llvmPrefix << "Attribute::get(" << ctx << ", (" << llvmPrefix
+ << "Attribute::AttrKind)" << std::to_string(att.getKindAsEnum()) << ", "
+ << getType(att.getValueAsType()) << ")";
+ } else if (att.isConstantRangeAttribute()) {
+ auto cr = att.getValueAsConstantRange();
+ OS << llvmPrefix << "Attribute::get(" << ctx << ", (" << llvmPrefix
+ << "Attribute::AttrKind)" << std::to_string(att.getKindAsEnum()) << ", "
+ << getConstantRange(cr) << ")";
+ } else if (att.isConstantRangeListAttribute()) {
+ std::string args = "{";
+ bool first = true;
+ for (auto cr : att.getValueAsConstantRangeList()) {
+ if (!first)
+ args += ", ";
+ args += getConstantRange(cr);
+ first = false;
+ }
+ args += "}";
+ OS << llvmPrefix << "Attribute::get(" << ctx << ", (" << llvmPrefix
+ << "Attribute::AttrKind)" << std::to_string(att.getKindAsEnum()) << ", "
+ << llvmPrefix << args << ")";
+ } else {
+ OS << "/* TODO: Attribute creation */";
+ }
+}
+
+void IR2Builder::convert(Module &M, raw_ostream &OS) {
+ // Prologue
+ if (GenerateRunnable) {
+ // Top comment
+ OS << "// This file was autogenerated using ir2builder tool\n";
+
+ // Includes
+ // Currently we include all possibly needed files as this is done
+ // before the conversion of functions
+ OS << R"(
+#include "llvm/ADT/APFloat.h"
+#include "llvm/ADT/APInt.h"
+#include "llvm/IR/BasicBlock.h"
+#include "llvm/IR/CallingConv.h"
+#include "llvm/IR/ConstantRange.h"
+#include "llvm/IR/Constants.h"
+#include "llvm/IR/DerivedTypes.h"
+#include "llvm/IR/Function.h"
+#include "llvm/IR/IRBuilder.h"
+#include "llvm/IR/InlineAsm.h"
+#include "llvm/IR/Instructions.h"
+#include "llvm/IR/LLVMContext.h"
+#include "llvm/IR/Module.h"
+#include "llvm/IR/Type.h"
+#include "llvm/Support/AtomicOrdering.h"
+#include "llvm/Support/InitLLVM.h"
+#include "llvm/Support/SourceMgr.h"
+#include <cstdint>
+
+using namespace llvm;
+
+int main(int argc, char** argv) {
+ InitLLVM X(argc, argv);
+)";
+
+ // Used objects and variables
+ OS << " LLVMContext " << ctx << ";\n"
+ << " Module *" << modName
+ << "= new Module(\"ir2builder generated module\", " << ctx << ");\n"
+ << " IRBuilder<> " << builder << "(" << ctx << ");\n";
+
+ // Global generation
+ for (auto &G : M.globals()) {
+ std::string initVal = "nullptr";
+ if (G.hasInitializer()) {
+ // In case of BlockAddress initializer we need to declare the function
+ // and basic block so it can be used
+ if (auto ba = dyn_cast<BlockAddress>(G.getInitializer())) {
+ OS << "auto " << getVal(ba->getFunction()) << " = " << modName
+ << "->getOrInsertFunction(\"" << ba->getFunction()->getName()
+ << "\", " << getType(ba->getFunction()->getFunctionType())
+ << ");\n";
+ // Extract basic block
+ // TODO: The function might need to be created in here
+ // since the basic blocks don't exist yet
+ OS << "// TODO: Basic block extraction\n";
+ }
+ initVal = getVal(G.getInitializer());
+ }
+
+ std::string gname = getVal(&G);
+ OS << "auto " << gname << " = new " << llvmPrefix << "GlobalVariable(*"
+ << modName << ", " << getType(G.getValueType()) << ", "
+ << to_str(G.isConstant()) << ", " << getLinkage(G) << ", " << initVal
+ << ", \"" << escape(G.getName().str()) << "\", "
+ << "nullptr"
+ << ", " << getThreadLocalMode(G.getThreadLocalMode()) << ", "
+ << std::to_string(G.getAddressSpace()) << ", "
+ << to_str(G.isExternallyInitialized()) << ");\n";
+ }
+ }
+
+ // Function generation
+ for (Function &F : M) {
+ if (!F.isDeclaration())
+ convert(F, OS);
+ }
+
+ // Epilogue
+ if (GenerateRunnable) {
+ // Print generated code
+ OS << " " << modName << "->print(outs(), nullptr);\n";
+ // Cleanup
+ OS << " delete " << modName << ";\n"
+ << " return 0;\n}\n";
+ }
+}
+
+void IR2Builder::convert(Function &F, raw_ostream &OS) {
+ phiIncomings.clear();
+ // Function
+ OS << "{\n\n";
+ auto fDecl = getVal(&F);
+ OS << llvmPrefix << "Function *" << fDecl;
+ OS << " = " << llvmPrefix << "Function::Create("
+ << getType(F.getFunctionType()) << ", " << getLinkage(F) << ", \""
+ << F.getName() << "\", " << modName << ");\n";
+
+ OS << "\n";
+
+ // Set attributes
+ if (F.getCallingConv() != CallingConv::C) { // C is default
+ OS << fDecl << "->setCallingConv(" + getCallingConv(F.getCallingConv())
+ << ");\n";
+ }
+ // TODO: Handle attributes with values
+ if (F.getAttributes().hasFnAttrs()) {
+ for (auto att : F.getAttributes().getFnAttrs()) {
+ OS << fDecl << "->addFnAttr(";
+ outputAttr(att, OS);
+ OS << ");\n";
+ }
+ }
+ if (F.getAttributes().hasRetAttrs()) {
+ for (auto att : F.getAttributes().getRetAttrs()) {
+ OS << fDecl << "->addRetAttr(";
+ outputAttr(att, OS);
+ OS << ");\n";
+ }
+ }
+ for (size_t i = 0; i < F.arg_size(); ++i) {
+ if (F.getAttributes().hasParamAttrs(i)) {
+ for (auto att : F.getAttributes().getAttributes(i + 1)) {
+ OS << fDecl << "->addParamAttr(" << i << ", ";
+ outputAttr(att, OS);
+ OS << ");\n";
+ }
+ }
+ }
+
+ // Save arguments into variables for easy access
+ for (unsigned i = 0; i < F.arg_size(); ++i) {
+ OS << "auto " << getVal(F.getArg(i)) << " = " << fDecl << "->getArg("
+ << std::to_string(i) << ");\n";
+ }
+
+ if (UseRPO) {
+ ReversePostOrderTraversal<Function *> RPOT(&F);
+
+ // Basic block declaration in order
+ for (BasicBlock *BB : RPOT) {
+ std::string bbName = getVal(BB);
+ OS << llvmPrefix << "BasicBlock* " << bbName << " = " << llvmPrefix
+ << "BasicBlock::Create(" << ctx << ", \"" << BB->getName() << "\", "
+ << fDecl << ");\n";
+ }
+
+ OS << "\n";
+
+ for (auto *BB : RPOT) {
+ OS << builder << "."
+ << "SetInsertPoint(" << getVal(BB) << ");\n";
+
+ for (auto J = BB->begin(), JE = BB->end(); J != JE; ++J) {
+ const Instruction *Inst = &*J;
+ convert(Inst, OS);
+ }
+
+ OS << "\n";
+ }
+ } else {
+ for (BasicBlock &BB : F) {
+ std::string bbName = getVal(&BB);
+ OS << llvmPrefix << "BasicBlock* " << bbName << " = " << llvmPrefix
+ << "BasicBlock::Create(" << ctx << ", \"" << BB.getName() << "\", "
+ << fDecl << ");\n";
+ }
+
+ OS << "\n";
+
+ for (auto &BB : F) {
+ OS << builder << "."
+ << "SetInsertPoint(" << getVal(&BB) << ");\n";
+
+ for (auto J = BB.begin(), JE = BB.end(); J != JE; ++J) {
+ const Instruction *Inst = &*J;
+ convert(Inst, OS);
+ }
+
+ OS << "\n";
+ }
+ }
+
+ // Output incoming values assignment into phis, this is needed as they
+ // might refer to a value not yet defined in the time of phi definition
+ for (auto l : phiIncomings) {
+ OS << l;
+ }
+
+ OS << "}\n";
+}
+
+void IR2Builder::convert(const Instruction *I, raw_ostream &OS) {
+ std::string call;
+
+ std::string op1 = "/* TODO */";
+ std::string op2 = "/* TODO */";
+ std::string op3 = "/* TODO */";
+
+ if (I->getNumOperands() > 0) {
+ op1 = getVal(I->getOperand(0));
+ }
+ if (I->getNumOperands() > 1) {
+ op2 = getVal(I->getOperand(1));
+ }
+ if (I->getNumOperands() > 2) {
+ op3 = getVal(I->getOperand(2));
+ }
+
+ switch (I->getOpcode()) {
+ case Instruction::Ret: {
+ if (I->getNumOperands() == 0)
+ call = "CreateRetVoid()";
+ else
+ call = "CreateRet(" + op1 + ")";
+ } break;
+ case Instruction::Br: {
+ const BranchInst *bi = dyn_cast<BranchInst>(I);
+ if (bi->isUnconditional()) {
+ call = "CreateBr(" + op1 + ")";
+ } else {
+ call = "CreateCondBr(" + op1 + ", " + op3 + ", " + op2 + ")";
+ }
+ } break;
+ case Instruction::Switch: {
+ auto swI = dyn_cast<SwitchInst>(I);
+ call = "CreateSwitch(" + op1 + ", " + op2 + ", " +
+ std::to_string(swI->getNumCases()) + ")";
+
+ std::string swVar = getNextVar();
+ // No need to save temporary var into symTable
+ OS << "auto " << swVar << " = " << builder << "." << call << ";\n";
+
+ for (auto c : swI->cases()) {
+ OS << swVar << "->addCase(" << getVal(c.getCaseValue()) << ", "
+ << getVal(c.getCaseSuccessor()) << ");\n";
+ }
+ return;
+ } break;
+ case Instruction::IndirectBr: {
+ auto inbrI = dyn_cast<IndirectBrInst>(I);
+ call = "CreateIndirectBr(" + op1 + ", " +
+ std::to_string(inbrI->getNumDestinations()) + ")";
+ std::string inbrVar = getNextVar();
+ OS << "auto " << inbrVar << " = " << builder << "." << call << ";\n";
+
+ for (auto c : inbrI->successors()) {
+ OS << inbrVar << "->addDestination(" << getVal(c) << ");\n";
+ }
+ } break;
+ case Instruction::Invoke: {
+ auto invI = dyn_cast<InvokeInst>(I);
+ std::string args = "{";
+ bool first = true;
+ for (unsigned i = 0; i < invI->arg_size(); ++i) {
+ if (!first)
+ args += ", ";
+ args += getVal(invI->getArgOperand(i));
+ first = false;
+ }
+ args += "}";
+ std::string funDecl = getNextVar();
+ OS << "auto " << funDecl << " = " << modName << "->getOrInsertFunction(\""
+ << I->getOperand(2)->getName() << "\", "
+ << getType(invI->getFunctionType()) << ");\n";
+ call = "CreateInvoke(" + funDecl + ", " + getVal(invI->getNormalDest()) +
+ ", " + getVal(invI->getUnwindDest()) + ", " + args + ")";
+ // TODO: Handle operand bundles
+ } break;
+ case Instruction::Resume: {
+ call = "CreateResume(" + op1 + ")";
+ } break;
+ case Instruction::Unreachable: {
+ call = "CreateUnreachable()";
+ } break;
+ case Instruction::CleanupRet: {
+ auto curI = dyn_cast<CleanupReturnInst>(I);
+ call =
+ "CreateCleanupRet(" + op1 + ", " + getVal(curI->getUnwindDest()) + ")";
+ } break;
+ case Instruction::CatchRet: {
+ call = "CreateCatchRet(" + op1 + ", " + op2 + ")";
+ } break;
+ case Instruction::CatchSwitch: {
+ auto swI = dyn_cast<CatchSwitchInst>(I);
+ call = "CreateCatchSwitch(" + op1 + ", " + op2 + ", " +
+ std::to_string(swI->getNumHandlers()) + ")";
+
+ std::string swVar = getVal(swI);
+ OS << "auto " << swVar << " = " << builder << "." << call << ";\n";
+ for (auto c : swI->handlers()) {
+ OS << swVar << "->addHandler(" << getVal(c) << ");\n";
+ }
+ return;
+ } break;
+ case Instruction::CallBr: {
+ auto callbrI = dyn_cast<CallBrInst>(I);
+ std::string inddest = "{";
+ bool first = true;
+ for (unsigned i = 0; i < callbrI->getNumIndirectDests(); ++i) {
+ if (!first)
+ inddest += ", ";
+ inddest += getVal(callbrI->getIndirectDest(i));
+ first = false;
+ }
+ inddest += "}";
+
+ std::string args = "{";
+ first = true;
+ for (unsigned i = 0; i < callbrI->arg_size(); ++i) {
+ if (!first)
+ args += ", ";
+ args += getVal(callbrI->getArgOperand(i));
+ first = false;
+ }
+ args += "}";
+ call = "CreateCallBr(" + getType(callbrI->getFunctionType()) + ", " +
+ getVal(I->getOperand(I->getNumOperands() - 1)) + ", " +
+ getVal(callbrI->getDefaultDest()) + ", " + inddest + ", " + args +
+ ")";
+ // TODO: Handle operand bundles
+ } break;
+ case Instruction::FNeg: {
+ call = "CreateFNeg(" + op1 + ")";
+ // TODO: Handle FPMathTag
+ } break;
+ case Instruction::Add: {
+ call = getBinArithOp("Add", op1, op2, I);
+ } break;
+ case Instruction::FAdd: {
+ call = getFPBinArithOp("FAdd", op1, op2, I);
+ } break;
+ case Instruction::Sub: {
+ call = getBinArithOp("Sub", op1, op2, I);
+ } break;
+ case Instruction::FSub: {
+ call = getFPBinArithOp("FSub", op1, op2, I);
+ } break;
+ case Instruction::Mul: {
+ call = getBinArithOp("Mul", op1, op2, I);
+ } break;
+ case Instruction::FMul: {
+ call = getFPBinArithOp("FMul", op1, op2, I);
+ } break;
+ case Instruction::UDiv: {
+ call = "CreateUDiv(" + op1 + ", " + op2 + ", \"\", " +
+ to_str(I->isExact()) + ")";
+ } break;
+ case Instruction::SDiv: {
+ call = "CreateSDiv(" + op1 + ", " + op2 + ", \"\", " +
+ to_str(I->isExact()) + ")";
+ } break;
+ case Instruction::FDiv: {
+ call = getFPBinArithOp("FDiv", op1, op2, I);
+ } break;
+ case Instruction::URem: {
+ call = "CreateURem(" + op1 + ", " + op2 + ")";
+ } break;
+ case Instruction::SRem: {
+ call = "CreateSRem(" + op1 + ", " + op2 + ")";
+ } break;
+ case Instruction::FRem: {
+ call = getFPBinArithOp("FRem", op1, op2, I);
+ } break;
+ case Instruction::Shl: {
+ call = getBinArithOp("Shl", op1, op2, I);
+ } break;
+ case Instruction::LShr: {
+ call = "CreateLShr(" + op1 + ", " + op2 + ", \"\", " +
+ to_str(I->isExact()) + ")";
+ } break;
+ case Instruction::AShr: {
+ call = "CreateAShr(" + op1 + ", " + op2 + ", \"\", " +
+ to_str(I->isExact()) + ")";
+ } break;
+ case Instruction::And: {
+ call = "CreateAnd(" + op1 + ", " + op2 + ")";
+ } break;
+ case Instruction::Or: {
+ call = "CreateOr(" + op1 + ", " + op2 + ")";
+ } break;
+ case Instruction::Xor: {
+ call = "CreateXor(" + op1 + ", " + op2 + ")";
+ } break;
+ case Instruction::Alloca: {
+ auto alI = dyn_cast<AllocaInst>(I);
+ auto val = alI->getArraySize();
+ auto valStr = val ? getVal(val) : "nullptr";
+ call = "CreateAlloca(" + getType(alI->getAllocatedType()) + ", " +
+ std::to_string(alI->getAddressSpace()) + ", " + valStr + ")";
+ } break;
+ case Instruction::Load: {
+ auto lI = dyn_cast<LoadInst>(I);
+ call = "CreateLoad(" + getType(I->getType()) + ", " + op1 + ", " +
+ to_str(lI->isVolatile()) + ")";
+ } break;
+ case Instruction::Store: {
+ auto sI = dyn_cast<StoreInst>(I);
+ call = "CreateStore(" + op1 + ", " + op2 + ", " + to_str(sI->isVolatile()) +
+ ")";
+ } break;
+ case Instruction::GetElementPtr: {
+ auto gepI = dyn_cast<GetElementPtrInst>(I);
+ std::string strList = llvmPrefix + "ArrayRef<" + llvmPrefix + "Value*>(";
+ if (I->getNumOperands() > 2)
+ strList += "{";
+ bool first = true;
+ for (unsigned i = 1; i < I->getNumOperands(); ++i) {
+ if (!first)
+ strList += ", ";
+ strList += getVal(I->getOperand(i));
+ first = false;
+ }
+ if (I->getNumOperands() > 2)
+ strList += "}";
+ strList += ")";
+ // TODO: For some structs the return type is ptr and it fails
+ call = "CreateGEP(" + getType(gepI->getResultElementType()) + ", " + op1 +
+ ", " + strList + ", \"\", " + to_str(gepI->isInBounds()) + ")";
+ } break;
+ case Instruction::Fence: {
+ auto fI = dyn_cast<FenceInst>(I);
+ call = "CreateFence(" + getAtomicOrdering(fI->getOrdering()) + ", " +
+ getSyncScopeID(fI->getSyncScopeID()) + ")";
+ } break;
+ case Instruction::AtomicCmpXchg: {
+ auto acmpxI = dyn_cast<AtomicCmpXchgInst>(I);
+ call = "CreateAtomicCmpXchg(" + op1 + ", " + op2 + ", " + op3 + ", Align(" +
+ std::to_string(acmpxI->getAlign().value()) + "), " +
+ getAtomicOrdering(acmpxI->getSuccessOrdering()) + ", " +
+ getAtomicOrdering(acmpxI->getFailureOrdering()) + ", " +
+ getSyncScopeID(acmpxI->getSyncScopeID()) + ")";
+ } break;
+ case Instruction::AtomicRMW: {
+ auto armwI = dyn_cast<AtomicRMWInst>(I);
+ call = "CreateAtomicRMW(" + getAtomicRMWOp(armwI->getOperation()) + ", " +
+ op1 + ", " + op2 + ", Align(" +
+ std::to_string(armwI->getAlign().value()) + "), " +
+ getAtomicOrdering(armwI->getOrdering()) + ", " +
+ getSyncScopeID(armwI->getSyncScopeID()) + ")";
+ } break;
+ case Instruction::Trunc: {
+ call = "CreateTrunc(" + op1 + ", " + getType(I->getType()) + ")";
+ } break;
+ case Instruction::ZExt: {
+ call = "CreateZExt(" + op1 + ", " + getType(I->getType()) + ", \"\", " +
+ to_str(I->hasNonNeg()) + ")";
+ } break;
+ case Instruction::SExt: {
+ call = "CreateSExt(" + op1 + ", " + getType(I->getType()) + ")";
+ } break;
+ case Instruction::FPToUI: {
+ call = "CreateFPToUI(" + op1 + ", " + getType(I->getType()) + ")";
+ } break;
+ case Instruction::FPToSI: {
+ call = "CreateFPToSI(" + op1 + ", " + getType(I->getType()) + ")";
+ } break;
+ case Instruction::UIToFP: {
+ call = "CreateUIToFP(" + op1 + ", " + getType(I->getType()) + ")";
+ } break;
+ case Instruction::SIToFP: {
+ call = "CreateSIToFP(" + op1 + ", " + getType(I->getType()) + ")";
+ } break;
+ case Instruction::FPTrunc: {
+ call = "CreateFPTrunc(" + op1 + ", " + getType(I->getType()) + ")";
+ } break;
+ case Instruction::FPExt: {
+ call = "CreateFPExt(" + op1 + ", " + getType(I->getType()) + ")";
+ } break;
+ case Instruction::PtrToInt: {
+ call = "CreatePtrToInt(" + op1 + ", " + getType(I->getType()) + ")";
+ } break;
+ case Instruction::IntToPtr: {
+ call = "CreateIntToPtr(" + op1 + ", " + getType(I->getType()) + ")";
+ } break;
+ case Instruction::BitCast: {
+ call = "CreateBitCast(" + op1 + ", " + getType(I->getType()) + ")";
+ } break;
+ case Instruction::AddrSpaceCast: {
+ call = "CreateAddrSpaceCast(" + op1 + ", " + getType(I->getType()) + ")";
+ } break;
+ case Instruction::CleanupPad: {
+ auto cupI = dyn_cast<CleanupPadInst>(I);
+ std::string argsStr = "{";
+ bool first = true;
+ for (unsigned i = 0; i < cupI->arg_size(); ++i) {
+ if (!first)
+ argsStr += ", ";
+ argsStr += getVal(cupI->getArgOperand(i));
+ first = false;
+ }
+ argsStr += "}";
+ call = "CreateCleanupPad(" + op1 + ", " + argsStr + ")";
+ } break;
+ case Instruction::CatchPad: {
+ auto capI = dyn_cast<CatchPadInst>(I);
+ std::string argsStr = "{";
+ bool first = true;
+ for (unsigned i = 0; i < capI->arg_size(); ++i) {
+ if (!first)
+ argsStr += ", ";
+ argsStr += getVal(capI->getArgOperand(i));
+ first = false;
+ }
+ argsStr += "}";
+ call = "CreateCatchPad(" + op1 + ", " + argsStr + ")";
+ } break;
+ case Instruction::ICmp: {
+ auto cmpI = dyn_cast<CmpInst>(I);
+ std::string cmpPredicate =
+ llvmPrefix + getCmpPredicate(cmpI->getPredicate());
+ call = "CreateICmp(" + cmpPredicate + ", " + op1 + ", " + op2 + ")";
+ } break;
+ case Instruction::FCmp: {
+ auto cmpI = dyn_cast<CmpInst>(I);
+ std::string cmpPredicate =
+ llvmPrefix + getCmpPredicate(cmpI->getPredicate());
+ call = "CreateFCmp(" + cmpPredicate + ", " + op1 + ", " + op2 + ")";
+ } break;
+ case Instruction::PHI: {
+ auto phI = dyn_cast<PHINode>(I);
+ call = "CreatePHI(" + getType(I->getType()) + ", " +
+ std::to_string(phI->getNumIncomingValues()) + ")";
+ std::string phVar = getVal(phI);
+ OS << "auto " << phVar << " = " << builder << "." << call << ";\n";
+
+ unsigned i = 0;
+ for (auto b : phI->blocks()) {
+ auto incVal = getVal(phI->getIncomingValue(i));
+ // Phis might contain incoming not yet defined variable in such case
+ // we save the line we would output here and output it after the
+ // whole function body was outputted
+ std::string line =
+ phVar + "->addIncoming(" + incVal + ", " + getVal(b) + ");\n";
+ phiIncomings.push_back(line);
+ ++i;
+ }
+ return;
+ } break;
+ case Instruction::Call: {
+ auto fcI = dyn_cast<CallBase>(I);
+ std::string argDecl = "";
+ if (fcI->arg_size() > 0) {
+ argDecl = getNextVar();
+ OS << "Value *" << argDecl << "[] = {";
+ bool isFirst = true;
+ for (unsigned i = 0; i < fcI->arg_size(); ++i) {
+ if (!isFirst)
+ OS << ", ";
+ OS << getVal(fcI->getArgOperand(i));
+ isFirst = false;
+ }
+ OS << "};\n";
+ }
+
+ /* TODO: Implement
+ std::string bundleDecl = "";
+ if (fcI->hasOperandBundles()) {
+ bundleDecl = getNextVar();
+ OS << "Value *" << bundleDecl << "[] = {";
+ isFirst = true;
+ for(unsigned i = 0; i < fcI->getNumOperandBundles(); ++i) {
+ if(!isFirst) OS << ", ";
+ // TODO: Probably create OperandBundleUse from the current gotten
+ from
+ // getOperandBundleAt and cast construct OperandBundleDefT with it,
+ // but this requires conversion of Inputs which are Use
+ OS << "...";
+ isFirst = false;
+ }
+ OS << "};\n";
+ }
+ */
+
+ auto fun = dyn_cast<Function>(I->getOperand(I->getNumOperands() - 1));
+ std::string funDecl = getNextVar();
+ if (!fun) {
+ fun = fcI->getCalledFunction();
+ }
+
+ if (!fun) {
+ assert(fcI->isIndirectCall() && "sanity check");
----------------
nvjle wrote:
I think this assertion will fail for inline asm-- need to account for `fcI->isInlineAsm()` as well.
https://github.com/llvm/llvm-project/pull/117129
More information about the llvm-commits
mailing list