[llvm] [Instrumentor] Add Instrumentor pass (PR #138958)
Matt Arsenault via llvm-commits
llvm-commits at lists.llvm.org
Wed May 21 01:38:38 PDT 2025
================
@@ -0,0 +1,645 @@
+//===-- Instrumentor.cpp - Highly configurable instrumentation pass -------===//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+//===----------------------------------------------------------------------===//
+//
+//===----------------------------------------------------------------------===//
+
+#include "llvm/Transforms/IPO/Instrumentor.h"
+#include "llvm/Transforms/IPO/InstrumentorConfigFile.h"
+
+#include "llvm/ADT/PostOrderIterator.h"
+#include "llvm/ADT/SmallPtrSet.h"
+#include "llvm/ADT/SmallVector.h"
+#include "llvm/ADT/StringExtras.h"
+#include "llvm/ADT/StringMap.h"
+#include "llvm/ADT/iterator.h"
+#include "llvm/IR/Constant.h"
+#include "llvm/IR/Constants.h"
+#include "llvm/IR/DataLayout.h"
+#include "llvm/IR/DebugInfoMetadata.h"
+#include "llvm/IR/Function.h"
+#include "llvm/IR/IRBuilder.h"
+#include "llvm/IR/InstrTypes.h"
+#include "llvm/IR/Instruction.h"
+#include "llvm/IR/Instructions.h"
+#include "llvm/IR/IntrinsicInst.h"
+#include "llvm/IR/Intrinsics.h"
+#include "llvm/IR/LLVMContext.h"
+#include "llvm/IR/Metadata.h"
+#include "llvm/IR/Module.h"
+#include "llvm/IR/PassManager.h"
+#include "llvm/IR/Verifier.h"
+#include "llvm/IRReader/IRReader.h"
+#include "llvm/Support/CommandLine.h"
+#include "llvm/Support/ErrorHandling.h"
+#include "llvm/Support/Regex.h"
+
+#include <cassert>
+#include <cstdint>
+#include <functional>
+#include <iterator>
+#include <string>
+#include <system_error>
+#include <type_traits>
+
+using namespace llvm;
+using namespace llvm::instrumentor;
+
+#define DEBUG_TYPE "instrumentor"
+
+/// Command line option naming the JSON file the instrumentor configuration is
+/// written to; the default value is the empty string.
+static cl::opt<std::string>
+    WriteJSONConfig("instrumentor-write-config-file",
+                    cl::desc("Write the instrumentor configuration into the "
+                             "specified JSON file"),
+                    cl::init(""));
+
+/// Command line option naming the JSON file the instrumentor configuration is
+/// read from; the default value is the empty string.
+static cl::opt<std::string>
+    ReadJSONConfig("instrumentor-read-config-file",
+                   cl::desc("Read the instrumentor configuration from the "
+                            "specified JSON file"),
+                   cl::init(""));
+
+namespace {
+
+/// Make sure \p IRB carries a debug location. If none is set and the function
+/// containing the insertion block has a subprogram, a line 0, column 0
+/// location scoped to that subprogram is installed.
+template <typename IRBuilderTy> void ensureDbgLoc(IRBuilderTy &IRB) {
+  if (!IRB.getCurrentDebugLocation()) {
+    auto *InsertBB = IRB.GetInsertBlock();
+    auto *SubProg = InsertBB->getParent()->getSubprogram();
+    if (SubProg)
+      IRB.SetCurrentDebugLocation(
+          DILocation::get(InsertBB->getContext(), 0, 0, SubProg));
+  }
+}
+
+/// Try to convert \p V to type \p Ty with casts that reinterpret or
+/// zero-extend its bits; \p DL supplies the bit sizes that are compared.
+///
+/// - A null \p V yields the all-ones constant of type \p Ty.
+/// - \p V is returned unchanged if it already has type \p Ty, if it is of
+///   aggregate type, or if the conversion would shrink it while
+///   \p AllowTruncate is false.
+/// - With \p AllowTruncate set, a wider \p V is narrowed to an integer of the
+///   requested width first and then converted to \p Ty.
+///
+/// Callers must be prepared for the result to not have type \p Ty.
+template <typename IRBTy>
+Value *tryToCast(IRBTy &IRB, Value *V, Type *Ty, const DataLayout &DL,
+                 bool AllowTruncate = false) {
+  if (!V)
+    return Constant::getAllOnesValue(Ty);
+  auto *VTy = V->getType();
+  if (VTy == Ty || VTy->isAggregateType())
+    return V;
+
+  auto RequestedSize = DL.getTypeSizeInBits(Ty);
+  auto ValueSize = DL.getTypeSizeInBits(VTy);
+  if (RequestedSize < ValueSize) {
+    if (!AllowTruncate)
+      return V;
+    // CreateIntCast only accepts integer operands, so pointer and floating
+    // point values are reinterpreted as an equally sized integer before the
+    // truncation.
+    Value *IntV = V;
+    if (!VTy->isIntegerTy())
+      IntV = IRB.CreateBitOrPointerCast(V, IRB.getIntNTy(ValueSize));
+    Value *Narrowed = IRB.CreateIntCast(IntV, IRB.getIntNTy(RequestedSize),
+                                        /*IsSigned=*/false);
+    return tryToCast(IRB, Narrowed, Ty, DL, AllowTruncate);
+  }
+
+  if (VTy->isPointerTy() && Ty->isPointerTy())
+    return IRB.CreatePointerBitCastOrAddrSpaceCast(V, Ty);
+  if (VTy->isIntegerTy() && Ty->isIntegerTy())
+    return IRB.CreateIntCast(V, Ty, /*IsSigned=*/false);
+  if (VTy->isFloatingPointTy() && Ty->isIntOrPtrTy()) {
+    // Reinterpret the floating point bits as an integer of the same width,
+    // whatever that width is, and let the recursion finish the conversion.
+    Value *Bits = IRB.CreateBitCast(V, IRB.getIntNTy(ValueSize));
+    return tryToCast(IRB, Bits, Ty, DL, AllowTruncate);
+  }
+  return IRB.CreateBitOrPointerCast(V, Ty);
+}
+
+/// Create the integer constant of type \p IT that holds \p Val.
+template <typename Ty> Constant *getCI(Type *IT, Ty Val) {
+  Constant *IntConst = ConstantInt::get(IT, Val);
+  return IntConst;
+}
+
+/// Driver that applies the instrumentation opportunities of an
+/// InstrumentationConfig to the functions of a single module.
+class InstrumentorImpl final {
+public:
+  /// Bind the driver to \p M and let \p IConf populate itself via \p IIRB.
+  InstrumentorImpl(InstrumentationConfig &IConf, InstrumentorIRBuilderTy &IIRB,
+                   Module &M, FunctionAnalysisManager &FAM)
+      : IConf(IConf), M(M), FAM(FAM), IIRB(IIRB) {
+    IConf.populate(IIRB);
+  }
+
+  /// Public entry point: instrument the module and report whether anything
+  /// was changed.
+  bool instrument();
+
+private:
+  /// Decide whether the module's target is to be instrumented at all.
+  bool shouldInstrumentTarget();
+
+  /// Decide whether \p Fn is to be instrumented.
+  bool shouldInstrumentFunction(Function &Fn);
+
+  /// Instrument a single instruction; returns true on change.
+  bool instrumentInstruction(Instruction &I, InstrumentationCaches &ICaches);
+
+  /// Instrument all instructions of \p Fn; returns true on change.
+  bool instrumentFunction(Function &Fn);
+
+  /// Enabled opportunities to apply before an instruction, keyed by opcode.
+  DenseMap<unsigned, InstrumentationOpportunity *> InstChoicesPRE;
+
+  /// Enabled opportunities to apply after an instruction, keyed by opcode.
+  DenseMap<unsigned, InstrumentationOpportunity *> InstChoicesPOST;
+
+  /// The instrumentor configuration.
+  InstrumentationConfig &IConf;
+
+  /// The module being instrumented.
+  Module &M;
+
+  /// The function analysis manager handed to the constructor.
+  FunctionAnalysisManager &FAM;
+
+  /// A special IR builder that keeps track of the inserted instructions.
+  InstrumentorIRBuilderTy &IIRB;
+};
+
+} // end anonymous namespace
+
+/// Check whether the module's target triple is selected for instrumentation.
+///
+/// AMDGPU and NVPTX triples are governed by the GPU switch of the
+/// configuration, every other triple by the host switch. A non-empty target
+/// regex must additionally match the triple string; a regex that fails to
+/// parse emits a warning and disables instrumentation.
+bool InstrumentorImpl::shouldInstrumentTarget() {
+  const Triple &TT = M.getTargetTriple();
+  const bool TargetsGPU = TT.isAMDGPU() || TT.isNVPTX();
+
+  bool PatternAccepts = true;
+  const auto Pattern = IConf.TargetRegex->getString();
+  if (!Pattern.empty()) {
+    llvm::Regex Matcher(Pattern);
+    std::string ParseError;
+    if (!Matcher.isValid(ParseError)) {
+      errs() << "WARNING: failed to parse target regex: " << ParseError
+             << "\n";
+      return false;
+    }
+    PatternAccepts = Matcher.match(TT.str());
+  }
+
+  // Exactly one of the two switches is consulted, depending on the target.
+  const bool TargetEnabled =
+      TargetsGPU ? IConf.GPUEnabled->getBool() : IConf.HostEnabled->getBool();
+  return TargetEnabled && PatternAccepts;
+}
+
+/// Decide whether \p Fn gets instrumented: declarations never are, functions
+/// carrying the "instrument" attribute always are, and any other function is
+/// instrumented unless its name starts with the configured runtime name.
+bool InstrumentorImpl::shouldInstrumentFunction(Function &Fn) {
+  if (Fn.isDeclaration())
+    return false;
+  if (Fn.hasFnAttribute("instrument"))
+    return true;
+  const bool HasRuntimePrefix = Fn.getName().starts_with(IConf.getRTName());
+  return !HasRuntimePrefix;
+}
+
+/// Apply the enabled PRE and POST instrumentation opportunities registered
+/// for the opcode of \p I.
+///
+/// Instructions recorded in IIRB.NewInsts are left alone. PRE opportunities
+/// insert in front of \p I, POST opportunities in front of the next non-debug
+/// instruction. \p ICaches is forwarded to the opportunities. Returns true if
+/// any opportunity reported a change.
+bool InstrumentorImpl::instrumentInstruction(Instruction &I,
+                                             InstrumentationCaches &ICaches) {
+  bool Changed = false;
+
+  // Skip instrumentation instructions.
+  if (IIRB.NewInsts.contains(&I))
+    return Changed;
+
+  // Count epochs eagerly.
+  ++IIRB.Epoche;
+
+  Value *IPtr = &I;
+  if (auto *IO = InstChoicesPRE.lookup(I.getOpcode())) {
+    IIRB.IRB.SetInsertPoint(&I);
+    ensureDbgLoc(IIRB.IRB);
+    Changed |= bool(IO->instrument(IPtr, IConf, IIRB, ICaches));
+  }
+
+  if (auto *IO = InstChoicesPOST.lookup(I.getOpcode())) {
+    // The last instruction of a block has no following instruction, so there
+    // is no insertion point behind it; skip POST instrumentation instead of
+    // handing a null pointer to SetInsertPoint.
+    if (Instruction *NextI = I.getNextNonDebugInstruction()) {
+      IIRB.IRB.SetInsertPoint(NextI);
+      ensureDbgLoc(IIRB.IRB);
+      Changed |= bool(IO->instrument(IPtr, IConf, IIRB, ICaches));
+    }
+  }
+  IIRB.returnAllocas();
+
+  return Changed;
+}
+
+/// Instrument every instruction of \p Fn, visiting the basic blocks in
+/// reverse post order. Functions rejected by shouldInstrumentFunction are
+/// left untouched. Returns true if any instruction was changed.
+bool InstrumentorImpl::instrumentFunction(Function &Fn) {
+  if (!shouldInstrumentFunction(Fn))
+    return false;
+
+  bool AnyChange = false;
+  // One set of caches is shared by all instructions of the function.
+  InstrumentationCaches ICaches;
+  ReversePostOrderTraversal<Function *> RPOT(&Fn);
+  for (BasicBlock *BB : RPOT) {
+    for (Instruction &Inst : *BB)
+      AnyChange |= instrumentInstruction(Inst, ICaches);
+  }
+  return AnyChange;
+}
+
+/// Instrument the whole module. Nothing happens if the target is not selected
+/// for instrumentation; otherwise the enabled PRE and POST instruction
+/// opportunities are indexed by opcode and every function is processed.
+/// Returns true if any function was changed.
+bool InstrumentorImpl::instrument() {
+  if (!shouldInstrumentTarget())
+    return false;
+
+  // Record each enabled opportunity under the opcode it applies to.
+  auto IndexEnabled = [](auto &&Choices, auto &ByOpcode) {
+    for (auto &Entry : Choices) {
+      auto *Opportunity = Entry.second;
+      if (Opportunity->Enabled)
+        ByOpcode[Opportunity->getOpcode()] = Opportunity;
+    }
+  };
+  IndexEnabled(IConf.IChoices[InstrumentationLocation::INSTRUCTION_PRE],
+               InstChoicesPRE);
+  IndexEnabled(IConf.IChoices[InstrumentationLocation::INSTRUCTION_POST],
+               InstChoicesPOST);
+
+  bool AnyChange = false;
+  for (Function &Fn : M)
+    AnyChange |= instrumentFunction(Fn);
+  return AnyChange;
+}
+
+/// Run the instrumentor on \p M with the given configuration and builder.
+///
+/// The implementation object is created first, which populates \p IConf. If
+/// the configuration asks for a config file to be read and reading fails, the
+/// module is left untouched. Otherwise the configuration is written out and
+/// the module is instrumented; all analyses are preserved only if nothing
+/// changed.
+PreservedAnalyses InstrumentorPass::run(Module &M, FunctionAnalysisManager &FAM,
+                                        InstrumentationConfig &IConf,
+                                        InstrumentorIRBuilderTy &IIRB) {
+  InstrumentorImpl Impl(IConf, IIRB, M, FAM);
+
+  if (IConf.ReadConfig) {
+    const bool ConfigLoaded = readConfigFromJSON(IConf, ReadJSONConfig);
+    if (!ConfigLoaded)
+      return PreservedAnalyses::all();
+  }
+
+  writeConfigToJSON(IConf, WriteJSONConfig);
+
+  return Impl.instrument() ? PreservedAnalyses::none()
+                           : PreservedAnalyses::all();
+}
+
+PreservedAnalyses InstrumentorPass::run(Module &M, ModuleAnalysisManager &MAM) {
+ auto &FAM = MAM.getResult<FunctionAnalysisManagerModuleProxy>(M).getManager();
+ InstrumentationConfig *IConf =
+ UserIConf ? UserIConf : new InstrumentationConfig();
+ InstrumentorIRBuilderTy *IIRB =
+ UserIIRB ? UserIIRB : new InstrumentorIRBuilderTy(M, FAM);
+
+ auto PA = run(M, FAM, *IConf, *IIRB);
+
+ if (!UserIIRB)
+ delete IIRB;
+ if (!UserIConf)
+ delete IConf;
----------------
arsenm wrote:
Use unique_ptr
https://github.com/llvm/llvm-project/pull/138958
More information about the llvm-commits
mailing list