|  | //===- Debugify.cpp - Attach synthetic debug info to everything -----------===// | 
|  | // | 
|  | //                     The LLVM Compiler Infrastructure | 
|  | // | 
|  | // This file is distributed under the University of Illinois Open Source | 
|  | // License. See LICENSE.TXT for details. | 
|  | // | 
|  | //===----------------------------------------------------------------------===// | 
|  | /// | 
|  | /// \file This pass attaches synthetic debug info to everything. It can be used | 
|  | /// to create targeted tests for debug info preservation. | 
|  | /// | 
|  | //===----------------------------------------------------------------------===// | 
|  |  | 
|  | #include "Debugify.h" | 
|  | #include "llvm/ADT/BitVector.h" | 
|  | #include "llvm/ADT/StringExtras.h" | 
|  | #include "llvm/IR/BasicBlock.h" | 
|  | #include "llvm/IR/Constants.h" | 
|  | #include "llvm/IR/DIBuilder.h" | 
|  | #include "llvm/IR/DebugInfo.h" | 
|  | #include "llvm/IR/Function.h" | 
|  | #include "llvm/IR/GlobalVariable.h" | 
|  | #include "llvm/IR/InstIterator.h" | 
|  | #include "llvm/IR/Instruction.h" | 
|  | #include "llvm/IR/Instructions.h" | 
|  | #include "llvm/IR/IntrinsicInst.h" | 
|  | #include "llvm/IR/Module.h" | 
|  | #include "llvm/IR/Type.h" | 
|  | #include "llvm/Pass.h" | 
|  | #include "llvm/Support/raw_ostream.h" | 
|  | #include "llvm/Transforms/IPO.h" | 
|  |  | 
|  | using namespace llvm; | 
|  |  | 
|  | namespace { | 
|  |  | 
|  | cl::opt<bool> Quiet("debugify-quiet", | 
|  | cl::desc("Suppress verbose debugify output")); | 
|  |  | 
|  | raw_ostream &dbg() { return Quiet ? nulls() : errs(); } | 
|  |  | 
|  | uint64_t getAllocSizeInBits(Module &M, Type *Ty) { | 
|  | return Ty->isSized() ? M.getDataLayout().getTypeAllocSizeInBits(Ty) : 0; | 
|  | } | 
|  |  | 
|  | bool isFunctionSkipped(Function &F) { | 
|  | return F.isDeclaration() || !F.hasExactDefinition(); | 
|  | } | 
|  |  | 
|  | /// Find the basic block's terminating instruction. | 
|  | /// | 
|  | /// Special care is needed to handle musttail and deopt calls, as these behave | 
|  | /// like (but are in fact not) terminators. | 
|  | Instruction *findTerminatingInstruction(BasicBlock &BB) { | 
|  | if (auto *I = BB.getTerminatingMustTailCall()) | 
|  | return I; | 
|  | if (auto *I = BB.getTerminatingDeoptimizeCall()) | 
|  | return I; | 
|  | return BB.getTerminator(); | 
|  | } | 
|  |  | 
|  | bool applyDebugifyMetadata(Module &M, | 
|  | iterator_range<Module::iterator> Functions, | 
|  | StringRef Banner) { | 
|  | // Skip modules with debug info. | 
|  | if (M.getNamedMetadata("llvm.dbg.cu")) { | 
|  | dbg() << Banner << "Skipping module with debug info\n"; | 
|  | return false; | 
|  | } | 
|  |  | 
|  | DIBuilder DIB(M); | 
|  | LLVMContext &Ctx = M.getContext(); | 
|  |  | 
|  | // Get a DIType which corresponds to Ty. | 
|  | DenseMap<uint64_t, DIType *> TypeCache; | 
|  | auto getCachedDIType = [&](Type *Ty) -> DIType * { | 
|  | uint64_t Size = getAllocSizeInBits(M, Ty); | 
|  | DIType *&DTy = TypeCache[Size]; | 
|  | if (!DTy) { | 
|  | std::string Name = "ty" + utostr(Size); | 
|  | DTy = DIB.createBasicType(Name, Size, dwarf::DW_ATE_unsigned); | 
|  | } | 
|  | return DTy; | 
|  | }; | 
|  |  | 
|  | unsigned NextLine = 1; | 
|  | unsigned NextVar = 1; | 
|  | auto File = DIB.createFile(M.getName(), "/"); | 
|  | auto CU = DIB.createCompileUnit(dwarf::DW_LANG_C, File, "debugify", | 
|  | /*isOptimized=*/true, "", 0); | 
|  |  | 
|  | // Visit each instruction. | 
|  | for (Function &F : Functions) { | 
|  | if (isFunctionSkipped(F)) | 
|  | continue; | 
|  |  | 
|  | auto SPType = DIB.createSubroutineType(DIB.getOrCreateTypeArray(None)); | 
|  | DISubprogram::DISPFlags SPFlags = | 
|  | DISubprogram::SPFlagDefinition | DISubprogram::SPFlagOptimized; | 
|  | if (F.hasPrivateLinkage() || F.hasInternalLinkage()) | 
|  | SPFlags |= DISubprogram::SPFlagLocalToUnit; | 
|  | auto SP = DIB.createFunction(CU, F.getName(), F.getName(), File, NextLine, | 
|  | SPType, NextLine, DINode::FlagZero, SPFlags); | 
|  | F.setSubprogram(SP); | 
|  | for (BasicBlock &BB : F) { | 
|  | // Attach debug locations. | 
|  | for (Instruction &I : BB) | 
|  | I.setDebugLoc(DILocation::get(Ctx, NextLine++, 1, SP)); | 
|  |  | 
|  | // Inserting debug values into EH pads can break IR invariants. | 
|  | if (BB.isEHPad()) | 
|  | continue; | 
|  |  | 
|  | // Find the terminating instruction, after which no debug values are | 
|  | // attached. | 
|  | Instruction *LastInst = findTerminatingInstruction(BB); | 
|  | assert(LastInst && "Expected basic block with a terminator"); | 
|  |  | 
|  | // Maintain an insertion point which can't be invalidated when updates | 
|  | // are made. | 
|  | BasicBlock::iterator InsertPt = BB.getFirstInsertionPt(); | 
|  | assert(InsertPt != BB.end() && "Expected to find an insertion point"); | 
|  | Instruction *InsertBefore = &*InsertPt; | 
|  |  | 
|  | // Attach debug values. | 
|  | for (Instruction *I = &*BB.begin(); I != LastInst; I = I->getNextNode()) { | 
|  | // Skip void-valued instructions. | 
|  | if (I->getType()->isVoidTy()) | 
|  | continue; | 
|  |  | 
|  | // Phis and EH pads must be grouped at the beginning of the block. | 
|  | // Only advance the insertion point when we finish visiting these. | 
|  | if (!isa<PHINode>(I) && !I->isEHPad()) | 
|  | InsertBefore = I->getNextNode(); | 
|  |  | 
|  | std::string Name = utostr(NextVar++); | 
|  | const DILocation *Loc = I->getDebugLoc().get(); | 
|  | auto LocalVar = DIB.createAutoVariable(SP, Name, File, Loc->getLine(), | 
|  | getCachedDIType(I->getType()), | 
|  | /*AlwaysPreserve=*/true); | 
|  | DIB.insertDbgValueIntrinsic(I, LocalVar, DIB.createExpression(), Loc, | 
|  | InsertBefore); | 
|  | } | 
|  | } | 
|  | DIB.finalizeSubprogram(SP); | 
|  | } | 
|  | DIB.finalize(); | 
|  |  | 
|  | // Track the number of distinct lines and variables. | 
|  | NamedMDNode *NMD = M.getOrInsertNamedMetadata("llvm.debugify"); | 
|  | auto *IntTy = Type::getInt32Ty(Ctx); | 
|  | auto addDebugifyOperand = [&](unsigned N) { | 
|  | NMD->addOperand(MDNode::get( | 
|  | Ctx, ValueAsMetadata::getConstant(ConstantInt::get(IntTy, N)))); | 
|  | }; | 
|  | addDebugifyOperand(NextLine - 1); // Original number of lines. | 
|  | addDebugifyOperand(NextVar - 1);  // Original number of variables. | 
|  | assert(NMD->getNumOperands() == 2 && | 
|  | "llvm.debugify should have exactly 2 operands!"); | 
|  |  | 
|  | // Claim that this synthetic debug info is valid. | 
|  | StringRef DIVersionKey = "Debug Info Version"; | 
|  | if (!M.getModuleFlag(DIVersionKey)) | 
|  | M.addModuleFlag(Module::Warning, DIVersionKey, DEBUG_METADATA_VERSION); | 
|  |  | 
|  | return true; | 
|  | } | 
|  |  | 
|  | /// Return true if a mis-sized diagnostic is issued for \p DVI. | 
|  | bool diagnoseMisSizedDbgValue(Module &M, DbgValueInst *DVI) { | 
|  | // The size of a dbg.value's value operand should match the size of the | 
|  | // variable it corresponds to. | 
|  | // | 
|  | // TODO: This, along with a check for non-null value operands, should be | 
|  | // promoted to verifier failures. | 
|  | Value *V = DVI->getValue(); | 
|  | if (!V) | 
|  | return false; | 
|  |  | 
|  | // For now, don't try to interpret anything more complicated than an empty | 
|  | // DIExpression. Eventually we should try to handle OP_deref and fragments. | 
|  | if (DVI->getExpression()->getNumElements()) | 
|  | return false; | 
|  |  | 
|  | Type *Ty = V->getType(); | 
|  | uint64_t ValueOperandSize = getAllocSizeInBits(M, Ty); | 
|  | Optional<uint64_t> DbgVarSize = DVI->getFragmentSizeInBits(); | 
|  | if (!ValueOperandSize || !DbgVarSize) | 
|  | return false; | 
|  |  | 
|  | bool HasBadSize = false; | 
|  | if (Ty->isIntegerTy()) { | 
|  | auto Signedness = DVI->getVariable()->getSignedness(); | 
|  | if (Signedness && *Signedness == DIBasicType::Signedness::Signed) | 
|  | HasBadSize = ValueOperandSize < *DbgVarSize; | 
|  | } else { | 
|  | HasBadSize = ValueOperandSize != *DbgVarSize; | 
|  | } | 
|  |  | 
|  | if (HasBadSize) { | 
|  | dbg() << "ERROR: dbg.value operand has size " << ValueOperandSize | 
|  | << ", but its variable has size " << *DbgVarSize << ": "; | 
|  | DVI->print(dbg()); | 
|  | dbg() << "\n"; | 
|  | } | 
|  | return HasBadSize; | 
|  | } | 
|  |  | 
|  | bool checkDebugifyMetadata(Module &M, | 
|  | iterator_range<Module::iterator> Functions, | 
|  | StringRef NameOfWrappedPass, StringRef Banner, | 
|  | bool Strip, DebugifyStatsMap *StatsMap) { | 
|  | // Skip modules without debugify metadata. | 
|  | NamedMDNode *NMD = M.getNamedMetadata("llvm.debugify"); | 
|  | if (!NMD) { | 
|  | dbg() << Banner << "Skipping module without debugify metadata\n"; | 
|  | return false; | 
|  | } | 
|  |  | 
|  | auto getDebugifyOperand = [&](unsigned Idx) -> unsigned { | 
|  | return mdconst::extract<ConstantInt>(NMD->getOperand(Idx)->getOperand(0)) | 
|  | ->getZExtValue(); | 
|  | }; | 
|  | assert(NMD->getNumOperands() == 2 && | 
|  | "llvm.debugify should have exactly 2 operands!"); | 
|  | unsigned OriginalNumLines = getDebugifyOperand(0); | 
|  | unsigned OriginalNumVars = getDebugifyOperand(1); | 
|  | bool HasErrors = false; | 
|  |  | 
|  | // Track debug info loss statistics if able. | 
|  | DebugifyStatistics *Stats = nullptr; | 
|  | if (StatsMap && !NameOfWrappedPass.empty()) | 
|  | Stats = &StatsMap->operator[](NameOfWrappedPass); | 
|  |  | 
|  | BitVector MissingLines{OriginalNumLines, true}; | 
|  | BitVector MissingVars{OriginalNumVars, true}; | 
|  | for (Function &F : Functions) { | 
|  | if (isFunctionSkipped(F)) | 
|  | continue; | 
|  |  | 
|  | // Find missing lines. | 
|  | for (Instruction &I : instructions(F)) { | 
|  | if (isa<DbgValueInst>(&I)) | 
|  | continue; | 
|  |  | 
|  | auto DL = I.getDebugLoc(); | 
|  | if (DL && DL.getLine() != 0) { | 
|  | MissingLines.reset(DL.getLine() - 1); | 
|  | continue; | 
|  | } | 
|  |  | 
|  | if (!DL) { | 
|  | dbg() << "ERROR: Instruction with empty DebugLoc in function "; | 
|  | dbg() << F.getName() << " --"; | 
|  | I.print(dbg()); | 
|  | dbg() << "\n"; | 
|  | HasErrors = true; | 
|  | } | 
|  | } | 
|  |  | 
|  | // Find missing variables and mis-sized debug values. | 
|  | for (Instruction &I : instructions(F)) { | 
|  | auto *DVI = dyn_cast<DbgValueInst>(&I); | 
|  | if (!DVI) | 
|  | continue; | 
|  |  | 
|  | unsigned Var = ~0U; | 
|  | (void)to_integer(DVI->getVariable()->getName(), Var, 10); | 
|  | assert(Var <= OriginalNumVars && "Unexpected name for DILocalVariable"); | 
|  | bool HasBadSize = diagnoseMisSizedDbgValue(M, DVI); | 
|  | if (!HasBadSize) | 
|  | MissingVars.reset(Var - 1); | 
|  | HasErrors |= HasBadSize; | 
|  | } | 
|  | } | 
|  |  | 
|  | // Print the results. | 
|  | for (unsigned Idx : MissingLines.set_bits()) | 
|  | dbg() << "WARNING: Missing line " << Idx + 1 << "\n"; | 
|  |  | 
|  | for (unsigned Idx : MissingVars.set_bits()) | 
|  | dbg() << "WARNING: Missing variable " << Idx + 1 << "\n"; | 
|  |  | 
|  | // Update DI loss statistics. | 
|  | if (Stats) { | 
|  | Stats->NumDbgLocsExpected += OriginalNumLines; | 
|  | Stats->NumDbgLocsMissing += MissingLines.count(); | 
|  | Stats->NumDbgValuesExpected += OriginalNumVars; | 
|  | Stats->NumDbgValuesMissing += MissingVars.count(); | 
|  | } | 
|  |  | 
|  | dbg() << Banner; | 
|  | if (!NameOfWrappedPass.empty()) | 
|  | dbg() << " [" << NameOfWrappedPass << "]"; | 
|  | dbg() << ": " << (HasErrors ? "FAIL" : "PASS") << '\n'; | 
|  |  | 
|  | // Strip the Debugify Metadata if required. | 
|  | if (Strip) { | 
|  | StripDebugInfo(M); | 
|  | M.eraseNamedMetadata(NMD); | 
|  | return true; | 
|  | } | 
|  |  | 
|  | return false; | 
|  | } | 
|  |  | 
|  | /// ModulePass for attaching synthetic debug info to everything, used with the | 
|  | /// legacy module pass manager. | 
|  | struct DebugifyModulePass : public ModulePass { | 
|  | bool runOnModule(Module &M) override { | 
|  | return applyDebugifyMetadata(M, M.functions(), "ModuleDebugify: "); | 
|  | } | 
|  |  | 
|  | DebugifyModulePass() : ModulePass(ID) {} | 
|  |  | 
|  | void getAnalysisUsage(AnalysisUsage &AU) const override { | 
|  | AU.setPreservesAll(); | 
|  | } | 
|  |  | 
|  | static char ID; // Pass identification. | 
|  | }; | 
|  |  | 
|  | /// FunctionPass for attaching synthetic debug info to instructions within a | 
|  | /// single function, used with the legacy module pass manager. | 
|  | struct DebugifyFunctionPass : public FunctionPass { | 
|  | bool runOnFunction(Function &F) override { | 
|  | Module &M = *F.getParent(); | 
|  | auto FuncIt = F.getIterator(); | 
|  | return applyDebugifyMetadata(M, make_range(FuncIt, std::next(FuncIt)), | 
|  | "FunctionDebugify: "); | 
|  | } | 
|  |  | 
|  | DebugifyFunctionPass() : FunctionPass(ID) {} | 
|  |  | 
|  | void getAnalysisUsage(AnalysisUsage &AU) const override { | 
|  | AU.setPreservesAll(); | 
|  | } | 
|  |  | 
|  | static char ID; // Pass identification. | 
|  | }; | 
|  |  | 
|  | /// ModulePass for checking debug info inserted by -debugify, used with the | 
|  | /// legacy module pass manager. | 
|  | struct CheckDebugifyModulePass : public ModulePass { | 
|  | bool runOnModule(Module &M) override { | 
|  | return checkDebugifyMetadata(M, M.functions(), NameOfWrappedPass, | 
|  | "CheckModuleDebugify", Strip, StatsMap); | 
|  | } | 
|  |  | 
|  | CheckDebugifyModulePass(bool Strip = false, StringRef NameOfWrappedPass = "", | 
|  | DebugifyStatsMap *StatsMap = nullptr) | 
|  | : ModulePass(ID), Strip(Strip), NameOfWrappedPass(NameOfWrappedPass), | 
|  | StatsMap(StatsMap) {} | 
|  |  | 
|  | void getAnalysisUsage(AnalysisUsage &AU) const override { | 
|  | AU.setPreservesAll(); | 
|  | } | 
|  |  | 
|  | static char ID; // Pass identification. | 
|  |  | 
|  | private: | 
|  | bool Strip; | 
|  | StringRef NameOfWrappedPass; | 
|  | DebugifyStatsMap *StatsMap; | 
|  | }; | 
|  |  | 
|  | /// FunctionPass for checking debug info inserted by -debugify-function, used | 
|  | /// with the legacy module pass manager. | 
|  | struct CheckDebugifyFunctionPass : public FunctionPass { | 
|  | bool runOnFunction(Function &F) override { | 
|  | Module &M = *F.getParent(); | 
|  | auto FuncIt = F.getIterator(); | 
|  | return checkDebugifyMetadata(M, make_range(FuncIt, std::next(FuncIt)), | 
|  | NameOfWrappedPass, "CheckFunctionDebugify", | 
|  | Strip, StatsMap); | 
|  | } | 
|  |  | 
|  | CheckDebugifyFunctionPass(bool Strip = false, | 
|  | StringRef NameOfWrappedPass = "", | 
|  | DebugifyStatsMap *StatsMap = nullptr) | 
|  | : FunctionPass(ID), Strip(Strip), NameOfWrappedPass(NameOfWrappedPass), | 
|  | StatsMap(StatsMap) {} | 
|  |  | 
|  | void getAnalysisUsage(AnalysisUsage &AU) const override { | 
|  | AU.setPreservesAll(); | 
|  | } | 
|  |  | 
|  | static char ID; // Pass identification. | 
|  |  | 
|  | private: | 
|  | bool Strip; | 
|  | StringRef NameOfWrappedPass; | 
|  | DebugifyStatsMap *StatsMap; | 
|  | }; | 
|  |  | 
|  | } // end anonymous namespace | 
|  |  | 
|  | void exportDebugifyStats(llvm::StringRef Path, const DebugifyStatsMap &Map) { | 
|  | std::error_code EC; | 
|  | raw_fd_ostream OS{Path, EC}; | 
|  | if (EC) { | 
|  | errs() << "Could not open file: " << EC.message() << ", " << Path << '\n'; | 
|  | return; | 
|  | } | 
|  |  | 
|  | OS << "Pass Name" << ',' << "# of missing debug values" << ',' | 
|  | << "# of missing locations" << ',' << "Missing/Expected value ratio" << ',' | 
|  | << "Missing/Expected location ratio" << '\n'; | 
|  | for (const auto &Entry : Map) { | 
|  | StringRef Pass = Entry.first; | 
|  | DebugifyStatistics Stats = Entry.second; | 
|  |  | 
|  | OS << Pass << ',' << Stats.NumDbgValuesMissing << ',' | 
|  | << Stats.NumDbgLocsMissing << ',' << Stats.getMissingValueRatio() << ',' | 
|  | << Stats.getEmptyLocationRatio() << '\n'; | 
|  | } | 
|  | } | 
|  |  | 
|  | ModulePass *createDebugifyModulePass() { return new DebugifyModulePass(); } | 
|  |  | 
|  | FunctionPass *createDebugifyFunctionPass() { | 
|  | return new DebugifyFunctionPass(); | 
|  | } | 
|  |  | 
|  | PreservedAnalyses NewPMDebugifyPass::run(Module &M, ModuleAnalysisManager &) { | 
|  | applyDebugifyMetadata(M, M.functions(), "ModuleDebugify: "); | 
|  | return PreservedAnalyses::all(); | 
|  | } | 
|  |  | 
|  | ModulePass *createCheckDebugifyModulePass(bool Strip, | 
|  | StringRef NameOfWrappedPass, | 
|  | DebugifyStatsMap *StatsMap) { | 
|  | return new CheckDebugifyModulePass(Strip, NameOfWrappedPass, StatsMap); | 
|  | } | 
|  |  | 
|  | FunctionPass *createCheckDebugifyFunctionPass(bool Strip, | 
|  | StringRef NameOfWrappedPass, | 
|  | DebugifyStatsMap *StatsMap) { | 
|  | return new CheckDebugifyFunctionPass(Strip, NameOfWrappedPass, StatsMap); | 
|  | } | 
|  |  | 
|  | PreservedAnalyses NewPMCheckDebugifyPass::run(Module &M, | 
|  | ModuleAnalysisManager &) { | 
|  | checkDebugifyMetadata(M, M.functions(), "", "CheckModuleDebugify", false, | 
|  | nullptr); | 
|  | return PreservedAnalyses::all(); | 
|  | } | 
|  |  | 
|  | char DebugifyModulePass::ID = 0; | 
|  | static RegisterPass<DebugifyModulePass> DM("debugify", | 
|  | "Attach debug info to everything"); | 
|  |  | 
|  | char CheckDebugifyModulePass::ID = 0; | 
|  | static RegisterPass<CheckDebugifyModulePass> | 
|  | CDM("check-debugify", "Check debug info from -debugify"); | 
|  |  | 
|  | char DebugifyFunctionPass::ID = 0; | 
|  | static RegisterPass<DebugifyFunctionPass> DF("debugify-function", | 
|  | "Attach debug info to a function"); | 
|  |  | 
|  | char CheckDebugifyFunctionPass::ID = 0; | 
|  | static RegisterPass<CheckDebugifyFunctionPass> | 
|  | CDF("check-debugify-function", "Check debug info from -debugify-function"); |