//===- Debugify.cpp - Attach synthetic debug info to everything -----------===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// /// /// \file This pass attaches synthetic debug info to everything. It can be used /// to create targeted tests for debug info preservation. /// //===----------------------------------------------------------------------===// #include "Debugify.h" #include "llvm/ADT/BitVector.h" #include "llvm/ADT/StringExtras.h" #include "llvm/IR/BasicBlock.h" #include "llvm/IR/Constants.h" #include "llvm/IR/DIBuilder.h" #include "llvm/IR/DebugInfo.h" #include "llvm/IR/Function.h" #include "llvm/IR/GlobalVariable.h" #include "llvm/IR/InstIterator.h" #include "llvm/IR/Instruction.h" #include "llvm/IR/Instructions.h" #include "llvm/IR/IntrinsicInst.h" #include "llvm/IR/Module.h" #include "llvm/IR/Type.h" #include "llvm/Pass.h" #include "llvm/Support/raw_ostream.h" #include "llvm/Transforms/IPO.h" using namespace llvm; namespace { cl::opt<bool> Quiet("debugify-quiet", cl::desc("Suppress verbose debugify output")); raw_ostream &dbg() { return Quiet ? nulls() : errs(); } uint64_t getAllocSizeInBits(Module &M, Type *Ty) { return Ty->isSized() ? M.getDataLayout().getTypeAllocSizeInBits(Ty) : 0; } bool isFunctionSkipped(Function &F) { return F.isDeclaration() || !F.hasExactDefinition(); } /// Find the basic block's terminating instruction. /// /// Special care is needed to handle musttail and deopt calls, as these behave /// like (but are in fact not) terminators. Instruction *findTerminatingInstruction(BasicBlock &BB) { if (auto *I = BB.getTerminatingMustTailCall()) return I; if (auto *I = BB.getTerminatingDeoptimizeCall()) return I; return BB.getTerminator(); } bool applyDebugifyMetadata(Module &M, iterator_range<Module::iterator> Functions, StringRef Banner) { // Skip modules with debug info. if (M.getNamedMetadata("llvm.dbg.cu")) { dbg() << Banner << "Skipping module with debug info\n"; return false; } DIBuilder DIB(M); LLVMContext &Ctx = M.getContext(); // Get a DIType which corresponds to Ty. DenseMap<uint64_t, DIType *> TypeCache; auto getCachedDIType = [&](Type *Ty) -> DIType * { uint64_t Size = getAllocSizeInBits(M, Ty); DIType *&DTy = TypeCache[Size]; if (!DTy) { std::string Name = "ty" + utostr(Size); DTy = DIB.createBasicType(Name, Size, dwarf::DW_ATE_unsigned); } return DTy; }; unsigned NextLine = 1; unsigned NextVar = 1; auto File = DIB.createFile(M.getName(), "/"); auto CU = DIB.createCompileUnit(dwarf::DW_LANG_C, File, "debugify", /*isOptimized=*/true, "", 0); // Visit each instruction. for (Function &F : Functions) { if (isFunctionSkipped(F)) continue; auto SPType = DIB.createSubroutineType(DIB.getOrCreateTypeArray(None)); bool IsLocalToUnit = F.hasPrivateLinkage() || F.hasInternalLinkage(); auto SP = DIB.createFunction(CU, F.getName(), F.getName(), File, NextLine, SPType, IsLocalToUnit, /*isDefinition=*/true, NextLine, DINode::FlagZero, /*isOptimized=*/true); F.setSubprogram(SP); for (BasicBlock &BB : F) { // Attach debug locations. for (Instruction &I : BB) I.setDebugLoc(DILocation::get(Ctx, NextLine++, 1, SP)); // Inserting debug values into EH pads can break IR invariants. if (BB.isEHPad()) continue; // Find the terminating instruction, after which no debug values are // attached. Instruction *LastInst = findTerminatingInstruction(BB); assert(LastInst && "Expected basic block with a terminator"); // Maintain an insertion point which can't be invalidated when updates // are made. BasicBlock::iterator InsertPt = BB.getFirstInsertionPt(); assert(InsertPt != BB.end() && "Expected to find an insertion point"); Instruction *InsertBefore = &*InsertPt; // Attach debug values. for (Instruction *I = &*BB.begin(); I != LastInst; I = I->getNextNode()) { // Skip void-valued instructions. if (I->getType()->isVoidTy()) continue; // Phis and EH pads must be grouped at the beginning of the block. // Only advance the insertion point when we finish visiting these. if (!isa<PHINode>(I) && !I->isEHPad()) InsertBefore = I->getNextNode(); std::string Name = utostr(NextVar++); const DILocation *Loc = I->getDebugLoc().get(); auto LocalVar = DIB.createAutoVariable(SP, Name, File, Loc->getLine(), getCachedDIType(I->getType()), /*AlwaysPreserve=*/true); DIB.insertDbgValueIntrinsic(I, LocalVar, DIB.createExpression(), Loc, InsertBefore); } } DIB.finalizeSubprogram(SP); } DIB.finalize(); // Track the number of distinct lines and variables. NamedMDNode *NMD = M.getOrInsertNamedMetadata("llvm.debugify"); auto *IntTy = Type::getInt32Ty(Ctx); auto addDebugifyOperand = [&](unsigned N) { NMD->addOperand(MDNode::get( Ctx, ValueAsMetadata::getConstant(ConstantInt::get(IntTy, N)))); }; addDebugifyOperand(NextLine - 1); // Original number of lines. addDebugifyOperand(NextVar - 1); // Original number of variables. assert(NMD->getNumOperands() == 2 && "llvm.debugify should have exactly 2 operands!"); // Claim that this synthetic debug info is valid. StringRef DIVersionKey = "Debug Info Version"; if (!M.getModuleFlag(DIVersionKey)) M.addModuleFlag(Module::Warning, DIVersionKey, DEBUG_METADATA_VERSION); return true; } /// Return true if a mis-sized diagnostic is issued for \p DVI. bool diagnoseMisSizedDbgValue(Module &M, DbgValueInst *DVI) { // The size of a dbg.value's value operand should match the size of the // variable it corresponds to. // // TODO: This, along with a check for non-null value operands, should be // promoted to verifier failures. Value *V = DVI->getValue(); if (!V) return false; // For now, don't try to interpret anything more complicated than an empty // DIExpression. Eventually we should try to handle OP_deref and fragments. if (DVI->getExpression()->getNumElements()) return false; Type *Ty = V->getType(); uint64_t ValueOperandSize = getAllocSizeInBits(M, Ty); Optional<uint64_t> DbgVarSize = DVI->getFragmentSizeInBits(); if (!ValueOperandSize || !DbgVarSize) return false; bool HasBadSize = false; if (Ty->isIntegerTy()) { auto Signedness = DVI->getVariable()->getSignedness(); if (Signedness && *Signedness == DIBasicType::Signedness::Signed) HasBadSize = ValueOperandSize < *DbgVarSize; } else { HasBadSize = ValueOperandSize != *DbgVarSize; } if (HasBadSize) { dbg() << "ERROR: dbg.value operand has size " << ValueOperandSize << ", but its variable has size " << *DbgVarSize << ": "; DVI->print(dbg()); dbg() << "\n"; } return HasBadSize; } bool checkDebugifyMetadata(Module &M, iterator_range<Module::iterator> Functions, StringRef NameOfWrappedPass, StringRef Banner, bool Strip, DebugifyStatsMap *StatsMap) { // Skip modules without debugify metadata. NamedMDNode *NMD = M.getNamedMetadata("llvm.debugify"); if (!NMD) { dbg() << Banner << "Skipping module without debugify metadata\n"; return false; } auto getDebugifyOperand = [&](unsigned Idx) -> unsigned { return mdconst::extract<ConstantInt>(NMD->getOperand(Idx)->getOperand(0)) ->getZExtValue(); }; assert(NMD->getNumOperands() == 2 && "llvm.debugify should have exactly 2 operands!"); unsigned OriginalNumLines = getDebugifyOperand(0); unsigned OriginalNumVars = getDebugifyOperand(1); bool HasErrors = false; // Track debug info loss statistics if able. DebugifyStatistics *Stats = nullptr; if (StatsMap && !NameOfWrappedPass.empty()) Stats = &StatsMap->operator[](NameOfWrappedPass); BitVector MissingLines{OriginalNumLines, true}; BitVector MissingVars{OriginalNumVars, true}; for (Function &F : Functions) { if (isFunctionSkipped(F)) continue; // Find missing lines. for (Instruction &I : instructions(F)) { if (isa<DbgValueInst>(&I)) continue; auto DL = I.getDebugLoc(); if (DL && DL.getLine() != 0) { MissingLines.reset(DL.getLine() - 1); continue; } if (!DL) { dbg() << "ERROR: Instruction with empty DebugLoc in function "; dbg() << F.getName() << " --"; I.print(dbg()); dbg() << "\n"; HasErrors = true; } } // Find missing variables and mis-sized debug values. for (Instruction &I : instructions(F)) { auto *DVI = dyn_cast<DbgValueInst>(&I); if (!DVI) continue; unsigned Var = ~0U; (void)to_integer(DVI->getVariable()->getName(), Var, 10); assert(Var <= OriginalNumVars && "Unexpected name for DILocalVariable"); bool HasBadSize = diagnoseMisSizedDbgValue(M, DVI); if (!HasBadSize) MissingVars.reset(Var - 1); HasErrors |= HasBadSize; } } // Print the results. for (unsigned Idx : MissingLines.set_bits()) dbg() << "WARNING: Missing line " << Idx + 1 << "\n"; for (unsigned Idx : MissingVars.set_bits()) dbg() << "WARNING: Missing variable " << Idx + 1 << "\n"; // Update DI loss statistics. if (Stats) { Stats->NumDbgLocsExpected += OriginalNumLines; Stats->NumDbgLocsMissing += MissingLines.count(); Stats->NumDbgValuesExpected += OriginalNumVars; Stats->NumDbgValuesMissing += MissingVars.count(); } dbg() << Banner; if (!NameOfWrappedPass.empty()) dbg() << " [" << NameOfWrappedPass << "]"; dbg() << ": " << (HasErrors ? "FAIL" : "PASS") << '\n'; // Strip the Debugify Metadata if required. if (Strip) { StripDebugInfo(M); M.eraseNamedMetadata(NMD); return true; } return false; } /// ModulePass for attaching synthetic debug info to everything, used with the /// legacy module pass manager. struct DebugifyModulePass : public ModulePass { bool runOnModule(Module &M) override { return applyDebugifyMetadata(M, M.functions(), "ModuleDebugify: "); } DebugifyModulePass() : ModulePass(ID) {} void getAnalysisUsage(AnalysisUsage &AU) const override { AU.setPreservesAll(); } static char ID; // Pass identification. }; /// FunctionPass for attaching synthetic debug info to instructions within a /// single function, used with the legacy module pass manager. struct DebugifyFunctionPass : public FunctionPass { bool runOnFunction(Function &F) override { Module &M = *F.getParent(); auto FuncIt = F.getIterator(); return applyDebugifyMetadata(M, make_range(FuncIt, std::next(FuncIt)), "FunctionDebugify: "); } DebugifyFunctionPass() : FunctionPass(ID) {} void getAnalysisUsage(AnalysisUsage &AU) const override { AU.setPreservesAll(); } static char ID; // Pass identification. }; /// ModulePass for checking debug info inserted by -debugify, used with the /// legacy module pass manager. struct CheckDebugifyModulePass : public ModulePass { bool runOnModule(Module &M) override { return checkDebugifyMetadata(M, M.functions(), NameOfWrappedPass, "CheckModuleDebugify", Strip, StatsMap); } CheckDebugifyModulePass(bool Strip = false, StringRef NameOfWrappedPass = "", DebugifyStatsMap *StatsMap = nullptr) : ModulePass(ID), Strip(Strip), NameOfWrappedPass(NameOfWrappedPass), StatsMap(StatsMap) {} void getAnalysisUsage(AnalysisUsage &AU) const override { AU.setPreservesAll(); } static char ID; // Pass identification. private: bool Strip; StringRef NameOfWrappedPass; DebugifyStatsMap *StatsMap; }; /// FunctionPass for checking debug info inserted by -debugify-function, used /// with the legacy module pass manager. struct CheckDebugifyFunctionPass : public FunctionPass { bool runOnFunction(Function &F) override { Module &M = *F.getParent(); auto FuncIt = F.getIterator(); return checkDebugifyMetadata(M, make_range(FuncIt, std::next(FuncIt)), NameOfWrappedPass, "CheckFunctionDebugify", Strip, StatsMap); } CheckDebugifyFunctionPass(bool Strip = false, StringRef NameOfWrappedPass = "", DebugifyStatsMap *StatsMap = nullptr) : FunctionPass(ID), Strip(Strip), NameOfWrappedPass(NameOfWrappedPass), StatsMap(StatsMap) {} void getAnalysisUsage(AnalysisUsage &AU) const override { AU.setPreservesAll(); } static char ID; // Pass identification. private: bool Strip; StringRef NameOfWrappedPass; DebugifyStatsMap *StatsMap; }; } // end anonymous namespace void exportDebugifyStats(llvm::StringRef Path, const DebugifyStatsMap &Map) { std::error_code EC; raw_fd_ostream OS{Path, EC}; if (EC) { errs() << "Could not open file: " << EC.message() << ", " << Path << '\n'; return; } OS << "Pass Name" << ',' << "# of missing debug values" << ',' << "# of missing locations" << ',' << "Missing/Expected value ratio" << ',' << "Missing/Expected location ratio" << '\n'; for (const auto &Entry : Map) { StringRef Pass = Entry.first; DebugifyStatistics Stats = Entry.second; OS << Pass << ',' << Stats.NumDbgValuesMissing << ',' << Stats.NumDbgLocsMissing << ',' << Stats.getMissingValueRatio() << ',' << Stats.getEmptyLocationRatio() << '\n'; } } ModulePass *createDebugifyModulePass() { return new DebugifyModulePass(); } FunctionPass *createDebugifyFunctionPass() { return new DebugifyFunctionPass(); } PreservedAnalyses NewPMDebugifyPass::run(Module &M, ModuleAnalysisManager &) { applyDebugifyMetadata(M, M.functions(), "ModuleDebugify: "); return PreservedAnalyses::all(); } ModulePass *createCheckDebugifyModulePass(bool Strip, StringRef NameOfWrappedPass, DebugifyStatsMap *StatsMap) { return new CheckDebugifyModulePass(Strip, NameOfWrappedPass, StatsMap); } FunctionPass *createCheckDebugifyFunctionPass(bool Strip, StringRef NameOfWrappedPass, DebugifyStatsMap *StatsMap) { return new CheckDebugifyFunctionPass(Strip, NameOfWrappedPass, StatsMap); } PreservedAnalyses NewPMCheckDebugifyPass::run(Module &M, ModuleAnalysisManager &) { checkDebugifyMetadata(M, M.functions(), "", "CheckModuleDebugify", false, nullptr); return PreservedAnalyses::all(); } char DebugifyModulePass::ID = 0; static RegisterPass<DebugifyModulePass> DM("debugify", "Attach debug info to everything"); char CheckDebugifyModulePass::ID = 0; static RegisterPass<CheckDebugifyModulePass> CDM("check-debugify", "Check debug info from -debugify"); char DebugifyFunctionPass::ID = 0; static RegisterPass<DebugifyFunctionPass> DF("debugify-function", "Attach debug info to a function"); char CheckDebugifyFunctionPass::ID = 0; static RegisterPass<CheckDebugifyFunctionPass> CDF("check-debugify-function", "Check debug info from -debugify-function");