//===- GraphBuilder.cpp -----------------------------------------*- C++ -*-===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// #include "GraphBuilder.h" #include "llvm/BinaryFormat/ELF.h" #include "llvm/MC/MCAsmInfo.h" #include "llvm/MC/MCContext.h" #include "llvm/MC/MCDisassembler/MCDisassembler.h" #include "llvm/MC/MCInst.h" #include "llvm/MC/MCInstPrinter.h" #include "llvm/MC/MCInstrAnalysis.h" #include "llvm/MC/MCInstrDesc.h" #include "llvm/MC/MCInstrInfo.h" #include "llvm/MC/MCObjectFileInfo.h" #include "llvm/MC/MCRegisterInfo.h" #include "llvm/MC/MCSubtargetInfo.h" #include "llvm/Object/Binary.h" #include "llvm/Object/COFF.h" #include "llvm/Object/ELFObjectFile.h" #include "llvm/Object/ObjectFile.h" #include "llvm/Support/Casting.h" #include "llvm/Support/CommandLine.h" #include "llvm/Support/Error.h" #include "llvm/Support/MemoryBuffer.h" #include "llvm/Support/TargetRegistry.h" #include "llvm/Support/TargetSelect.h" #include "llvm/Support/raw_ostream.h" using Instr = llvm::cfi_verify::FileAnalysis::Instr; namespace llvm { namespace cfi_verify { unsigned long long SearchLengthForUndef; unsigned long long SearchLengthForConditionalBranch; static cl::opt<unsigned long long, true> SearchLengthForUndefArg( "search-length-undef", cl::desc("Specify the maximum amount of instructions " "to inspect when searching for an undefined " "instruction from a conditional branch."), cl::location(SearchLengthForUndef), cl::init(2)); static cl::opt<unsigned long long, true> SearchLengthForConditionalBranchArg( "search-length-cb", cl::desc("Specify the maximum amount of instructions " "to inspect when searching for a conditional " "branch from an indirect control flow."), cl::location(SearchLengthForConditionalBranch), cl::init(20)); std::vector<uint64_t> GraphResult::flattenAddress(uint64_t Address) const { std::vector<uint64_t> Addresses; auto It = IntermediateNodes.find(Address); Addresses.push_back(Address); while (It != IntermediateNodes.end()) { Addresses.push_back(It->second); It = IntermediateNodes.find(It->second); } return Addresses; } void printPairToDOT(const FileAnalysis &Analysis, raw_ostream &OS, uint64_t From, uint64_t To) { OS << " \"" << format_hex(From, 2) << ": "; Analysis.printInstruction(Analysis.getInstructionOrDie(From), OS); OS << "\" -> \"" << format_hex(To, 2) << ": "; Analysis.printInstruction(Analysis.getInstructionOrDie(To), OS); OS << "\"\n"; } void GraphResult::printToDOT(const FileAnalysis &Analysis, raw_ostream &OS) const { std::map<uint64_t, uint64_t> SortedIntermediateNodes( IntermediateNodes.begin(), IntermediateNodes.end()); OS << "digraph graph_" << format_hex(BaseAddress, 2) << " {\n"; for (const auto &KV : SortedIntermediateNodes) printPairToDOT(Analysis, OS, KV.first, KV.second); for (auto &BranchNode : ConditionalBranchNodes) { for (auto &V : {BranchNode.Target, BranchNode.Fallthrough}) printPairToDOT(Analysis, OS, BranchNode.Address, V); } OS << "}\n"; } GraphResult GraphBuilder::buildFlowGraph(const FileAnalysis &Analysis, uint64_t Address) { GraphResult Result; Result.BaseAddress = Address; DenseSet<uint64_t> OpenedNodes; const auto &IndirectInstructions = Analysis.getIndirectInstructions(); if (IndirectInstructions.find(Address) == IndirectInstructions.end()) return Result; buildFlowGraphImpl(Analysis, OpenedNodes, Result, Address, 0); return Result; } void GraphBuilder::buildFlowsToUndefined(const FileAnalysis &Analysis, GraphResult &Result, ConditionalBranchNode &BranchNode, const Instr &BranchInstrMeta) { assert(SearchLengthForUndef > 0 && "Search length for undefined flow must be greater than zero."); // Start setting up the next node in the block. uint64_t NextAddress = 0; const Instr *NextMetaPtr; // Find out the next instruction in the block and add it to the new // node. if (BranchNode.Target && !BranchNode.Fallthrough) { // We know the target of the branch, find the fallthrough. NextMetaPtr = Analysis.getNextInstructionSequential(BranchInstrMeta); if (!NextMetaPtr) { errs() << "Failed to get next instruction from " << format_hex(BranchNode.Address, 2) << ".\n"; return; } NextAddress = NextMetaPtr->VMAddress; BranchNode.Fallthrough = NextMetaPtr->VMAddress; // Add the new node to the branch head. } else if (BranchNode.Fallthrough && !BranchNode.Target) { // We already know the fallthrough, evaluate the target. uint64_t Target; if (!Analysis.getMCInstrAnalysis()->evaluateBranch( BranchInstrMeta.Instruction, BranchInstrMeta.VMAddress, BranchInstrMeta.InstructionSize, Target)) { errs() << "Failed to get branch target for conditional branch at address " << format_hex(BranchInstrMeta.VMAddress, 2) << ".\n"; return; } // Resolve the meta pointer for the target of this branch. NextMetaPtr = Analysis.getInstruction(Target); if (!NextMetaPtr) { errs() << "Failed to find instruction at address " << format_hex(Target, 2) << ".\n"; return; } NextAddress = Target; BranchNode.Target = NextMetaPtr->VMAddress; // Add the new node to the branch head. } else { errs() << "ControlBranchNode supplied to buildFlowsToUndefined should " "provide Target xor Fallthrough.\n"; return; } uint64_t CurrentAddress = NextAddress; const Instr *CurrentMetaPtr = NextMetaPtr; // Now the branch head has been set properly, complete the rest of the block. for (uint64_t i = 1; i < SearchLengthForUndef; ++i) { // Check to see whether the block should die. if (Analysis.isCFITrap(*CurrentMetaPtr)) { BranchNode.CFIProtection = true; return; } // Find the metadata of the next instruction. NextMetaPtr = Analysis.getDefiniteNextInstruction(*CurrentMetaPtr); if (!NextMetaPtr) return; // Setup the next node. NextAddress = NextMetaPtr->VMAddress; // Add this as an intermediate. Result.IntermediateNodes[CurrentAddress] = NextAddress; // Move the 'current' pointers to the new tail of the block. CurrentMetaPtr = NextMetaPtr; CurrentAddress = NextAddress; } // Final check of the last thing we added to the block. if (Analysis.isCFITrap(*CurrentMetaPtr)) BranchNode.CFIProtection = true; } void GraphBuilder::buildFlowGraphImpl(const FileAnalysis &Analysis, DenseSet<uint64_t> &OpenedNodes, GraphResult &Result, uint64_t Address, uint64_t Depth) { // If we've exceeded the flow length, terminate. if (Depth >= SearchLengthForConditionalBranch) { Result.OrphanedNodes.push_back(Address); return; } // Ensure this flow is acyclic. if (OpenedNodes.count(Address)) Result.OrphanedNodes.push_back(Address); // If this flow is already explored, stop here. if (Result.IntermediateNodes.count(Address)) return; // Get the metadata for the node instruction. const auto &InstrMetaPtr = Analysis.getInstruction(Address); if (!InstrMetaPtr) { errs() << "Failed to build flow graph for instruction at address " << format_hex(Address, 2) << ".\n"; Result.OrphanedNodes.push_back(Address); return; } const auto &ChildMeta = *InstrMetaPtr; OpenedNodes.insert(Address); std::set<const Instr *> CFCrossRefs = Analysis.getDirectControlFlowXRefs(ChildMeta); bool HasValidCrossRef = false; for (const auto *ParentMetaPtr : CFCrossRefs) { assert(ParentMetaPtr && "CFCrossRefs returned nullptr."); const auto &ParentMeta = *ParentMetaPtr; const auto &ParentDesc = Analysis.getMCInstrInfo()->get(ParentMeta.Instruction.getOpcode()); if (!ParentDesc.mayAffectControlFlow(ParentMeta.Instruction, *Analysis.getRegisterInfo())) { // If this cross reference doesn't affect CF, continue the graph. buildFlowGraphImpl(Analysis, OpenedNodes, Result, ParentMeta.VMAddress, Depth + 1); Result.IntermediateNodes[ParentMeta.VMAddress] = Address; HasValidCrossRef = true; continue; } // Call instructions are not valid in the upwards traversal. if (ParentDesc.isCall()) { Result.IntermediateNodes[ParentMeta.VMAddress] = Address; Result.OrphanedNodes.push_back(ParentMeta.VMAddress); continue; } // Evaluate the branch target to ascertain whether this XRef is the result // of a fallthrough or the target of a branch. uint64_t BranchTarget; if (!Analysis.getMCInstrAnalysis()->evaluateBranch( ParentMeta.Instruction, ParentMeta.VMAddress, ParentMeta.InstructionSize, BranchTarget)) { errs() << "Failed to evaluate branch target for instruction at address " << format_hex(ParentMeta.VMAddress, 2) << ".\n"; Result.IntermediateNodes[ParentMeta.VMAddress] = Address; Result.OrphanedNodes.push_back(ParentMeta.VMAddress); continue; } // Allow unconditional branches to be part of the upwards traversal. if (ParentDesc.isUnconditionalBranch()) { // Ensures that the unconditional branch is actually an XRef to the child. if (BranchTarget != Address) { errs() << "Control flow to " << format_hex(Address, 2) << ", but target resolution of " << format_hex(ParentMeta.VMAddress, 2) << " is not this address?\n"; Result.IntermediateNodes[ParentMeta.VMAddress] = Address; Result.OrphanedNodes.push_back(ParentMeta.VMAddress); continue; } buildFlowGraphImpl(Analysis, OpenedNodes, Result, ParentMeta.VMAddress, Depth + 1); Result.IntermediateNodes[ParentMeta.VMAddress] = Address; HasValidCrossRef = true; continue; } // Ensure that any unknown CFs are caught. if (!ParentDesc.isConditionalBranch()) { errs() << "Unknown control flow encountered when building graph at " << format_hex(Address, 2) << "\n."; Result.IntermediateNodes[ParentMeta.VMAddress] = Address; Result.OrphanedNodes.push_back(ParentMeta.VMAddress); continue; } // Only direct conditional branches should be present at this point. Setup // a conditional branch node and build flows to the ud2. ConditionalBranchNode BranchNode; BranchNode.Address = ParentMeta.VMAddress; BranchNode.Target = 0; BranchNode.Fallthrough = 0; BranchNode.CFIProtection = false; BranchNode.IndirectCFIsOnTargetPath = (BranchTarget == Address); if (BranchTarget == Address) BranchNode.Target = Address; else BranchNode.Fallthrough = Address; HasValidCrossRef = true; buildFlowsToUndefined(Analysis, Result, BranchNode, ParentMeta); Result.ConditionalBranchNodes.push_back(BranchNode); } if (!HasValidCrossRef) Result.OrphanedNodes.push_back(Address); OpenedNodes.erase(Address); } } // namespace cfi_verify } // namespace llvm