//===- ObjectLinker.cpp ---------------------------------------------------===// // // The MCLinker Project // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// #include <mcld/Object/ObjectLinker.h> #include <mcld/LinkerConfig.h> #include <mcld/Module.h> #include <mcld/InputTree.h> #include <mcld/IRBuilder.h> #include <mcld/LD/LDSection.h> #include <mcld/LD/LDContext.h> #include <mcld/LD/Archive.h> #include <mcld/LD/ArchiveReader.h> #include <mcld/LD/ObjectReader.h> #include <mcld/LD/DynObjReader.h> #include <mcld/LD/GroupReader.h> #include <mcld/LD/BinaryReader.h> #include <mcld/LD/ObjectWriter.h> #include <mcld/LD/ResolveInfo.h> #include <mcld/LD/RelocData.h> #include <mcld/LD/Relocator.h> #include <mcld/Support/RealPath.h> #include <mcld/Support/MemoryArea.h> #include <mcld/Support/MsgHandling.h> #include <mcld/Support/DefSymParser.h> #include <mcld/Target/TargetLDBackend.h> #include <mcld/Fragment/FragmentLinker.h> #include <mcld/Object/ObjectBuilder.h> #include <llvm/Support/Casting.h> using namespace llvm; using namespace mcld; ObjectLinker::ObjectLinker(const LinkerConfig& pConfig, TargetLDBackend& pLDBackend) : m_Config(pConfig), m_pLinker(NULL), m_pModule(NULL), m_pBuilder(NULL), m_LDBackend(pLDBackend), m_pObjectReader(NULL), m_pDynObjReader(NULL), m_pArchiveReader(NULL), m_pGroupReader(NULL), m_pBinaryReader(NULL), m_pWriter(NULL) { } ObjectLinker::~ObjectLinker() { delete m_pLinker; delete m_pObjectReader; delete m_pDynObjReader; delete m_pArchiveReader; delete m_pGroupReader; delete m_pBinaryReader; delete m_pWriter; } void ObjectLinker::setup(Module& pModule, IRBuilder& pBuilder) { m_pModule = &pModule; m_pBuilder = &pBuilder; // set up soname if (!m_Config.options().soname().empty()) { m_pModule->setName(m_Config.options().soname()); } } /// initFragmentLinker - initialize FragmentLinker /// Connect all components with FragmentLinker bool ObjectLinker::initFragmentLinker() { if (NULL == m_pLinker) { m_pLinker = new FragmentLinker(m_Config, *m_pModule, m_LDBackend); } // initialize the readers and writers // Because constructor can not be failed, we initalize all readers and // writers outside the FragmentLinker constructors. m_pObjectReader = m_LDBackend.createObjectReader(*m_pBuilder); m_pArchiveReader = m_LDBackend.createArchiveReader(*m_pModule); m_pDynObjReader = m_LDBackend.createDynObjReader(*m_pBuilder); m_pBinaryReader = m_LDBackend.createBinaryReader(*m_pBuilder); m_pGroupReader = new GroupReader(*m_pModule, *m_pObjectReader, *m_pDynObjReader, *m_pArchiveReader, *m_pBinaryReader); m_pWriter = m_LDBackend.createWriter(); // initialize Relocator m_LDBackend.initRelocator(); return true; } /// initStdSections - initialize standard sections bool ObjectLinker::initStdSections() { ObjectBuilder builder(m_Config, *m_pModule); // initialize standard sections if (!m_LDBackend.initStdSections(builder)) return false; // initialize target-dependent sections m_LDBackend.initTargetSections(*m_pModule, builder); return true; } void ObjectLinker::normalize() { // ----- set up inputs ----- // Module::input_iterator input, inEnd = m_pModule->input_end(); for (input = m_pModule->input_begin(); input!=inEnd; ++input) { // is a group node if (isGroup(input)) { getGroupReader()->readGroup(input, m_pBuilder->getInputBuilder(), m_Config); continue; } // already got type - for example, bitcode or external OIR (object // intermediate representation) if ((*input)->type() == Input::Script || (*input)->type() == Input::Archive || (*input)->type() == Input::External) continue; if (Input::Object == (*input)->type()) { m_pModule->getObjectList().push_back(*input); continue; } if (Input::DynObj == (*input)->type()) { m_pModule->getLibraryList().push_back(*input); continue; } // read input as a binary file if (m_Config.options().isBinaryInput()) { (*input)->setType(Input::Object); getBinaryReader()->readBinary(**input); m_pModule->getObjectList().push_back(*input); } // is a relocatable object file else if (getObjectReader()->isMyFormat(**input)) { (*input)->setType(Input::Object); getObjectReader()->readHeader(**input); getObjectReader()->readSections(**input); getObjectReader()->readSymbols(**input); m_pModule->getObjectList().push_back(*input); } // is a shared object file else if (getDynObjReader()->isMyFormat(**input)) { (*input)->setType(Input::DynObj); getDynObjReader()->readHeader(**input); getDynObjReader()->readSymbols(**input); m_pModule->getLibraryList().push_back(*input); } // is an archive else if (getArchiveReader()->isMyFormat(**input)) { (*input)->setType(Input::Archive); Archive archive(**input, m_pBuilder->getInputBuilder()); getArchiveReader()->readArchive(archive); if(archive.numOfObjectMember() > 0) { m_pModule->getInputTree().merge<InputTree::Inclusive>(input, archive.inputs()); } } else { fatal(diag::err_unrecognized_input_file) << (*input)->path() << m_Config.targets().triple().str(); } } // end of for } bool ObjectLinker::linkable() const { // check we have input and output files if (m_pModule->getInputTree().empty()) { error(diag::err_no_inputs); return false; } // can not mix -static with shared objects Module::const_lib_iterator lib, libEnd = m_pModule->lib_end(); for (lib = m_pModule->lib_begin(); lib != libEnd; ++lib) { if((*lib)->attribute()->isStatic()) { error(diag::err_mixed_shared_static_objects) << (*lib)->name() << (*lib)->path(); return false; } } // --nmagic and --omagic options lead to static executable program. // These options turn off page alignment of sections. Because the // sections are not aligned to pages, these sections can not contain any // exported functions. Also, because the two options disable linking // against shared libraries, the output absolutely does not call outside // functions. if (m_Config.options().nmagic() && !m_Config.isCodeStatic()) { error(diag::err_nmagic_not_static); return false; } if (m_Config.options().omagic() && !m_Config.isCodeStatic()) { error(diag::err_omagic_not_static); return false; } return true; } /// readRelocations - read all relocation entries /// /// All symbols should be read and resolved before this function. bool ObjectLinker::readRelocations() { // Bitcode is read by the other path. This function reads relocation sections // in object files. mcld::InputTree::bfs_iterator input, inEnd = m_pModule->getInputTree().bfs_end(); for (input=m_pModule->getInputTree().bfs_begin(); input!=inEnd; ++input) { if ((*input)->type() == Input::Object && (*input)->hasMemArea()) { if (!getObjectReader()->readRelocations(**input)) return false; } // ignore the other kinds of files. } return true; } /// mergeSections - put allinput sections into output sections bool ObjectLinker::mergeSections() { ObjectBuilder builder(m_Config, *m_pModule); Module::obj_iterator obj, objEnd = m_pModule->obj_end(); for (obj = m_pModule->obj_begin(); obj != objEnd; ++obj) { LDContext::sect_iterator sect, sectEnd = (*obj)->context()->sectEnd(); for (sect = (*obj)->context()->sectBegin(); sect != sectEnd; ++sect) { switch ((*sect)->kind()) { // Some *INPUT sections should not be merged. case LDFileFormat::Ignore: case LDFileFormat::Null: case LDFileFormat::Relocation: case LDFileFormat::NamePool: case LDFileFormat::Group: case LDFileFormat::StackNote: // skip continue; case LDFileFormat::Target: if (!m_LDBackend.mergeSection(*m_pModule, **sect)) { error(diag::err_cannot_merge_section) << (*sect)->name() << (*obj)->name(); return false; } break; case LDFileFormat::EhFrame: { if (!(*sect)->hasEhFrame()) continue; // skip LDSection* out_sect = NULL; if (NULL == (out_sect = builder.MergeSection(**sect))) { error(diag::err_cannot_merge_section) << (*sect)->name() << (*obj)->name(); return false; } if (!m_LDBackend.updateSectionFlags(*out_sect, **sect)) { error(diag::err_cannot_merge_section) << (*sect)->name() << (*obj)->name(); return false; } break; } default: { if (!(*sect)->hasSectionData()) continue; // skip LDSection* out_sect = NULL; if (NULL == (out_sect = builder.MergeSection(**sect))) { error(diag::err_cannot_merge_section) << (*sect)->name() << (*obj)->name(); return false; } if (!m_LDBackend.updateSectionFlags(*out_sect, **sect)) { error(diag::err_cannot_merge_section) << (*sect)->name() << (*obj)->name(); return false; } break; } } // end of switch } // for each section } // for each obj return true; } /// addStandardSymbols - shared object and executable files need some /// standard symbols /// @return if there are some input symbols with the same name to the /// standard symbols, return false bool ObjectLinker::addStandardSymbols() { // create and add section symbols for each output section Module::iterator iter, iterEnd = m_pModule->end(); for (iter = m_pModule->begin(); iter != iterEnd; ++iter) { m_pModule->getSectionSymbolSet().add(**iter, m_pModule->getNamePool()); } return m_LDBackend.initStandardSymbols(*m_pBuilder, *m_pModule); } /// addTargetSymbols - some targets, such as MIPS and ARM, need some /// target-dependent symbols /// @return if there are some input symbols with the same name to the /// target symbols, return false bool ObjectLinker::addTargetSymbols() { m_LDBackend.initTargetSymbols(*m_pBuilder, *m_pModule); return true; } /// addScriptSymbols - define symbols from the command line option or linker /// scripts. bool ObjectLinker::addScriptSymbols() { const LinkerScript& script = m_pModule->getScript(); LinkerScript::DefSymMap::const_entry_iterator it; LinkerScript::DefSymMap::const_entry_iterator ie = script.defSymMap().end(); // go through the entire defSymMap for (it = script.defSymMap().begin(); it != ie; ++it) { const llvm::StringRef sym = it.getEntry()->key(); ResolveInfo* old_info = m_pModule->getNamePool().findInfo(sym); // if the symbol does not exist, we can set type to NOTYPE // else we retain its type, same goes for size - 0 or retain old value // and visibility - Default or retain if (old_info != NULL) { if(!m_pBuilder->AddSymbol<IRBuilder::Force, IRBuilder::Unresolve>( sym, static_cast<ResolveInfo::Type>(old_info->type()), ResolveInfo::Define, ResolveInfo::Absolute, old_info->size(), 0x0, FragmentRef::Null(), old_info->visibility())) return false; } else { if (!m_pBuilder->AddSymbol<IRBuilder::Force, IRBuilder::Unresolve>( sym, ResolveInfo::NoType, ResolveInfo::Define, ResolveInfo::Absolute, 0x0, 0x0, FragmentRef::Null(), ResolveInfo::Default)) return false; } } return true; } bool ObjectLinker::scanRelocations() { // apply all relocations of all inputs Module::obj_iterator input, inEnd = m_pModule->obj_end(); for (input = m_pModule->obj_begin(); input != inEnd; ++input) { m_LDBackend.getRelocator()->initializeScan(**input); LDContext::sect_iterator rs, rsEnd = (*input)->context()->relocSectEnd(); for (rs = (*input)->context()->relocSectBegin(); rs != rsEnd; ++rs) { // bypass the reloc section if // 1. its section kind is changed to Ignore. (The target section is a // discarded group section.) // 2. it has no reloc data. (All symbols in the input relocs are in the // discarded group sections) if (LDFileFormat::Ignore == (*rs)->kind() || !(*rs)->hasRelocData()) continue; RelocData::iterator reloc, rEnd = (*rs)->getRelocData()->end(); for (reloc = (*rs)->getRelocData()->begin(); reloc != rEnd; ++reloc) { Relocation* relocation = llvm::cast<Relocation>(reloc); // scan relocation if (LinkerConfig::Object != m_Config.codeGenType()) m_LDBackend.getRelocator()->scanRelocation( *relocation, *m_pBuilder, *m_pModule, **rs); else m_LDBackend.getRelocator()->partialScanRelocation( *relocation, *m_pModule, **rs); } // for all relocations } // for all relocation section m_LDBackend.getRelocator()->finalizeScan(**input); } // for all inputs return true; } /// initStubs - initialize stub-related stuff. bool ObjectLinker::initStubs() { // initialize BranchIslandFactory m_LDBackend.initBRIslandFactory(); // initialize StubFactory m_LDBackend.initStubFactory(); // initialize target stubs m_LDBackend.initTargetStubs(); return true; } /// allocateCommonSymobols - allocate fragments for common symbols to the /// corresponding sections bool ObjectLinker::allocateCommonSymbols() { if (LinkerConfig::Object != m_Config.codeGenType() || m_Config.options().isDefineCommon()) return m_LDBackend.allocateCommonSymbols(*m_pModule); return true; } /// prelayout - help backend to do some modification before layout bool ObjectLinker::prelayout() { // finalize the section symbols, set their fragment reference and push them // into output symbol table Module::iterator sect, sEnd = m_pModule->end(); for (sect = m_pModule->begin(); sect != sEnd; ++sect) { m_pModule->getSectionSymbolSet().finalize(**sect, m_pModule->getSymbolTable(), m_Config.codeGenType() == LinkerConfig::Object); } m_LDBackend.preLayout(*m_pModule, *m_pBuilder); /// check program interpreter - computer the name size of the runtime dyld if (!m_Config.isCodeStatic() && (LinkerConfig::Exec == m_Config.codeGenType() || m_Config.options().isPIE() || m_Config.options().hasDyld())) m_LDBackend.sizeInterp(); /// measure NamePools - compute the size of name pool sections /// In ELF, will compute the size of.symtab, .strtab, .dynsym, .dynstr, /// .hash and .shstrtab sections. /// /// dump all symbols and strings from FragmentLinker and build the format-dependent /// hash table. /// @note sizeNamePools replies on LinkerConfig::CodePosition. Must determine /// code position model before calling GNULDBackend::sizeNamePools() m_LDBackend.sizeNamePools(*m_pModule); return true; } /// layout - linearly layout all output sections and reserve some space /// for GOT/PLT /// Because we do not support instruction relaxing in this early version, /// if there is a branch can not jump to its target, we return false /// directly bool ObjectLinker::layout() { m_LDBackend.layout(*m_pModule); return true; } /// prelayout - help backend to do some modification after layout bool ObjectLinker::postlayout() { m_LDBackend.postLayout(*m_pModule, *m_pBuilder); return true; } /// finalizeSymbolValue - finalize the resolved symbol value. /// Before relocate(), after layout(), FragmentLinker should correct value of all /// symbol. bool ObjectLinker::finalizeSymbolValue() { bool finalized = m_pLinker->finalizeSymbols() && m_LDBackend.finalizeSymbols(); bool scriptSymsAdded = true; uint64_t symVal; const LinkerScript& script = m_pModule->getScript(); LinkerScript::DefSymMap::const_entry_iterator it; LinkerScript::DefSymMap::const_entry_iterator ie = script.defSymMap().end(); DefSymParser parser(*m_pModule); for (it = script.defSymMap().begin(); it != ie; ++it) { llvm::StringRef symName = it.getEntry()->key(); llvm::StringRef expr = it.getEntry()->value(); LDSymbol* symbol = m_pModule->getNamePool().findSymbol(symName); assert(NULL != symbol && "--defsym symbol should be in the name pool"); scriptSymsAdded &= parser.parse(expr, symVal); if (!scriptSymsAdded) break; symbol->setValue(symVal); } return finalized && scriptSymsAdded ; } /// relocate - applying relocation entries and create relocation /// section in the output files /// Create relocation section, asking TargetLDBackend to /// read the relocation information into RelocationEntry /// and push_back into the relocation section bool ObjectLinker::relocation() { return m_pLinker->applyRelocations(); } /// emitOutput - emit the output file. bool ObjectLinker::emitOutput(MemoryArea& pOutput) { return llvm::errc::success == getWriter()->writeObject(*m_pModule, pOutput); } /// postProcessing - do modification after all processes bool ObjectLinker::postProcessing(MemoryArea& pOutput) { m_pLinker->syncRelocationResult(pOutput); // emit .eh_frame_hdr // eh_frame_hdr should be emitted after syncRelocation, because eh_frame_hdr // needs FDE PC value, which will be corrected at syncRelocation m_LDBackend.postProcessing(pOutput); return true; }