//===- yaml2obj - Convert YAML to a binary object file --------------------===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // This program takes a YAML description of an object file and outputs the // binary equivalent. // // This is used for writing tests that require binary files. // //===----------------------------------------------------------------------===// #include "llvm/ADT/SmallString.h" #include "llvm/ADT/StringExtras.h" #include "llvm/ADT/StringMap.h" #include "llvm/ADT/StringSwitch.h" #include "llvm/Support/COFF.h" #include "llvm/Support/Casting.h" #include "llvm/Support/CommandLine.h" #include "llvm/Support/Endian.h" #include "llvm/Support/ManagedStatic.h" #include "llvm/Support/MemoryBuffer.h" #include "llvm/Support/PrettyStackTrace.h" #include "llvm/Support/Signals.h" #include "llvm/Support/SourceMgr.h" #include "llvm/Support/YAMLParser.h" #include "llvm/Support/raw_ostream.h" #include "llvm/Support/system_error.h" #include <vector> using namespace llvm; static cl::opt<std::string> Input(cl::Positional, cl::desc("<input>"), cl::init("-")); template<class T> typename llvm::enable_if_c<std::numeric_limits<T>::is_integer, bool>::type getAs(const llvm::yaml::ScalarNode *SN, T &Result) { SmallString<4> Storage; StringRef Value = SN->getValue(Storage); if (Value.getAsInteger(0, Result)) return false; return true; } // Given a container with begin and end with ::value_type of a character type. // Iterate through pairs of characters in the the set of [a-fA-F0-9] ignoring // all other characters. struct hex_pair_iterator { StringRef::const_iterator Current, End; typedef SmallVector<char, 2> value_type; value_type Pair; bool IsDone; hex_pair_iterator(StringRef C) : Current(C.begin()), End(C.end()), IsDone(false) { // Initalize Pair. ++*this; } // End iterator. hex_pair_iterator() : Current(), End(), IsDone(true) {} value_type operator *() const { return Pair; } hex_pair_iterator operator ++() { // We're at the end of the input. if (Current == End) { IsDone = true; return *this; } Pair = value_type(); for (; Current != End && Pair.size() != 2; ++Current) { // Is a valid hex digit. if ((*Current >= '0' && *Current <= '9') || (*Current >= 'a' && *Current <= 'f') || (*Current >= 'A' && *Current <= 'F')) Pair.push_back(*Current); } // Hit the end without getting 2 hex digits. Pair is invalid. if (Pair.size() != 2) IsDone = true; return *this; } bool operator ==(const hex_pair_iterator Other) { return (IsDone == Other.IsDone) || (Current == Other.Current && End == Other.End); } bool operator !=(const hex_pair_iterator Other) { return !(*this == Other); } }; template <class ContainerOut> static bool hexStringToByteArray(StringRef Str, ContainerOut &Out) { for (hex_pair_iterator I(Str), E; I != E; ++I) { typename hex_pair_iterator::value_type Pair = *I; typename ContainerOut::value_type Byte; if (StringRef(Pair.data(), 2).getAsInteger(16, Byte)) return false; Out.push_back(Byte); } return true; } /// This parses a yaml stream that represents a COFF object file. /// See docs/yaml2obj for the yaml scheema. struct COFFParser { COFFParser(yaml::Stream &Input) : YS(Input) { std::memset(&Header, 0, sizeof(Header)); // A COFF string table always starts with a 4 byte size field. Offsets into // it include this size, so allocate it now. StringTable.append(4, 0); } bool parseHeader(yaml::Node *HeaderN) { yaml::MappingNode *MN = dyn_cast<yaml::MappingNode>(HeaderN); if (!MN) { YS.printError(HeaderN, "header's value must be a mapping node"); return false; } for (yaml::MappingNode::iterator i = MN->begin(), e = MN->end(); i != e; ++i) { yaml::ScalarNode *Key = dyn_cast<yaml::ScalarNode>(i->getKey()); if (!Key) { YS.printError(i->getKey(), "Keys must be scalar values"); return false; } SmallString<32> Storage; StringRef KeyValue = Key->getValue(Storage); if (KeyValue == "Characteristics") { if (!parseHeaderCharacteristics(i->getValue())) return false; } else { yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(i->getValue()); if (!Value) { YS.printError(Value, Twine(KeyValue) + " must be a scalar value"); return false; } if (KeyValue == "Machine") { uint16_t Machine = COFF::MT_Invalid; if (!getAs(Value, Machine)) { // It's not a raw number, try matching the string. StringRef ValueValue = Value->getValue(Storage); Machine = StringSwitch<COFF::MachineTypes>(ValueValue) .Case( "IMAGE_FILE_MACHINE_UNKNOWN" , COFF::IMAGE_FILE_MACHINE_UNKNOWN) .Case( "IMAGE_FILE_MACHINE_AM33" , COFF::IMAGE_FILE_MACHINE_AM33) .Case( "IMAGE_FILE_MACHINE_AMD64" , COFF::IMAGE_FILE_MACHINE_AMD64) .Case( "IMAGE_FILE_MACHINE_ARM" , COFF::IMAGE_FILE_MACHINE_ARM) .Case( "IMAGE_FILE_MACHINE_ARMV7" , COFF::IMAGE_FILE_MACHINE_ARMV7) .Case( "IMAGE_FILE_MACHINE_EBC" , COFF::IMAGE_FILE_MACHINE_EBC) .Case( "IMAGE_FILE_MACHINE_I386" , COFF::IMAGE_FILE_MACHINE_I386) .Case( "IMAGE_FILE_MACHINE_IA64" , COFF::IMAGE_FILE_MACHINE_IA64) .Case( "IMAGE_FILE_MACHINE_M32R" , COFF::IMAGE_FILE_MACHINE_M32R) .Case( "IMAGE_FILE_MACHINE_MIPS16" , COFF::IMAGE_FILE_MACHINE_MIPS16) .Case( "IMAGE_FILE_MACHINE_MIPSFPU" , COFF::IMAGE_FILE_MACHINE_MIPSFPU) .Case( "IMAGE_FILE_MACHINE_MIPSFPU16" , COFF::IMAGE_FILE_MACHINE_MIPSFPU16) .Case( "IMAGE_FILE_MACHINE_POWERPC" , COFF::IMAGE_FILE_MACHINE_POWERPC) .Case( "IMAGE_FILE_MACHINE_POWERPCFP" , COFF::IMAGE_FILE_MACHINE_POWERPCFP) .Case( "IMAGE_FILE_MACHINE_R4000" , COFF::IMAGE_FILE_MACHINE_R4000) .Case( "IMAGE_FILE_MACHINE_SH3" , COFF::IMAGE_FILE_MACHINE_SH3) .Case( "IMAGE_FILE_MACHINE_SH3DSP" , COFF::IMAGE_FILE_MACHINE_SH3DSP) .Case( "IMAGE_FILE_MACHINE_SH4" , COFF::IMAGE_FILE_MACHINE_SH4) .Case( "IMAGE_FILE_MACHINE_SH5" , COFF::IMAGE_FILE_MACHINE_SH5) .Case( "IMAGE_FILE_MACHINE_THUMB" , COFF::IMAGE_FILE_MACHINE_THUMB) .Case( "IMAGE_FILE_MACHINE_WCEMIPSV2" , COFF::IMAGE_FILE_MACHINE_WCEMIPSV2) .Default(COFF::MT_Invalid); if (Machine == COFF::MT_Invalid) { YS.printError(Value, "Invalid value for Machine"); return false; } } Header.Machine = Machine; } else if (KeyValue == "NumberOfSections") { if (!getAs(Value, Header.NumberOfSections)) { YS.printError(Value, "Invalid value for NumberOfSections"); return false; } } else if (KeyValue == "TimeDateStamp") { if (!getAs(Value, Header.TimeDateStamp)) { YS.printError(Value, "Invalid value for TimeDateStamp"); return false; } } else if (KeyValue == "PointerToSymbolTable") { if (!getAs(Value, Header.PointerToSymbolTable)) { YS.printError(Value, "Invalid value for PointerToSymbolTable"); return false; } } else if (KeyValue == "NumberOfSymbols") { if (!getAs(Value, Header.NumberOfSymbols)) { YS.printError(Value, "Invalid value for NumberOfSymbols"); return false; } } else if (KeyValue == "SizeOfOptionalHeader") { if (!getAs(Value, Header.SizeOfOptionalHeader)) { YS.printError(Value, "Invalid value for SizeOfOptionalHeader"); return false; } } else { YS.printError(Key, "Unrecognized key in header"); return false; } } } return true; } bool parseHeaderCharacteristics(yaml::Node *Characteristics) { yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(Characteristics); yaml::SequenceNode *SeqValue = dyn_cast<yaml::SequenceNode>(Characteristics); if (!Value && !SeqValue) { YS.printError(Characteristics, "Characteristics must either be a number or sequence"); return false; } if (Value) { if (!getAs(Value, Header.Characteristics)) { YS.printError(Value, "Invalid value for Characteristics"); return false; } } else { for (yaml::SequenceNode::iterator ci = SeqValue->begin(), ce = SeqValue->end(); ci != ce; ++ci) { yaml::ScalarNode *CharValue = dyn_cast<yaml::ScalarNode>(&*ci); if (!CharValue) { YS.printError(CharValue, "Characteristics must be scalar values"); return false; } SmallString<32> Storage; StringRef Char = CharValue->getValue(Storage); uint16_t Characteristic = StringSwitch<COFF::Characteristics>(Char) .Case( "IMAGE_FILE_RELOCS_STRIPPED" , COFF::IMAGE_FILE_RELOCS_STRIPPED) .Case( "IMAGE_FILE_EXECUTABLE_IMAGE" , COFF::IMAGE_FILE_EXECUTABLE_IMAGE) .Case( "IMAGE_FILE_LINE_NUMS_STRIPPED" , COFF::IMAGE_FILE_LINE_NUMS_STRIPPED) .Case( "IMAGE_FILE_LOCAL_SYMS_STRIPPED" , COFF::IMAGE_FILE_LOCAL_SYMS_STRIPPED) .Case( "IMAGE_FILE_AGGRESSIVE_WS_TRIM" , COFF::IMAGE_FILE_AGGRESSIVE_WS_TRIM) .Case( "IMAGE_FILE_LARGE_ADDRESS_AWARE" , COFF::IMAGE_FILE_LARGE_ADDRESS_AWARE) .Case( "IMAGE_FILE_BYTES_REVERSED_LO" , COFF::IMAGE_FILE_BYTES_REVERSED_LO) .Case( "IMAGE_FILE_32BIT_MACHINE" , COFF::IMAGE_FILE_32BIT_MACHINE) .Case( "IMAGE_FILE_DEBUG_STRIPPED" , COFF::IMAGE_FILE_DEBUG_STRIPPED) .Case( "IMAGE_FILE_REMOVABLE_RUN_FROM_SWAP" , COFF::IMAGE_FILE_REMOVABLE_RUN_FROM_SWAP) .Case( "IMAGE_FILE_SYSTEM" , COFF::IMAGE_FILE_SYSTEM) .Case( "IMAGE_FILE_DLL" , COFF::IMAGE_FILE_DLL) .Case( "IMAGE_FILE_UP_SYSTEM_ONLY" , COFF::IMAGE_FILE_UP_SYSTEM_ONLY) .Default(COFF::C_Invalid); if (Characteristic == COFF::C_Invalid) { // TODO: Typo-correct. YS.printError(CharValue, "Invalid value for Characteristic"); return false; } Header.Characteristics |= Characteristic; } } return true; } bool parseSections(yaml::Node *SectionsN) { yaml::SequenceNode *SN = dyn_cast<yaml::SequenceNode>(SectionsN); if (!SN) { YS.printError(SectionsN, "Sections must be a sequence"); return false; } for (yaml::SequenceNode::iterator i = SN->begin(), e = SN->end(); i != e; ++i) { Section Sec; std::memset(&Sec.Header, 0, sizeof(Sec.Header)); yaml::MappingNode *SecMap = dyn_cast<yaml::MappingNode>(&*i); if (!SecMap) { YS.printError(&*i, "Section entry must be a map"); return false; } for (yaml::MappingNode::iterator si = SecMap->begin(), se = SecMap->end(); si != se; ++si) { yaml::ScalarNode *Key = dyn_cast<yaml::ScalarNode>(si->getKey()); if (!Key) { YS.printError(si->getKey(), "Keys must be scalar values"); return false; } SmallString<32> Storage; StringRef KeyValue = Key->getValue(Storage); yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(si->getValue()); if (KeyValue == "Name") { // If the name is less than 8 bytes, store it in place, otherwise // store it in the string table. StringRef Name = Value->getValue(Storage); std::fill_n(Sec.Header.Name, unsigned(COFF::NameSize), 0); if (Name.size() <= COFF::NameSize) { std::copy(Name.begin(), Name.end(), Sec.Header.Name); } else { // Add string to the string table and format the index for output. unsigned Index = getStringIndex(Name); std::string str = utostr(Index); if (str.size() > 7) { YS.printError(Value, "String table got too large"); return false; } Sec.Header.Name[0] = '/'; std::copy(str.begin(), str.end(), Sec.Header.Name + 1); } } else if (KeyValue == "VirtualSize") { if (!getAs(Value, Sec.Header.VirtualSize)) { YS.printError(Value, "Invalid value for VirtualSize"); return false; } } else if (KeyValue == "VirtualAddress") { if (!getAs(Value, Sec.Header.VirtualAddress)) { YS.printError(Value, "Invalid value for VirtualAddress"); return false; } } else if (KeyValue == "SizeOfRawData") { if (!getAs(Value, Sec.Header.SizeOfRawData)) { YS.printError(Value, "Invalid value for SizeOfRawData"); return false; } } else if (KeyValue == "PointerToRawData") { if (!getAs(Value, Sec.Header.PointerToRawData)) { YS.printError(Value, "Invalid value for PointerToRawData"); return false; } } else if (KeyValue == "PointerToRelocations") { if (!getAs(Value, Sec.Header.PointerToRelocations)) { YS.printError(Value, "Invalid value for PointerToRelocations"); return false; } } else if (KeyValue == "PointerToLineNumbers") { if (!getAs(Value, Sec.Header.PointerToLineNumbers)) { YS.printError(Value, "Invalid value for PointerToLineNumbers"); return false; } } else if (KeyValue == "NumberOfRelocations") { if (!getAs(Value, Sec.Header.NumberOfRelocations)) { YS.printError(Value, "Invalid value for NumberOfRelocations"); return false; } } else if (KeyValue == "NumberOfLineNumbers") { if (!getAs(Value, Sec.Header.NumberOfLineNumbers)) { YS.printError(Value, "Invalid value for NumberOfLineNumbers"); return false; } } else if (KeyValue == "Characteristics") { yaml::SequenceNode *SeqValue = dyn_cast<yaml::SequenceNode>(si->getValue()); if (!Value && !SeqValue) { YS.printError(si->getValue(), "Characteristics must either be a number or sequence"); return false; } if (Value) { if (!getAs(Value, Sec.Header.Characteristics)) { YS.printError(Value, "Invalid value for Characteristics"); return false; } } else { for (yaml::SequenceNode::iterator ci = SeqValue->begin(), ce = SeqValue->end(); ci != ce; ++ci) { yaml::ScalarNode *CharValue = dyn_cast<yaml::ScalarNode>(&*ci); if (!CharValue) { YS.printError(CharValue, "Invalid value for Characteristics"); return false; } StringRef Char = CharValue->getValue(Storage); uint32_t Characteristic = StringSwitch<COFF::SectionCharacteristics>(Char) .Case( "IMAGE_SCN_TYPE_NO_PAD" , COFF::IMAGE_SCN_TYPE_NO_PAD) .Case( "IMAGE_SCN_CNT_CODE" , COFF::IMAGE_SCN_CNT_CODE) .Case( "IMAGE_SCN_CNT_INITIALIZED_DATA" , COFF::IMAGE_SCN_CNT_INITIALIZED_DATA) .Case( "IMAGE_SCN_CNT_UNINITIALIZED_DATA" , COFF::IMAGE_SCN_CNT_UNINITIALIZED_DATA) .Case( "IMAGE_SCN_LNK_OTHER" , COFF::IMAGE_SCN_LNK_OTHER) .Case( "IMAGE_SCN_LNK_INFO" , COFF::IMAGE_SCN_LNK_INFO) .Case( "IMAGE_SCN_LNK_REMOVE" , COFF::IMAGE_SCN_LNK_REMOVE) .Case( "IMAGE_SCN_LNK_COMDAT" , COFF::IMAGE_SCN_LNK_COMDAT) .Case( "IMAGE_SCN_GPREL" , COFF::IMAGE_SCN_GPREL) .Case( "IMAGE_SCN_MEM_PURGEABLE" , COFF::IMAGE_SCN_MEM_PURGEABLE) .Case( "IMAGE_SCN_MEM_16BIT" , COFF::IMAGE_SCN_MEM_16BIT) .Case( "IMAGE_SCN_MEM_LOCKED" , COFF::IMAGE_SCN_MEM_LOCKED) .Case( "IMAGE_SCN_MEM_PRELOAD" , COFF::IMAGE_SCN_MEM_PRELOAD) .Case( "IMAGE_SCN_ALIGN_1BYTES" , COFF::IMAGE_SCN_ALIGN_1BYTES) .Case( "IMAGE_SCN_ALIGN_2BYTES" , COFF::IMAGE_SCN_ALIGN_2BYTES) .Case( "IMAGE_SCN_ALIGN_4BYTES" , COFF::IMAGE_SCN_ALIGN_4BYTES) .Case( "IMAGE_SCN_ALIGN_8BYTES" , COFF::IMAGE_SCN_ALIGN_8BYTES) .Case( "IMAGE_SCN_ALIGN_16BYTES" , COFF::IMAGE_SCN_ALIGN_16BYTES) .Case( "IMAGE_SCN_ALIGN_32BYTES" , COFF::IMAGE_SCN_ALIGN_32BYTES) .Case( "IMAGE_SCN_ALIGN_64BYTES" , COFF::IMAGE_SCN_ALIGN_64BYTES) .Case( "IMAGE_SCN_ALIGN_128BYTES" , COFF::IMAGE_SCN_ALIGN_128BYTES) .Case( "IMAGE_SCN_ALIGN_256BYTES" , COFF::IMAGE_SCN_ALIGN_256BYTES) .Case( "IMAGE_SCN_ALIGN_512BYTES" , COFF::IMAGE_SCN_ALIGN_512BYTES) .Case( "IMAGE_SCN_ALIGN_1024BYTES" , COFF::IMAGE_SCN_ALIGN_1024BYTES) .Case( "IMAGE_SCN_ALIGN_2048BYTES" , COFF::IMAGE_SCN_ALIGN_2048BYTES) .Case( "IMAGE_SCN_ALIGN_4096BYTES" , COFF::IMAGE_SCN_ALIGN_4096BYTES) .Case( "IMAGE_SCN_ALIGN_8192BYTES" , COFF::IMAGE_SCN_ALIGN_8192BYTES) .Case( "IMAGE_SCN_LNK_NRELOC_OVFL" , COFF::IMAGE_SCN_LNK_NRELOC_OVFL) .Case( "IMAGE_SCN_MEM_DISCARDABLE" , COFF::IMAGE_SCN_MEM_DISCARDABLE) .Case( "IMAGE_SCN_MEM_NOT_CACHED" , COFF::IMAGE_SCN_MEM_NOT_CACHED) .Case( "IMAGE_SCN_MEM_NOT_PAGED" , COFF::IMAGE_SCN_MEM_NOT_PAGED) .Case( "IMAGE_SCN_MEM_SHARED" , COFF::IMAGE_SCN_MEM_SHARED) .Case( "IMAGE_SCN_MEM_EXECUTE" , COFF::IMAGE_SCN_MEM_EXECUTE) .Case( "IMAGE_SCN_MEM_READ" , COFF::IMAGE_SCN_MEM_READ) .Case( "IMAGE_SCN_MEM_WRITE" , COFF::IMAGE_SCN_MEM_WRITE) .Default(COFF::SC_Invalid); if (Characteristic == COFF::SC_Invalid) { YS.printError(CharValue, "Invalid value for Characteristic"); return false; } Sec.Header.Characteristics |= Characteristic; } } } else if (KeyValue == "SectionData") { yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(si->getValue()); SmallString<32> Storage; StringRef Data = Value->getValue(Storage); if (!hexStringToByteArray(Data, Sec.Data)) { YS.printError(Value, "SectionData must be a collection of pairs of" "hex bytes"); return false; } } else si->skip(); } Sections.push_back(Sec); } return true; } bool parseSymbols(yaml::Node *SymbolsN) { yaml::SequenceNode *SN = dyn_cast<yaml::SequenceNode>(SymbolsN); if (!SN) { YS.printError(SymbolsN, "Symbols must be a sequence"); return false; } for (yaml::SequenceNode::iterator i = SN->begin(), e = SN->end(); i != e; ++i) { Symbol Sym; std::memset(&Sym.Header, 0, sizeof(Sym.Header)); yaml::MappingNode *SymMap = dyn_cast<yaml::MappingNode>(&*i); if (!SymMap) { YS.printError(&*i, "Symbol must be a map"); return false; } for (yaml::MappingNode::iterator si = SymMap->begin(), se = SymMap->end(); si != se; ++si) { yaml::ScalarNode *Key = dyn_cast<yaml::ScalarNode>(si->getKey()); if (!Key) { YS.printError(si->getKey(), "Keys must be scalar values"); return false; } SmallString<32> Storage; StringRef KeyValue = Key->getValue(Storage); yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(si->getValue()); if (!Value) { YS.printError(si->getValue(), "Must be a scalar value"); return false; } if (KeyValue == "Name") { // If the name is less than 8 bytes, store it in place, otherwise // store it in the string table. StringRef Name = Value->getValue(Storage); std::fill_n(Sym.Header.Name, unsigned(COFF::NameSize), 0); if (Name.size() <= COFF::NameSize) { std::copy(Name.begin(), Name.end(), Sym.Header.Name); } else { // Add string to the string table and format the index for output. unsigned Index = getStringIndex(Name); *reinterpret_cast<support::aligned_ulittle32_t*>( Sym.Header.Name + 4) = Index; } } else if (KeyValue == "Value") { if (!getAs(Value, Sym.Header.Value)) { YS.printError(Value, "Invalid value for Value"); return false; } } else if (KeyValue == "SimpleType") { Sym.Header.Type |= StringSwitch<COFF::SymbolBaseType>( Value->getValue(Storage)) .Case("IMAGE_SYM_TYPE_NULL", COFF::IMAGE_SYM_TYPE_NULL) .Case("IMAGE_SYM_TYPE_VOID", COFF::IMAGE_SYM_TYPE_VOID) .Case("IMAGE_SYM_TYPE_CHAR", COFF::IMAGE_SYM_TYPE_CHAR) .Case("IMAGE_SYM_TYPE_SHORT", COFF::IMAGE_SYM_TYPE_SHORT) .Case("IMAGE_SYM_TYPE_INT", COFF::IMAGE_SYM_TYPE_INT) .Case("IMAGE_SYM_TYPE_LONG", COFF::IMAGE_SYM_TYPE_LONG) .Case("IMAGE_SYM_TYPE_FLOAT", COFF::IMAGE_SYM_TYPE_FLOAT) .Case("IMAGE_SYM_TYPE_DOUBLE", COFF::IMAGE_SYM_TYPE_DOUBLE) .Case("IMAGE_SYM_TYPE_STRUCT", COFF::IMAGE_SYM_TYPE_STRUCT) .Case("IMAGE_SYM_TYPE_UNION", COFF::IMAGE_SYM_TYPE_UNION) .Case("IMAGE_SYM_TYPE_ENUM", COFF::IMAGE_SYM_TYPE_ENUM) .Case("IMAGE_SYM_TYPE_MOE", COFF::IMAGE_SYM_TYPE_MOE) .Case("IMAGE_SYM_TYPE_BYTE", COFF::IMAGE_SYM_TYPE_BYTE) .Case("IMAGE_SYM_TYPE_WORD", COFF::IMAGE_SYM_TYPE_WORD) .Case("IMAGE_SYM_TYPE_UINT", COFF::IMAGE_SYM_TYPE_UINT) .Case("IMAGE_SYM_TYPE_DWORD", COFF::IMAGE_SYM_TYPE_DWORD) .Default(COFF::IMAGE_SYM_TYPE_NULL); } else if (KeyValue == "ComplexType") { Sym.Header.Type |= StringSwitch<COFF::SymbolComplexType>( Value->getValue(Storage)) .Case("IMAGE_SYM_DTYPE_NULL", COFF::IMAGE_SYM_DTYPE_NULL) .Case("IMAGE_SYM_DTYPE_POINTER", COFF::IMAGE_SYM_DTYPE_POINTER) .Case("IMAGE_SYM_DTYPE_FUNCTION", COFF::IMAGE_SYM_DTYPE_FUNCTION) .Case("IMAGE_SYM_DTYPE_ARRAY", COFF::IMAGE_SYM_DTYPE_ARRAY) .Default(COFF::IMAGE_SYM_DTYPE_NULL) << COFF::SCT_COMPLEX_TYPE_SHIFT; } else if (KeyValue == "StorageClass") { Sym.Header.StorageClass = StringSwitch<COFF::SymbolStorageClass>( Value->getValue(Storage)) .Case( "IMAGE_SYM_CLASS_END_OF_FUNCTION" , COFF::IMAGE_SYM_CLASS_END_OF_FUNCTION) .Case( "IMAGE_SYM_CLASS_NULL" , COFF::IMAGE_SYM_CLASS_NULL) .Case( "IMAGE_SYM_CLASS_AUTOMATIC" , COFF::IMAGE_SYM_CLASS_AUTOMATIC) .Case( "IMAGE_SYM_CLASS_EXTERNAL" , COFF::IMAGE_SYM_CLASS_EXTERNAL) .Case( "IMAGE_SYM_CLASS_STATIC" , COFF::IMAGE_SYM_CLASS_STATIC) .Case( "IMAGE_SYM_CLASS_REGISTER" , COFF::IMAGE_SYM_CLASS_REGISTER) .Case( "IMAGE_SYM_CLASS_EXTERNAL_DEF" , COFF::IMAGE_SYM_CLASS_EXTERNAL_DEF) .Case( "IMAGE_SYM_CLASS_LABEL" , COFF::IMAGE_SYM_CLASS_LABEL) .Case( "IMAGE_SYM_CLASS_UNDEFINED_LABEL" , COFF::IMAGE_SYM_CLASS_UNDEFINED_LABEL) .Case( "IMAGE_SYM_CLASS_MEMBER_OF_STRUCT" , COFF::IMAGE_SYM_CLASS_MEMBER_OF_STRUCT) .Case( "IMAGE_SYM_CLASS_ARGUMENT" , COFF::IMAGE_SYM_CLASS_ARGUMENT) .Case( "IMAGE_SYM_CLASS_STRUCT_TAG" , COFF::IMAGE_SYM_CLASS_STRUCT_TAG) .Case( "IMAGE_SYM_CLASS_MEMBER_OF_UNION" , COFF::IMAGE_SYM_CLASS_MEMBER_OF_UNION) .Case( "IMAGE_SYM_CLASS_UNION_TAG" , COFF::IMAGE_SYM_CLASS_UNION_TAG) .Case( "IMAGE_SYM_CLASS_TYPE_DEFINITION" , COFF::IMAGE_SYM_CLASS_TYPE_DEFINITION) .Case( "IMAGE_SYM_CLASS_UNDEFINED_STATIC" , COFF::IMAGE_SYM_CLASS_UNDEFINED_STATIC) .Case( "IMAGE_SYM_CLASS_ENUM_TAG" , COFF::IMAGE_SYM_CLASS_ENUM_TAG) .Case( "IMAGE_SYM_CLASS_MEMBER_OF_ENUM" , COFF::IMAGE_SYM_CLASS_MEMBER_OF_ENUM) .Case( "IMAGE_SYM_CLASS_REGISTER_PARAM" , COFF::IMAGE_SYM_CLASS_REGISTER_PARAM) .Case( "IMAGE_SYM_CLASS_BIT_FIELD" , COFF::IMAGE_SYM_CLASS_BIT_FIELD) .Case( "IMAGE_SYM_CLASS_BLOCK" , COFF::IMAGE_SYM_CLASS_BLOCK) .Case( "IMAGE_SYM_CLASS_FUNCTION" , COFF::IMAGE_SYM_CLASS_FUNCTION) .Case( "IMAGE_SYM_CLASS_END_OF_STRUCT" , COFF::IMAGE_SYM_CLASS_END_OF_STRUCT) .Case( "IMAGE_SYM_CLASS_FILE" , COFF::IMAGE_SYM_CLASS_FILE) .Case( "IMAGE_SYM_CLASS_SECTION" , COFF::IMAGE_SYM_CLASS_SECTION) .Case( "IMAGE_SYM_CLASS_WEAK_EXTERNAL" , COFF::IMAGE_SYM_CLASS_WEAK_EXTERNAL) .Case( "IMAGE_SYM_CLASS_CLR_TOKEN" , COFF::IMAGE_SYM_CLASS_CLR_TOKEN) .Default(COFF::SSC_Invalid); if (Sym.Header.StorageClass == COFF::SSC_Invalid) { YS.printError(Value, "Invalid value for StorageClass"); return false; } } else if (KeyValue == "SectionNumber") { if (!getAs(Value, Sym.Header.SectionNumber)) { YS.printError(Value, "Invalid value for SectionNumber"); return false; } } else if (KeyValue == "AuxillaryData") { StringRef Data = Value->getValue(Storage); if (!hexStringToByteArray(Data, Sym.AuxSymbols)) { YS.printError(Value, "AuxillaryData must be a collection of pairs" "of hex bytes"); return false; } } else si->skip(); } Symbols.push_back(Sym); } return true; } bool parse() { yaml::Document &D = *YS.begin(); yaml::MappingNode *Root = dyn_cast<yaml::MappingNode>(D.getRoot()); if (!Root) { YS.printError(D.getRoot(), "Root node must be a map"); return false; } for (yaml::MappingNode::iterator i = Root->begin(), e = Root->end(); i != e; ++i) { yaml::ScalarNode *Key = dyn_cast<yaml::ScalarNode>(i->getKey()); if (!Key) { YS.printError(i->getKey(), "Keys must be scalar values"); return false; } SmallString<32> Storage; StringRef KeyValue = Key->getValue(Storage); if (KeyValue == "header") { if (!parseHeader(i->getValue())) return false; } else if (KeyValue == "sections") { if (!parseSections(i->getValue())) return false; } else if (KeyValue == "symbols") { if (!parseSymbols(i->getValue())) return false; } } return !YS.failed(); } unsigned getStringIndex(StringRef Str) { StringMap<unsigned>::iterator i = StringTableMap.find(Str); if (i == StringTableMap.end()) { unsigned Index = StringTable.size(); StringTable.append(Str.begin(), Str.end()); StringTable.push_back(0); StringTableMap[Str] = Index; return Index; } return i->second; } yaml::Stream &YS; COFF::header Header; struct Section { COFF::section Header; std::vector<uint8_t> Data; std::vector<COFF::relocation> Relocations; }; struct Symbol { COFF::symbol Header; std::vector<uint8_t> AuxSymbols; }; std::vector<Section> Sections; std::vector<Symbol> Symbols; StringMap<unsigned> StringTableMap; std::string StringTable; }; // Take a CP and assign addresses and sizes to everything. Returns false if the // layout is not valid to do. static bool layoutCOFF(COFFParser &CP) { uint32_t SectionTableStart = 0; uint32_t SectionTableSize = 0; // The section table starts immediately after the header, including the // optional header. SectionTableStart = sizeof(COFF::header) + CP.Header.SizeOfOptionalHeader; SectionTableSize = sizeof(COFF::section) * CP.Sections.size(); uint32_t CurrentSectionDataOffset = SectionTableStart + SectionTableSize; // Assign each section data address consecutively. for (std::vector<COFFParser::Section>::iterator i = CP.Sections.begin(), e = CP.Sections.end(); i != e; ++i) { if (!i->Data.empty()) { i->Header.SizeOfRawData = i->Data.size(); i->Header.PointerToRawData = CurrentSectionDataOffset; CurrentSectionDataOffset += i->Header.SizeOfRawData; // TODO: Handle alignment. } else { i->Header.SizeOfRawData = 0; i->Header.PointerToRawData = 0; } } uint32_t SymbolTableStart = CurrentSectionDataOffset; // Calculate number of symbols. uint32_t NumberOfSymbols = 0; for (std::vector<COFFParser::Symbol>::iterator i = CP.Symbols.begin(), e = CP.Symbols.end(); i != e; ++i) { if (i->AuxSymbols.size() % COFF::SymbolSize != 0) { errs() << "AuxillaryData size not a multiple of symbol size!\n"; return false; } i->Header.NumberOfAuxSymbols = i->AuxSymbols.size() / COFF::SymbolSize; NumberOfSymbols += 1 + i->Header.NumberOfAuxSymbols; } // Store all the allocated start addresses in the header. CP.Header.NumberOfSections = CP.Sections.size(); CP.Header.NumberOfSymbols = NumberOfSymbols; CP.Header.PointerToSymbolTable = SymbolTableStart; *reinterpret_cast<support::ulittle32_t *>(&CP.StringTable[0]) = CP.StringTable.size(); return true; } template <typename value_type> struct binary_le_impl { value_type Value; binary_le_impl(value_type V) : Value(V) {} }; template <typename value_type> raw_ostream &operator <<( raw_ostream &OS , const binary_le_impl<value_type> &BLE) { char Buffer[sizeof(BLE.Value)]; support::endian::write<value_type, support::little, support::unaligned>( Buffer, BLE.Value); OS.write(Buffer, sizeof(BLE.Value)); return OS; } template <typename value_type> binary_le_impl<value_type> binary_le(value_type V) { return binary_le_impl<value_type>(V); } void writeCOFF(COFFParser &CP, raw_ostream &OS) { OS << binary_le(CP.Header.Machine) << binary_le(CP.Header.NumberOfSections) << binary_le(CP.Header.TimeDateStamp) << binary_le(CP.Header.PointerToSymbolTable) << binary_le(CP.Header.NumberOfSymbols) << binary_le(CP.Header.SizeOfOptionalHeader) << binary_le(CP.Header.Characteristics); // Output section table. for (std::vector<COFFParser::Section>::const_iterator i = CP.Sections.begin(), e = CP.Sections.end(); i != e; ++i) { OS.write(i->Header.Name, COFF::NameSize); OS << binary_le(i->Header.VirtualSize) << binary_le(i->Header.VirtualAddress) << binary_le(i->Header.SizeOfRawData) << binary_le(i->Header.PointerToRawData) << binary_le(i->Header.PointerToRelocations) << binary_le(i->Header.PointerToLineNumbers) << binary_le(i->Header.NumberOfRelocations) << binary_le(i->Header.NumberOfLineNumbers) << binary_le(i->Header.Characteristics); } // Output section data. for (std::vector<COFFParser::Section>::const_iterator i = CP.Sections.begin(), e = CP.Sections.end(); i != e; ++i) { if (!i->Data.empty()) OS.write(reinterpret_cast<const char*>(&i->Data[0]), i->Data.size()); } // Output symbol table. for (std::vector<COFFParser::Symbol>::const_iterator i = CP.Symbols.begin(), e = CP.Symbols.end(); i != e; ++i) { OS.write(i->Header.Name, COFF::NameSize); OS << binary_le(i->Header.Value) << binary_le(i->Header.SectionNumber) << binary_le(i->Header.Type) << binary_le(i->Header.StorageClass) << binary_le(i->Header.NumberOfAuxSymbols); if (!i->AuxSymbols.empty()) OS.write( reinterpret_cast<const char*>(&i->AuxSymbols[0]) , i->AuxSymbols.size()); } // Output string table. OS.write(&CP.StringTable[0], CP.StringTable.size()); } int main(int argc, char **argv) { cl::ParseCommandLineOptions(argc, argv); sys::PrintStackTraceOnErrorSignal(); PrettyStackTraceProgram X(argc, argv); llvm_shutdown_obj Y; // Call llvm_shutdown() on exit. OwningPtr<MemoryBuffer> Buf; if (MemoryBuffer::getFileOrSTDIN(Input, Buf)) return 1; SourceMgr SM; yaml::Stream S(Buf->getBuffer(), SM); COFFParser CP(S); if (!CP.parse()) { errs() << "yaml2obj: Failed to parse YAML file!\n"; return 1; } if (!layoutCOFF(CP)) { errs() << "yaml2obj: Failed to layout COFF file!\n"; return 1; } writeCOFF(CP, outs()); }