diff options
Diffstat (limited to 'include/llvm/Object')
| -rw-r--r-- | include/llvm/Object/Archive.h | 22 | ||||
| -rw-r--r-- | include/llvm/Object/Binary.h | 66 | ||||
| -rw-r--r-- | include/llvm/Object/COFF.h | 494 | ||||
| -rw-r--r-- | include/llvm/Object/COFFYAML.h | 32 | ||||
| -rw-r--r-- | include/llvm/Object/ELF.h | 2 | ||||
| -rw-r--r-- | include/llvm/Object/ELFObjectFile.h | 288 | ||||
| -rw-r--r-- | include/llvm/Object/ELFTypes.h | 8 | ||||
| -rw-r--r-- | include/llvm/Object/ELFYAML.h | 8 | ||||
| -rw-r--r-- | include/llvm/Object/Error.h | 3 | ||||
| -rw-r--r-- | include/llvm/Object/IRObjectFile.h | 23 | ||||
| -rw-r--r-- | include/llvm/Object/MachO.h | 249 | ||||
| -rw-r--r-- | include/llvm/Object/MachOUniversal.h | 13 | ||||
| -rw-r--r-- | include/llvm/Object/ObjectFile.h | 209 | ||||
| -rw-r--r-- | include/llvm/Object/RelocVisitor.h | 319 | ||||
| -rw-r--r-- | include/llvm/Object/SymbolicFile.h | 22 | 
15 files changed, 1153 insertions, 605 deletions
| diff --git a/include/llvm/Object/Archive.h b/include/llvm/Object/Archive.h index af6c995..7c03dcd 100644 --- a/include/llvm/Object/Archive.h +++ b/include/llvm/Object/Archive.h @@ -14,6 +14,7 @@  #ifndef LLVM_OBJECT_ARCHIVE_H  #define LLVM_OBJECT_ARCHIVE_H +#include "llvm/ADT/iterator_range.h"  #include "llvm/ADT/StringRef.h"  #include "llvm/Object/Binary.h"  #include "llvm/Support/ErrorHandling.h" @@ -89,8 +90,7 @@ public:        return StringRef(Data.data() + StartOfFile, getSize());      } -    ErrorOr<std::unique_ptr<MemoryBuffer>> -    getMemoryBuffer(bool FullPath = false) const; +    ErrorOr<MemoryBufferRef> getMemoryBufferRef() const;      ErrorOr<std::unique_ptr<Binary>>      getAsBinary(LLVMContext *Context = nullptr) const; @@ -98,12 +98,12 @@ public:    class child_iterator {      Child child; +    public:      child_iterator() : child(Child(nullptr, nullptr)) {}      child_iterator(const Child &c) : child(c) {} -    const Child* operator->() const { -      return &child; -    } +    const Child *operator->() const { return &child; } +    const Child &operator*() const { return child; }      bool operator==(const child_iterator &other) const {        return child == other.child; @@ -113,11 +113,11 @@ public:        return !(*this == other);      } -    bool operator <(const child_iterator &other) const { +    bool operator<(const child_iterator &other) const {        return child < other.child;      } -    child_iterator& operator++() {  // Preincrement +    child_iterator &operator++() { // Preincrement        child = child.getNext();        return *this;      } @@ -164,8 +164,8 @@ public:      }    }; -  Archive(std::unique_ptr<MemoryBuffer> Source, std::error_code &EC); -  static ErrorOr<Archive *> create(std::unique_ptr<MemoryBuffer> Source); +  Archive(MemoryBufferRef Source, std::error_code &EC); +  static ErrorOr<std::unique_ptr<Archive>> create(MemoryBufferRef Source);    enum Kind {      K_GNU, @@ -179,6 +179,10 @@ public:    child_iterator child_begin(bool SkipInternal = true) const;    child_iterator child_end() const; +  iterator_range<child_iterator> children(bool SkipInternal = true) const { +    return iterator_range<child_iterator>(child_begin(SkipInternal), +                                          child_end()); +  }    symbol_iterator symbol_begin() const;    symbol_iterator symbol_end() const; diff --git a/include/llvm/Object/Binary.h b/include/llvm/Object/Binary.h index 9be2fbe..4b2b7e6 100644 --- a/include/llvm/Object/Binary.h +++ b/include/llvm/Object/Binary.h @@ -17,11 +17,11 @@  #include "llvm/Object/Error.h"  #include "llvm/Support/ErrorOr.h"  #include "llvm/Support/FileSystem.h" +#include "llvm/Support/MemoryBuffer.h"  namespace llvm {  class LLVMContext; -class MemoryBuffer;  class StringRef;  namespace object { @@ -34,9 +34,9 @@ private:    unsigned int TypeID;  protected: -  std::unique_ptr<MemoryBuffer> Data; +  MemoryBufferRef Data; -  Binary(unsigned int Type, std::unique_ptr<MemoryBuffer> Source); +  Binary(unsigned int Type, MemoryBufferRef Source);    enum {      ID_Archive, @@ -78,8 +78,8 @@ public:    virtual ~Binary();    StringRef getData() const; -  MemoryBuffer *releaseBuffer() { return Data.release(); }    StringRef getFileName() const; +  MemoryBufferRef getMemoryBufferRef() const;    // Cast methods.    unsigned int getType() const { return TypeID; } @@ -125,13 +125,59 @@ public:  /// @brief Create a Binary from Source, autodetecting the file type.  /// -/// @param Source The data to create the Binary from. Ownership is transferred -///        to the Binary if successful. If an error is returned, -///        Source is destroyed by createBinary before returning. -ErrorOr<Binary *> createBinary(std::unique_ptr<MemoryBuffer> &Source, -                               LLVMContext *Context = nullptr); +/// @param Source The data to create the Binary from. +ErrorOr<std::unique_ptr<Binary>> createBinary(MemoryBufferRef Source, +                                              LLVMContext *Context = nullptr); -ErrorOr<Binary *> createBinary(StringRef Path); +template <typename T> class OwningBinary { +  std::unique_ptr<T> Bin; +  std::unique_ptr<MemoryBuffer> Buf; + +public: +  OwningBinary(); +  OwningBinary(std::unique_ptr<T> Bin, std::unique_ptr<MemoryBuffer> Buf); +  OwningBinary(OwningBinary<T>&& Other); +  OwningBinary<T> &operator=(OwningBinary<T> &&Other); + +  std::pair<std::unique_ptr<T>, std::unique_ptr<MemoryBuffer>> takeBinary(); + +  T* getBinary(); +  const T* getBinary() const; +}; + +template <typename T> +OwningBinary<T>::OwningBinary(std::unique_ptr<T> Bin, +                              std::unique_ptr<MemoryBuffer> Buf) +    : Bin(std::move(Bin)), Buf(std::move(Buf)) {} + +template <typename T> OwningBinary<T>::OwningBinary() {} + +template <typename T> +OwningBinary<T>::OwningBinary(OwningBinary &&Other) +    : Bin(std::move(Other.Bin)), Buf(std::move(Other.Buf)) {} + +template <typename T> +OwningBinary<T> &OwningBinary<T>::operator=(OwningBinary &&Other) { +  Bin = std::move(Other.Bin); +  Buf = std::move(Other.Buf); +  return *this; +} + +template <typename T> +std::pair<std::unique_ptr<T>, std::unique_ptr<MemoryBuffer>> +OwningBinary<T>::takeBinary() { +  return std::make_pair(std::move(Bin), std::move(Buf)); +} + +template <typename T> T* OwningBinary<T>::getBinary() { +  return Bin.get(); +} + +template <typename T> const T* OwningBinary<T>::getBinary() const { +  return Bin.get(); +} + +ErrorOr<OwningBinary<Binary>> createBinary(StringRef Path);  }  } diff --git a/include/llvm/Object/COFF.h b/include/llvm/Object/COFF.h index e2da070..3368d68 100644 --- a/include/llvm/Object/COFF.h +++ b/include/llvm/Object/COFF.h @@ -14,22 +14,31 @@  #ifndef LLVM_OBJECT_COFF_H  #define LLVM_OBJECT_COFF_H +#include "llvm/ADT/PointerUnion.h"  #include "llvm/Object/ObjectFile.h"  #include "llvm/Support/COFF.h"  #include "llvm/Support/Endian.h" +#include "llvm/Support/ErrorOr.h"  namespace llvm {  template <typename T> class ArrayRef;  namespace object {  class ImportDirectoryEntryRef; +class DelayImportDirectoryEntryRef;  class ExportDirectoryEntryRef; +class ImportedSymbolRef; +class BaseRelocRef;  typedef content_iterator<ImportDirectoryEntryRef> import_directory_iterator; +typedef content_iterator<DelayImportDirectoryEntryRef> +    delay_import_directory_iterator;  typedef content_iterator<ExportDirectoryEntryRef> export_directory_iterator; +typedef content_iterator<ImportedSymbolRef> imported_symbol_iterator; +typedef content_iterator<BaseRelocRef> base_reloc_iterator;  /// The DOS compatible header at the front of all PE/COFF executables.  struct dos_header { -  support::ulittle16_t Magic; +  char                 Magic[2];    support::ulittle16_t UsedBytesInTheLastPage;    support::ulittle16_t FileSizeInPages;    support::ulittle16_t NumberOfRelocationItems; @@ -62,6 +71,22 @@ struct coff_file_header {    bool isImportLibrary() const { return NumberOfSections == 0xffff; }  }; +struct coff_bigobj_file_header { +  support::ulittle16_t Sig1; +  support::ulittle16_t Sig2; +  support::ulittle16_t Version; +  support::ulittle16_t Machine; +  support::ulittle32_t TimeDateStamp; +  uint8_t              UUID[16]; +  support::ulittle32_t unused1; +  support::ulittle32_t unused2; +  support::ulittle32_t unused3; +  support::ulittle32_t unused4; +  support::ulittle32_t NumberOfSections; +  support::ulittle32_t PointerToSymbolTable; +  support::ulittle32_t NumberOfSymbols; +}; +  /// The 32-bit PE header that follows the COFF header.  struct pe32_header {    support::ulittle16_t Magic; @@ -87,12 +112,14 @@ struct pe32_header {    support::ulittle32_t SizeOfHeaders;    support::ulittle32_t CheckSum;    support::ulittle16_t Subsystem; +  // FIXME: This should be DllCharacteristics.    support::ulittle16_t DLLCharacteristics;    support::ulittle32_t SizeOfStackReserve;    support::ulittle32_t SizeOfStackCommit;    support::ulittle32_t SizeOfHeapReserve;    support::ulittle32_t SizeOfHeapCommit;    support::ulittle32_t LoaderFlags; +  // FIXME: This should be NumberOfRvaAndSizes.    support::ulittle32_t NumberOfRvaAndSize;  }; @@ -142,22 +169,40 @@ struct import_directory_table_entry {    support::ulittle32_t ImportAddressTableRVA;  }; -struct import_lookup_table_entry32 { -  support::ulittle32_t data; +template <typename IntTy> +struct import_lookup_table_entry { +  IntTy Data; -  bool isOrdinal() const { return data & 0x80000000; } +  bool isOrdinal() const { return Data < 0; }    uint16_t getOrdinal() const {      assert(isOrdinal() && "ILT entry is not an ordinal!"); -    return data & 0xFFFF; +    return Data & 0xFFFF;    }    uint32_t getHintNameRVA() const {      assert(!isOrdinal() && "ILT entry is not a Hint/Name RVA!"); -    return data; +    return Data & 0xFFFFFFFF;    }  }; +typedef import_lookup_table_entry<support::little32_t> +    import_lookup_table_entry32; +typedef import_lookup_table_entry<support::little64_t> +    import_lookup_table_entry64; + +struct delay_import_directory_table_entry { +  // dumpbin reports this field as "Characteristics" instead of "Attributes". +  support::ulittle32_t Attributes; +  support::ulittle32_t Name; +  support::ulittle32_t ModuleHandle; +  support::ulittle32_t DelayImportAddressTable; +  support::ulittle32_t DelayImportNameTable; +  support::ulittle32_t BoundDelayImportTable; +  support::ulittle32_t UnloadDelayImportTable; +  support::ulittle32_t TimeStamp; +}; +  struct export_directory_table_entry {    support::ulittle32_t ExportFlags;    support::ulittle32_t TimeDateStamp; @@ -180,67 +225,147 @@ union export_address_table_entry {  typedef support::ulittle32_t export_name_pointer_table_entry;  typedef support::ulittle16_t export_ordinal_table_entry; -struct coff_symbol { -  struct StringTableOffset { -    support::ulittle32_t Zeroes; -    support::ulittle32_t Offset; -  }; +struct StringTableOffset { +  support::ulittle32_t Zeroes; +  support::ulittle32_t Offset; +}; +template <typename SectionNumberType> +struct coff_symbol {    union { -    char ShortName[8]; +    char ShortName[COFF::NameSize];      StringTableOffset Offset;    } Name;    support::ulittle32_t Value; -  support::ulittle16_t SectionNumber; +  SectionNumberType SectionNumber;    support::ulittle16_t Type; -  support::ulittle8_t StorageClass; -  support::ulittle8_t NumberOfAuxSymbols; +  uint8_t StorageClass; +  uint8_t NumberOfAuxSymbols; +}; + +typedef coff_symbol<support::ulittle16_t> coff_symbol16; +typedef coff_symbol<support::ulittle32_t> coff_symbol32; -  uint8_t getBaseType() const { return Type & 0x0F; } +class COFFSymbolRef { +public: +  COFFSymbolRef(const coff_symbol16 *CS) : CS16(CS), CS32(nullptr) {} +  COFFSymbolRef(const coff_symbol32 *CS) : CS16(nullptr), CS32(CS) {} +  COFFSymbolRef() : CS16(nullptr), CS32(nullptr) {} + +  const void *getRawPtr() const { +    return CS16 ? static_cast<const void *>(CS16) : CS32; +  } + +  friend bool operator<(COFFSymbolRef A, COFFSymbolRef B) { +    return A.getRawPtr() < B.getRawPtr(); +  } + +  bool isBigObj() const { +    if (CS16) +      return false; +    if (CS32) +      return true; +    llvm_unreachable("COFFSymbolRef points to nothing!"); +  } + +  const char *getShortName() const { +    return CS16 ? CS16->Name.ShortName : CS32->Name.ShortName; +  } + +  const StringTableOffset &getStringTableOffset() const { +    return CS16 ? CS16->Name.Offset : CS32->Name.Offset; +  } + +  uint32_t getValue() const { return CS16 ? CS16->Value : CS32->Value; } + +  int32_t getSectionNumber() const { +    if (CS16) { +      // Reserved sections are returned as negative numbers. +      if (CS16->SectionNumber <= COFF::MaxNumberOfSections16) +        return CS16->SectionNumber; +      return static_cast<int16_t>(CS16->SectionNumber); +    } +    return static_cast<int32_t>(CS32->SectionNumber); +  } -  uint8_t getComplexType() const { return (Type & 0xF0) >> 4; } +  uint16_t getType() const { return CS16 ? CS16->Type : CS32->Type; } + +  uint8_t getStorageClass() const { +    return CS16 ? CS16->StorageClass : CS32->StorageClass; +  } + +  uint8_t getNumberOfAuxSymbols() const { +    return CS16 ? CS16->NumberOfAuxSymbols : CS32->NumberOfAuxSymbols; +  } + +  uint8_t getBaseType() const { return getType() & 0x0F; } + +  uint8_t getComplexType() const { +    return (getType() & 0xF0) >> COFF::SCT_COMPLEX_TYPE_SHIFT; +  } + +  bool isExternal() const { +    return getStorageClass() == COFF::IMAGE_SYM_CLASS_EXTERNAL; +  } + +  bool isCommon() const { +    return isExternal() && getSectionNumber() == COFF::IMAGE_SYM_UNDEFINED && +           getValue() != 0; +  } + +  bool isUndefined() const { +    return isExternal() && getSectionNumber() == COFF::IMAGE_SYM_UNDEFINED && +           getValue() == 0; +  } + +  bool isWeakExternal() const { +    return getStorageClass() == COFF::IMAGE_SYM_CLASS_WEAK_EXTERNAL; +  }    bool isFunctionDefinition() const { -    return StorageClass == COFF::IMAGE_SYM_CLASS_EXTERNAL && -           getBaseType() == COFF::IMAGE_SYM_TYPE_NULL && +    return isExternal() && getBaseType() == COFF::IMAGE_SYM_TYPE_NULL &&             getComplexType() == COFF::IMAGE_SYM_DTYPE_FUNCTION && -           !COFF::isReservedSectionNumber(SectionNumber); +           !COFF::isReservedSectionNumber(getSectionNumber());    }    bool isFunctionLineInfo() const { -    return StorageClass == COFF::IMAGE_SYM_CLASS_FUNCTION; +    return getStorageClass() == COFF::IMAGE_SYM_CLASS_FUNCTION;    } -  bool isWeakExternal() const { -    return StorageClass == COFF::IMAGE_SYM_CLASS_WEAK_EXTERNAL || -           (StorageClass == COFF::IMAGE_SYM_CLASS_EXTERNAL && -            SectionNumber == COFF::IMAGE_SYM_UNDEFINED && Value == 0); +  bool isAnyUndefined() const { +    return isUndefined() || isWeakExternal();    }    bool isFileRecord() const { -    return StorageClass == COFF::IMAGE_SYM_CLASS_FILE; +    return getStorageClass() == COFF::IMAGE_SYM_CLASS_FILE;    }    bool isSectionDefinition() const {      // C++/CLI creates external ABS symbols for non-const appdomain globals.      // These are also followed by an auxiliary section definition. -    bool isAppdomainGlobal = StorageClass == COFF::IMAGE_SYM_CLASS_EXTERNAL && -                             SectionNumber == COFF::IMAGE_SYM_ABSOLUTE; -    bool isOrdinarySection = -        StorageClass == COFF::IMAGE_SYM_CLASS_STATIC && Value == 0; +    bool isAppdomainGlobal = +        getStorageClass() == COFF::IMAGE_SYM_CLASS_EXTERNAL && +        getSectionNumber() == COFF::IMAGE_SYM_ABSOLUTE; +    bool isOrdinarySection = getStorageClass() == COFF::IMAGE_SYM_CLASS_STATIC; +    if (!getNumberOfAuxSymbols()) +      return false;      return isAppdomainGlobal || isOrdinarySection;    }    bool isCLRToken() const { -    return StorageClass == COFF::IMAGE_SYM_CLASS_CLR_TOKEN; +    return getStorageClass() == COFF::IMAGE_SYM_CLASS_CLR_TOKEN;    } + +private: +  const coff_symbol16 *CS16; +  const coff_symbol32 *CS32;  };  struct coff_section { -  char Name[8]; +  char Name[COFF::NameSize];    support::ulittle32_t VirtualSize;    support::ulittle32_t VirtualAddress;    support::ulittle32_t SizeOfRawData; @@ -254,9 +379,9 @@ struct coff_section {    // Returns true if the actual number of relocations is stored in    // VirtualAddress field of the first relocation table entry.    bool hasExtendedRelocations() const { -    return Characteristics & COFF::IMAGE_SCN_LNK_NRELOC_OVFL && -        NumberOfRelocations == UINT16_MAX; -  }; +    return (Characteristics & COFF::IMAGE_SCN_LNK_NRELOC_OVFL) && +           NumberOfRelocations == UINT16_MAX; +  }  };  struct coff_relocation { @@ -270,7 +395,6 @@ struct coff_aux_function_definition {    support::ulittle32_t TotalSize;    support::ulittle32_t PointerToLinenumber;    support::ulittle32_t PointerToNextFunction; -  char Unused[2];  };  struct coff_aux_bf_and_ef_symbol { @@ -278,17 +402,11 @@ struct coff_aux_bf_and_ef_symbol {    support::ulittle16_t Linenumber;    char Unused2[6];    support::ulittle32_t PointerToNextFunction; -  char Unused3[2];  };  struct coff_aux_weak_external {    support::ulittle32_t TagIndex;    support::ulittle32_t Characteristics; -  char Unused[10]; -}; - -struct coff_aux_file { -  char FileName[18];  };  struct coff_aux_section_definition { @@ -296,16 +414,22 @@ struct coff_aux_section_definition {    support::ulittle16_t NumberOfRelocations;    support::ulittle16_t NumberOfLinenumbers;    support::ulittle32_t CheckSum; -  support::ulittle16_t Number; -  support::ulittle8_t Selection; -  char Unused[3]; +  support::ulittle16_t NumberLowPart; +  uint8_t              Selection; +  uint8_t              Unused; +  support::ulittle16_t NumberHighPart; +  int32_t getNumber(bool IsBigObj) const { +    uint32_t Number = static_cast<uint32_t>(NumberLowPart); +    if (IsBigObj) +      Number |= static_cast<uint32_t>(NumberHighPart) << 16; +    return static_cast<int32_t>(Number); +  }  };  struct coff_aux_clr_token { -  support::ulittle8_t AuxType; -  support::ulittle8_t Reserved; +  uint8_t              AuxType; +  uint8_t              Reserved;    support::ulittle32_t SymbolTableIndex; -  char Unused[12];  };  struct coff_load_configuration32 { @@ -324,7 +448,7 @@ struct coff_load_configuration32 {    support::ulittle32_t ProcessAffinityMask;    support::ulittle32_t ProcessHeapFlags;    support::ulittle16_t CSDVersion; -  uint16_t Reserved; +  support::ulittle16_t Reserved;    support::ulittle32_t EditList;    support::ulittle32_t SecurityCookie;    support::ulittle32_t SEHandlerTable; @@ -337,32 +461,114 @@ struct coff_runtime_function_x64 {    support::ulittle32_t UnwindInformation;  }; +struct coff_base_reloc_block_header { +  support::ulittle32_t PageRVA; +  support::ulittle32_t BlockSize; +}; + +struct coff_base_reloc_block_entry { +  support::ulittle16_t Data; +  int getType() const { return Data >> 12; } +  int getOffset() const { return Data & ((1 << 12) - 1); } +}; +  class COFFObjectFile : public ObjectFile {  private:    friend class ImportDirectoryEntryRef;    friend class ExportDirectoryEntryRef;    const coff_file_header *COFFHeader; +  const coff_bigobj_file_header *COFFBigObjHeader;    const pe32_header *PE32Header;    const pe32plus_header *PE32PlusHeader;    const data_directory *DataDirectory;    const coff_section *SectionTable; -  const coff_symbol *SymbolTable; +  const coff_symbol16 *SymbolTable16; +  const coff_symbol32 *SymbolTable32;    const char *StringTable;    uint32_t StringTableSize;    const import_directory_table_entry *ImportDirectory;    uint32_t NumberOfImportDirectory; +  const delay_import_directory_table_entry *DelayImportDirectory; +  uint32_t NumberOfDelayImportDirectory;    const export_directory_table_entry *ExportDirectory; +  const coff_base_reloc_block_header *BaseRelocHeader; +  const coff_base_reloc_block_header *BaseRelocEnd;    std::error_code getString(uint32_t offset, StringRef &Res) const; -  const coff_symbol *toSymb(DataRefImpl Symb) const; +  template <typename coff_symbol_type> +  const coff_symbol_type *toSymb(DataRefImpl Symb) const;    const coff_section *toSec(DataRefImpl Sec) const;    const coff_relocation *toRel(DataRefImpl Rel) const;    std::error_code initSymbolTablePtr();    std::error_code initImportTablePtr(); +  std::error_code initDelayImportTablePtr();    std::error_code initExportTablePtr(); +  std::error_code initBaseRelocPtr(); +public: +  uintptr_t getSymbolTable() const { +    if (SymbolTable16) +      return reinterpret_cast<uintptr_t>(SymbolTable16); +    if (SymbolTable32) +      return reinterpret_cast<uintptr_t>(SymbolTable32); +    return uintptr_t(0); +  } +  uint16_t getMachine() const { +    if (COFFHeader) +      return COFFHeader->Machine; +    if (COFFBigObjHeader) +      return COFFBigObjHeader->Machine; +    llvm_unreachable("no COFF header!"); +  } +  uint16_t getSizeOfOptionalHeader() const { +    if (COFFHeader) +      return COFFHeader->isImportLibrary() ? 0 +                                           : COFFHeader->SizeOfOptionalHeader; +    // bigobj doesn't have this field. +    if (COFFBigObjHeader) +      return 0; +    llvm_unreachable("no COFF header!"); +  } +  uint16_t getCharacteristics() const { +    if (COFFHeader) +      return COFFHeader->isImportLibrary() ? 0 : COFFHeader->Characteristics; +    // bigobj doesn't have characteristics to speak of, +    // editbin will silently lie to you if you attempt to set any. +    if (COFFBigObjHeader) +      return 0; +    llvm_unreachable("no COFF header!"); +  } +  uint32_t getTimeDateStamp() const { +    if (COFFHeader) +      return COFFHeader->TimeDateStamp; +    if (COFFBigObjHeader) +      return COFFBigObjHeader->TimeDateStamp; +    llvm_unreachable("no COFF header!"); +  } +  uint32_t getNumberOfSections() const { +    if (COFFHeader) +      return COFFHeader->isImportLibrary() ? 0 : COFFHeader->NumberOfSections; +    if (COFFBigObjHeader) +      return COFFBigObjHeader->NumberOfSections; +    llvm_unreachable("no COFF header!"); +  } +  uint32_t getPointerToSymbolTable() const { +    if (COFFHeader) +      return COFFHeader->isImportLibrary() ? 0 +                                           : COFFHeader->PointerToSymbolTable; +    if (COFFBigObjHeader) +      return COFFBigObjHeader->PointerToSymbolTable; +    llvm_unreachable("no COFF header!"); +  } +  uint32_t getNumberOfSymbols() const { +    if (COFFHeader) +      return COFFHeader->isImportLibrary() ? 0 : COFFHeader->NumberOfSymbols; +    if (COFFBigObjHeader) +      return COFFBigObjHeader->NumberOfSymbols; +    llvm_unreachable("no COFF header!"); +  }  protected:    void moveSymbolNext(DataRefImpl &Symb) const override;    std::error_code getSymbolName(DataRefImpl Symb, @@ -378,24 +584,19 @@ protected:    void moveSectionNext(DataRefImpl &Sec) const override;    std::error_code getSectionName(DataRefImpl Sec,                                   StringRef &Res) const override; -  std::error_code getSectionAddress(DataRefImpl Sec, -                                    uint64_t &Res) const override; -  std::error_code getSectionSize(DataRefImpl Sec, uint64_t &Res) const override; +  uint64_t getSectionAddress(DataRefImpl Sec) const override; +  uint64_t getSectionSize(DataRefImpl Sec) const override;    std::error_code getSectionContents(DataRefImpl Sec,                                       StringRef &Res) const override; -  std::error_code getSectionAlignment(DataRefImpl Sec, -                                      uint64_t &Res) const override; -  std::error_code isSectionText(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionData(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionBSS(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionVirtual(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionZeroInit(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionReadOnlyData(DataRefImpl Sec, -                                        bool &Res) const override; -  std::error_code isSectionRequiredForExecution(DataRefImpl Sec, -                                                bool &Res) const override; -  std::error_code sectionContainsSymbol(DataRefImpl Sec, DataRefImpl Symb, -                                        bool &Result) const override; +  uint64_t getSectionAlignment(DataRefImpl Sec) const override; +  bool isSectionText(DataRefImpl Sec) const override; +  bool isSectionData(DataRefImpl Sec) const override; +  bool isSectionBSS(DataRefImpl Sec) const override; +  bool isSectionVirtual(DataRefImpl Sec) const override; +  bool isSectionZeroInit(DataRefImpl Sec) const override; +  bool isSectionReadOnlyData(DataRefImpl Sec) const override; +  bool isSectionRequiredForExecution(DataRefImpl Sec) const override; +  bool sectionContainsSymbol(DataRefImpl Sec, DataRefImpl Symb) const override;    relocation_iterator section_rel_begin(DataRefImpl Sec) const override;    relocation_iterator section_rel_end(DataRefImpl Sec) const override; @@ -414,54 +615,93 @@ protected:    getRelocationValueString(DataRefImpl Rel,                             SmallVectorImpl<char> &Result) const override; -  std::error_code getLibraryNext(DataRefImpl LibData, -                                 LibraryRef &Result) const override; -  std::error_code getLibraryPath(DataRefImpl LibData, -                                 StringRef &Result) const override; -  public: -  COFFObjectFile(std::unique_ptr<MemoryBuffer> Object, std::error_code &EC); +  COFFObjectFile(MemoryBufferRef Object, std::error_code &EC);    basic_symbol_iterator symbol_begin_impl() const override;    basic_symbol_iterator symbol_end_impl() const override; -  library_iterator needed_library_begin() const override; -  library_iterator needed_library_end() const override;    section_iterator section_begin() const override;    section_iterator section_end() const override;    const coff_section *getCOFFSection(const SectionRef &Section) const; -  const coff_symbol *getCOFFSymbol(const SymbolRef &Symbol) const; +  COFFSymbolRef getCOFFSymbol(const DataRefImpl &Ref) const; +  COFFSymbolRef getCOFFSymbol(const SymbolRef &Symbol) const;    const coff_relocation *getCOFFRelocation(const RelocationRef &Reloc) const;    uint8_t getBytesInAddress() const override;    StringRef getFileFormatName() const override;    unsigned getArch() const override; -  StringRef getLoadName() const override;    import_directory_iterator import_directory_begin() const;    import_directory_iterator import_directory_end() const; +  delay_import_directory_iterator delay_import_directory_begin() const; +  delay_import_directory_iterator delay_import_directory_end() const;    export_directory_iterator export_directory_begin() const;    export_directory_iterator export_directory_end() const; - -  std::error_code getHeader(const coff_file_header *&Res) const; -  std::error_code getCOFFHeader(const coff_file_header *&Res) const; +  base_reloc_iterator base_reloc_begin() const; +  base_reloc_iterator base_reloc_end() const; + +  iterator_range<import_directory_iterator> import_directories() const; +  iterator_range<delay_import_directory_iterator> +      delay_import_directories() const; +  iterator_range<export_directory_iterator> export_directories() const; +  iterator_range<base_reloc_iterator> base_relocs() const; + +  const dos_header *getDOSHeader() const { +    if (!PE32Header && !PE32PlusHeader) +      return nullptr; +    return reinterpret_cast<const dos_header *>(base()); +  }    std::error_code getPE32Header(const pe32_header *&Res) const;    std::error_code getPE32PlusHeader(const pe32plus_header *&Res) const;    std::error_code getDataDirectory(uint32_t index,                                     const data_directory *&Res) const;    std::error_code getSection(int32_t index, const coff_section *&Res) const; -  std::error_code getSymbol(uint32_t index, const coff_symbol *&Res) const; +  template <typename coff_symbol_type> +  std::error_code getSymbol(uint32_t Index, +                            const coff_symbol_type *&Res) const { +    if (Index >= getNumberOfSymbols()) +      return object_error::parse_failed; + +    Res = reinterpret_cast<coff_symbol_type *>(getSymbolTable()) + Index; +    return object_error::success; +  } +  ErrorOr<COFFSymbolRef> getSymbol(uint32_t index) const { +    if (SymbolTable16) { +      const coff_symbol16 *Symb = nullptr; +      if (std::error_code EC = getSymbol(index, Symb)) +        return EC; +      return COFFSymbolRef(Symb); +    } +    if (SymbolTable32) { +      const coff_symbol32 *Symb = nullptr; +      if (std::error_code EC = getSymbol(index, Symb)) +        return EC; +      return COFFSymbolRef(Symb); +    } +    return object_error::parse_failed; +  }    template <typename T>    std::error_code getAuxSymbol(uint32_t index, const T *&Res) const { -    const coff_symbol *s; -    std::error_code ec = getSymbol(index, s); -    Res = reinterpret_cast<const T *>(s); -    return ec; +    ErrorOr<COFFSymbolRef> s = getSymbol(index); +    if (std::error_code EC = s.getError()) +      return EC; +    Res = reinterpret_cast<const T *>(s->getRawPtr()); +    return object_error::success; +  } +  std::error_code getSymbolName(COFFSymbolRef Symbol, StringRef &Res) const; + +  ArrayRef<uint8_t> getSymbolAuxData(COFFSymbolRef Symbol) const; + +  size_t getSymbolTableEntrySize() const { +    if (COFFHeader) +      return sizeof(coff_symbol16); +    if (COFFBigObjHeader) +      return sizeof(coff_symbol32); +    llvm_unreachable("null symbol table pointer!");    } -  std::error_code getSymbolName(const coff_symbol *symbol, -                                StringRef &Res) const; -  ArrayRef<uint8_t> getSymbolAuxData(const coff_symbol *symbol) const;    std::error_code getSectionName(const coff_section *Sec, StringRef &Res) const; +  uint64_t getSectionSize(const coff_section *Sec) const;    std::error_code getSectionContents(const coff_section *Sec,                                       ArrayRef<uint8_t> &Res) const; @@ -470,6 +710,9 @@ public:    std::error_code getHintName(uint32_t Rva, uint16_t &Hint,                                StringRef &Name) const; +  bool isRelocatableObject() const override; +  bool is64() const { return PE32PlusHeader; } +    static inline bool classof(const Binary *v) { return v->isCOFF(); }  }; @@ -483,7 +726,14 @@ public:    bool operator==(const ImportDirectoryEntryRef &Other) const;    void moveNext(); + +  imported_symbol_iterator imported_symbol_begin() const; +  imported_symbol_iterator imported_symbol_end() const; +  iterator_range<imported_symbol_iterator> imported_symbols() const; +    std::error_code getName(StringRef &Result) const; +  std::error_code getImportLookupTableRVA(uint32_t &Result) const; +  std::error_code getImportAddressTableRVA(uint32_t &Result) const;    std::error_code    getImportTableEntry(const import_directory_table_entry *&Result) const; @@ -497,6 +747,31 @@ private:    const COFFObjectFile *OwningObject;  }; +class DelayImportDirectoryEntryRef { +public: +  DelayImportDirectoryEntryRef() : OwningObject(nullptr) {} +  DelayImportDirectoryEntryRef(const delay_import_directory_table_entry *T, +                               uint32_t I, const COFFObjectFile *Owner) +      : Table(T), Index(I), OwningObject(Owner) {} + +  bool operator==(const DelayImportDirectoryEntryRef &Other) const; +  void moveNext(); + +  imported_symbol_iterator imported_symbol_begin() const; +  imported_symbol_iterator imported_symbol_end() const; +  iterator_range<imported_symbol_iterator> imported_symbols() const; + +  std::error_code getName(StringRef &Result) const; +  std::error_code getDelayImportTable( +      const delay_import_directory_table_entry *&Result) const; +  std::error_code getImportAddress(int AddrIndex, uint64_t &Result) const; + +private: +  const delay_import_directory_table_entry *Table; +  uint32_t Index; +  const COFFObjectFile *OwningObject; +}; +  // The iterator for the export directory table entry.  class ExportDirectoryEntryRef {  public: @@ -519,6 +794,49 @@ private:    uint32_t Index;    const COFFObjectFile *OwningObject;  }; + +class ImportedSymbolRef { +public: +  ImportedSymbolRef() : OwningObject(nullptr) {} +  ImportedSymbolRef(const import_lookup_table_entry32 *Entry, uint32_t I, +                    const COFFObjectFile *Owner) +      : Entry32(Entry), Entry64(nullptr), Index(I), OwningObject(Owner) {} +  ImportedSymbolRef(const import_lookup_table_entry64 *Entry, uint32_t I, +                    const COFFObjectFile *Owner) +      : Entry32(nullptr), Entry64(Entry), Index(I), OwningObject(Owner) {} + +  bool operator==(const ImportedSymbolRef &Other) const; +  void moveNext(); + +  std::error_code getSymbolName(StringRef &Result) const; +  std::error_code getOrdinal(uint16_t &Result) const; + +private: +  const import_lookup_table_entry32 *Entry32; +  const import_lookup_table_entry64 *Entry64; +  uint32_t Index; +  const COFFObjectFile *OwningObject; +}; + +class BaseRelocRef { +public: +  BaseRelocRef() : OwningObject(nullptr) {} +  BaseRelocRef(const coff_base_reloc_block_header *Header, +               const COFFObjectFile *Owner) +      : Header(Header), Index(0), OwningObject(Owner) {} + +  bool operator==(const BaseRelocRef &Other) const; +  void moveNext(); + +  std::error_code getType(uint8_t &Type) const; +  std::error_code getRVA(uint32_t &Result) const; + +private: +  const coff_base_reloc_block_header *Header; +  uint32_t Index; +  const COFFObjectFile *OwningObject; +}; +  } // end namespace object  } // end namespace llvm diff --git a/include/llvm/Object/COFFYAML.h b/include/llvm/Object/COFFYAML.h index 4aba08f..12a2522 100644 --- a/include/llvm/Object/COFFYAML.h +++ b/include/llvm/Object/COFFYAML.h @@ -31,6 +31,12 @@ inline SectionCharacteristics operator|(SectionCharacteristics a,    uint32_t Ret = static_cast<uint32_t>(a) | static_cast<uint32_t>(b);    return static_cast<SectionCharacteristics>(Ret);  } + +inline DLLCharacteristics operator|(DLLCharacteristics a, +                                    DLLCharacteristics b) { +  uint16_t Ret = static_cast<uint16_t>(a) | static_cast<uint16_t>(b); +  return static_cast<DLLCharacteristics>(Ret); +}  }  // The structure of the yaml files is not an exact 1:1 match to COFF. In order @@ -69,7 +75,13 @@ namespace COFFYAML {      Symbol();    }; +  struct PEHeader { +    COFF::PE32Header Header; +    Optional<COFF::DataDirectory> DataDirectories[COFF::NUM_DATA_DIRECTORIES]; +  }; +    struct Object { +    Optional<PEHeader> OptionalHeader;      COFF::header Header;      std::vector<Section> Sections;      std::vector<Symbol> Symbols; @@ -131,6 +143,11 @@ struct ScalarEnumerationTraits<COFF::RelocationTypeAMD64> {  };  template <> +struct ScalarEnumerationTraits<COFF::WindowsSubsystem> { +  static void enumeration(IO &IO, COFF::WindowsSubsystem &Value); +}; + +template <>  struct ScalarBitSetTraits<COFF::Characteristics> {    static void bitset(IO &IO, COFF::Characteristics &Value);  }; @@ -141,11 +158,26 @@ struct ScalarBitSetTraits<COFF::SectionCharacteristics> {  };  template <> +struct ScalarBitSetTraits<COFF::DLLCharacteristics> { +  static void bitset(IO &IO, COFF::DLLCharacteristics &Value); +}; + +template <>  struct MappingTraits<COFFYAML::Relocation> {    static void mapping(IO &IO, COFFYAML::Relocation &Rel);  };  template <> +struct MappingTraits<COFFYAML::PEHeader> { +  static void mapping(IO &IO, COFFYAML::PEHeader &PH); +}; + +template <> +struct MappingTraits<COFF::DataDirectory> { +  static void mapping(IO &IO, COFF::DataDirectory &DD); +}; + +template <>  struct MappingTraits<COFF::header> {    static void mapping(IO &IO, COFF::header &H);  }; diff --git a/include/llvm/Object/ELF.h b/include/llvm/Object/ELF.h index fbc48e6..7c10bbf 100644 --- a/include/llvm/Object/ELF.h +++ b/include/llvm/Object/ELF.h @@ -540,7 +540,7 @@ ELFFile<ELFT>::getSectionContents(const Elf_Shdr *Sec) const {    if (Sec->sh_offset + Sec->sh_size > Buf.size())      return object_error::parse_failed;    const uint8_t *Start = base() + Sec->sh_offset; -  return ArrayRef<uint8_t>(Start, Sec->sh_size); +  return makeArrayRef(Start, Sec->sh_size);  }  template <class ELFT> diff --git a/include/llvm/Object/ELFObjectFile.h b/include/llvm/Object/ELFObjectFile.h index cfb6b08..3fcd98d 100644 --- a/include/llvm/Object/ELFObjectFile.h +++ b/include/llvm/Object/ELFObjectFile.h @@ -11,8 +11,8 @@  //  //===----------------------------------------------------------------------===// -#ifndef LLVM_OBJECT_ELF_OBJECT_FILE_H -#define LLVM_OBJECT_ELF_OBJECT_FILE_H +#ifndef LLVM_OBJECT_ELFOBJECTFILE_H +#define LLVM_OBJECT_ELFOBJECTFILE_H  #include "llvm/ADT/DenseMap.h"  #include "llvm/ADT/PointerIntPair.h" @@ -35,8 +35,23 @@  namespace llvm {  namespace object { -template <class ELFT> -class ELFObjectFile : public ObjectFile { +class ELFObjectFileBase : public ObjectFile { +protected: +  ELFObjectFileBase(unsigned int Type, MemoryBufferRef Source); + +public: +  virtual std::error_code getRelocationAddend(DataRefImpl Rel, +                                              int64_t &Res) const = 0; +  virtual std::pair<symbol_iterator, symbol_iterator> +  getELFDynamicSymbolIterators() const = 0; + +  virtual std::error_code getSymbolVersion(SymbolRef Symb, StringRef &Version, +                                           bool &IsDefault) const = 0; + +  static inline bool classof(const Binary *v) { return v->isELF(); } +}; + +template <class ELFT> class ELFObjectFile : public ELFObjectFileBase {  public:    LLVM_ELF_IMPORT_TYPES_ELFT(ELFT) @@ -65,37 +80,28 @@ protected:                                       uint32_t &Res) const override;    std::error_code getSymbolSize(DataRefImpl Symb, uint64_t &Res) const override;    uint32_t getSymbolFlags(DataRefImpl Symb) const override; +  std::error_code getSymbolOther(DataRefImpl Symb, uint8_t &Res) const override;    std::error_code getSymbolType(DataRefImpl Symb,                                  SymbolRef::Type &Res) const override;    std::error_code getSymbolSection(DataRefImpl Symb,                                     section_iterator &Res) const override; -  std::error_code getLibraryNext(DataRefImpl Data, -                                 LibraryRef &Result) const override; -  std::error_code getLibraryPath(DataRefImpl Data, -                                 StringRef &Res) const override; -    void moveSectionNext(DataRefImpl &Sec) const override;    std::error_code getSectionName(DataRefImpl Sec,                                   StringRef &Res) const override; -  std::error_code getSectionAddress(DataRefImpl Sec, -                                    uint64_t &Res) const override; -  std::error_code getSectionSize(DataRefImpl Sec, uint64_t &Res) const override; +  uint64_t getSectionAddress(DataRefImpl Sec) const override; +  uint64_t getSectionSize(DataRefImpl Sec) const override;    std::error_code getSectionContents(DataRefImpl Sec,                                       StringRef &Res) const override; -  std::error_code getSectionAlignment(DataRefImpl Sec, -                                      uint64_t &Res) const override; -  std::error_code isSectionText(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionData(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionBSS(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionRequiredForExecution(DataRefImpl Sec, -                                                bool &Res) const override; -  std::error_code isSectionVirtual(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionZeroInit(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionReadOnlyData(DataRefImpl Sec, -                                        bool &Res) const override; -  std::error_code sectionContainsSymbol(DataRefImpl Sec, DataRefImpl Symb, -                                        bool &Result) const override; +  uint64_t getSectionAlignment(DataRefImpl Sec) const override; +  bool isSectionText(DataRefImpl Sec) const override; +  bool isSectionData(DataRefImpl Sec) const override; +  bool isSectionBSS(DataRefImpl Sec) const override; +  bool isSectionRequiredForExecution(DataRefImpl Sec) const override; +  bool isSectionVirtual(DataRefImpl Sec) const override; +  bool isSectionZeroInit(DataRefImpl Sec) const override; +  bool isSectionReadOnlyData(DataRefImpl Sec) const override; +  bool sectionContainsSymbol(DataRefImpl Sec, DataRefImpl Symb) const override;    relocation_iterator section_rel_begin(DataRefImpl Sec) const override;    relocation_iterator section_rel_end(DataRefImpl Sec) const override;    section_iterator getRelocatedSection(DataRefImpl Sec) const override; @@ -177,7 +183,7 @@ protected:    bool isDyldELFObject;  public: -  ELFObjectFile(std::unique_ptr<MemoryBuffer> Object, std::error_code &EC); +  ELFObjectFile(MemoryBufferRef Object, std::error_code &EC);    const Elf_Sym *getSymbol(DataRefImpl Symb) const; @@ -190,17 +196,20 @@ public:    section_iterator section_begin() const override;    section_iterator section_end() const override; -  library_iterator needed_library_begin() const override; -  library_iterator needed_library_end() const override; - -  std::error_code getRelocationAddend(DataRefImpl Rel, int64_t &Res) const; +  std::error_code getRelocationAddend(DataRefImpl Rel, +                                      int64_t &Res) const override;    std::error_code getSymbolVersion(SymbolRef Symb, StringRef &Version, -                                   bool &IsDefault) const; +                                   bool &IsDefault) const override;    uint8_t getBytesInAddress() const override;    StringRef getFileFormatName() const override;    unsigned getArch() const override; -  StringRef getLoadName() const override; +  StringRef getLoadName() const; + +  std::error_code getPlatformFlags(unsigned &Result) const override { +    Result = EF.getHeader()->e_flags; +    return object_error::success; +  }    const ELFFile<ELFT> *getELFFile() const { return &EF; } @@ -209,6 +218,11 @@ public:      return v->getType() == getELFType(ELFT::TargetEndianness == support::little,                                        ELFT::Is64Bits);    } + +  std::pair<symbol_iterator, symbol_iterator> +  getELFDynamicSymbolIterators() const override; + +  bool isRelocatableObject() const override;  };  // Use an alignment of 2 for the typedefs since that is the worst case for @@ -295,6 +309,13 @@ std::error_code ELFObjectFile<ELFT>::getSymbolSize(DataRefImpl Symb,  }  template <class ELFT> +std::error_code ELFObjectFile<ELFT>::getSymbolOther(DataRefImpl Symb, +                                                    uint8_t &Result) const { +  Result = toELFSymIter(Symb)->st_other; +  return object_error::success; +} + +template <class ELFT>  std::error_code  ELFObjectFile<ELFT>::getSymbolType(DataRefImpl Symb,                                     SymbolRef::Type &Result) const { @@ -387,17 +408,13 @@ std::error_code ELFObjectFile<ELFT>::getSectionName(DataRefImpl Sec,  }  template <class ELFT> -std::error_code ELFObjectFile<ELFT>::getSectionAddress(DataRefImpl Sec, -                                                       uint64_t &Result) const { -  Result = toELFShdrIter(Sec)->sh_addr; -  return object_error::success; +uint64_t ELFObjectFile<ELFT>::getSectionAddress(DataRefImpl Sec) const { +  return toELFShdrIter(Sec)->sh_addr;  }  template <class ELFT> -std::error_code ELFObjectFile<ELFT>::getSectionSize(DataRefImpl Sec, -                                                    uint64_t &Result) const { -  Result = toELFShdrIter(Sec)->sh_size; -  return object_error::success; +uint64_t ELFObjectFile<ELFT>::getSectionSize(DataRefImpl Sec) const { +  return toELFShdrIter(Sec)->sh_size;  }  template <class ELFT> @@ -410,79 +427,59 @@ ELFObjectFile<ELFT>::getSectionContents(DataRefImpl Sec,  }  template <class ELFT> -std::error_code -ELFObjectFile<ELFT>::getSectionAlignment(DataRefImpl Sec, -                                         uint64_t &Result) const { -  Result = toELFShdrIter(Sec)->sh_addralign; -  return object_error::success; +uint64_t ELFObjectFile<ELFT>::getSectionAlignment(DataRefImpl Sec) const { +  return toELFShdrIter(Sec)->sh_addralign;  }  template <class ELFT> -std::error_code ELFObjectFile<ELFT>::isSectionText(DataRefImpl Sec, -                                                   bool &Result) const { -  Result = toELFShdrIter(Sec)->sh_flags & ELF::SHF_EXECINSTR; -  return object_error::success; +bool ELFObjectFile<ELFT>::isSectionText(DataRefImpl Sec) const { +  return toELFShdrIter(Sec)->sh_flags & ELF::SHF_EXECINSTR;  }  template <class ELFT> -std::error_code ELFObjectFile<ELFT>::isSectionData(DataRefImpl Sec, -                                                   bool &Result) const { +bool ELFObjectFile<ELFT>::isSectionData(DataRefImpl Sec) const {    Elf_Shdr_Iter EShdr = toELFShdrIter(Sec); -  Result = EShdr->sh_flags & (ELF::SHF_ALLOC | ELF::SHF_WRITE) && -           EShdr->sh_type == ELF::SHT_PROGBITS; -  return object_error::success; +  return EShdr->sh_flags & (ELF::SHF_ALLOC | ELF::SHF_WRITE) && +         EShdr->sh_type == ELF::SHT_PROGBITS;  }  template <class ELFT> -std::error_code ELFObjectFile<ELFT>::isSectionBSS(DataRefImpl Sec, -                                                  bool &Result) const { +bool ELFObjectFile<ELFT>::isSectionBSS(DataRefImpl Sec) const {    Elf_Shdr_Iter EShdr = toELFShdrIter(Sec); -  Result = EShdr->sh_flags & (ELF::SHF_ALLOC | ELF::SHF_WRITE) && -           EShdr->sh_type == ELF::SHT_NOBITS; -  return object_error::success; +  return EShdr->sh_flags & (ELF::SHF_ALLOC | ELF::SHF_WRITE) && +         EShdr->sh_type == ELF::SHT_NOBITS;  }  template <class ELFT> -std::error_code -ELFObjectFile<ELFT>::isSectionRequiredForExecution(DataRefImpl Sec, -                                                   bool &Result) const { -  Result = toELFShdrIter(Sec)->sh_flags & ELF::SHF_ALLOC; -  return object_error::success; +bool ELFObjectFile<ELFT>::isSectionRequiredForExecution(DataRefImpl Sec) const { +  return toELFShdrIter(Sec)->sh_flags & ELF::SHF_ALLOC;  }  template <class ELFT> -std::error_code ELFObjectFile<ELFT>::isSectionVirtual(DataRefImpl Sec, -                                                      bool &Result) const { -  Result = toELFShdrIter(Sec)->sh_type == ELF::SHT_NOBITS; -  return object_error::success; +bool ELFObjectFile<ELFT>::isSectionVirtual(DataRefImpl Sec) const { +  return toELFShdrIter(Sec)->sh_type == ELF::SHT_NOBITS;  }  template <class ELFT> -std::error_code ELFObjectFile<ELFT>::isSectionZeroInit(DataRefImpl Sec, -                                                       bool &Result) const { -  Result = toELFShdrIter(Sec)->sh_type == ELF::SHT_NOBITS; -  return object_error::success; +bool ELFObjectFile<ELFT>::isSectionZeroInit(DataRefImpl Sec) const { +  return toELFShdrIter(Sec)->sh_type == ELF::SHT_NOBITS;  }  template <class ELFT> -std::error_code ELFObjectFile<ELFT>::isSectionReadOnlyData(DataRefImpl Sec, -                                                           bool &Result) const { +bool ELFObjectFile<ELFT>::isSectionReadOnlyData(DataRefImpl Sec) const {    Elf_Shdr_Iter EShdr = toELFShdrIter(Sec); -  Result = !(EShdr->sh_flags & (ELF::SHF_WRITE | ELF::SHF_EXECINSTR)); -  return object_error::success; +  return !(EShdr->sh_flags & (ELF::SHF_WRITE | ELF::SHF_EXECINSTR));  }  template <class ELFT> -std::error_code ELFObjectFile<ELFT>::sectionContainsSymbol(DataRefImpl Sec, -                                                           DataRefImpl Symb, -                                                           bool &Result) const { +bool ELFObjectFile<ELFT>::sectionContainsSymbol(DataRefImpl Sec, +                                                DataRefImpl Symb) const {    Elf_Sym_Iter ESym = toELFSymIter(Symb);    uintX_t Index = ESym->st_shndx;    bool Reserved = Index >= ELF::SHN_LORESERVE && Index <= ELF::SHN_HIRESERVE; -  Result = !Reserved && (&*toELFShdrIter(Sec) == EF.getSection(ESym->st_shndx)); -  return object_error::success; +  return !Reserved && (&*toELFShdrIter(Sec) == EF.getSection(ESym->st_shndx));  }  template <class ELFT> @@ -741,6 +738,7 @@ std::error_code ELFObjectFile<ELFT>::getRelocationValueString(      Result.append(fmtbuf.begin(), fmtbuf.end());      break;    } +  case ELF::EM_386:    case ELF::EM_ARM:    case ELF::EM_HEXAGON:    case ELF::EM_MIPS: @@ -773,13 +771,13 @@ ELFObjectFile<ELFT>::getRela(DataRefImpl Rela) const {  }  template <class ELFT> -ELFObjectFile<ELFT>::ELFObjectFile(std::unique_ptr<MemoryBuffer> Object, -                                   std::error_code &EC) -    : ObjectFile(getELFType(static_cast<endianness>(ELFT::TargetEndianness) == -                                support::little, -                            ELFT::Is64Bits), -                 std::move(Object)), -      EF(Data->getBuffer(), EC) {} +ELFObjectFile<ELFT>::ELFObjectFile(MemoryBufferRef Object, std::error_code &EC) +    : ELFObjectFileBase( +          getELFType(static_cast<endianness>(ELFT::TargetEndianness) == +                         support::little, +                     ELFT::Is64Bits), +          Object), +      EF(Data.getBuffer(), EC) {}  template <class ELFT>  basic_symbol_iterator ELFObjectFile<ELFT>::symbol_begin_impl() const { @@ -825,50 +823,13 @@ StringRef ELFObjectFile<ELFT>::getLoadName() const {  }  template <class ELFT> -library_iterator ELFObjectFile<ELFT>::needed_library_begin() const { -  Elf_Dyn_Iter DI = EF.begin_dynamic_table(); -  Elf_Dyn_Iter DE = EF.end_dynamic_table(); - -  while (DI != DE && DI->getTag() != ELF::DT_SONAME) -    ++DI; - -  return library_iterator(LibraryRef(toDRI(DI), this)); -} - -template <class ELFT> -std::error_code ELFObjectFile<ELFT>::getLibraryNext(DataRefImpl Data, -                                                    LibraryRef &Result) const { -  Elf_Dyn_Iter DI = toELFDynIter(Data); -  Elf_Dyn_Iter DE = EF.end_dynamic_table(); - -  // Skip to the next DT_NEEDED entry. -  do -    ++DI; -  while (DI != DE && DI->getTag() != ELF::DT_NEEDED); - -  Result = LibraryRef(toDRI(DI), this); -  return object_error::success; -} - -template <class ELFT> -std::error_code ELFObjectFile<ELFT>::getLibraryPath(DataRefImpl Data, -                                                    StringRef &Res) const { -  Res = EF.getDynamicString(toELFDynIter(Data)->getVal()); -  return object_error::success; -} - -template <class ELFT> -library_iterator ELFObjectFile<ELFT>::needed_library_end() const { -  return library_iterator(LibraryRef(toDRI(EF.end_dynamic_table()), this)); -} - -template <class ELFT>  uint8_t ELFObjectFile<ELFT>::getBytesInAddress() const {    return ELFT::Is64Bits ? 8 : 4;  }  template <class ELFT>  StringRef ELFObjectFile<ELFT>::getFileFormatName() const { +  bool IsLittleEndian = ELFT::TargetEndianness == support::little;    switch (EF.getHeader()->e_ident[ELF::EI_CLASS]) {    case ELF::ELFCLASS32:      switch (EF.getHeader()->e_machine) { @@ -877,7 +838,7 @@ StringRef ELFObjectFile<ELFT>::getFileFormatName() const {      case ELF::EM_X86_64:        return "ELF32-x86-64";      case ELF::EM_ARM: -      return "ELF32-arm"; +      return (IsLittleEndian ? "ELF32-arm-little" : "ELF32-arm-big");      case ELF::EM_HEXAGON:        return "ELF32-hexagon";      case ELF::EM_MIPS: @@ -897,7 +858,7 @@ StringRef ELFObjectFile<ELFT>::getFileFormatName() const {      case ELF::EM_X86_64:        return "ELF64-x86-64";      case ELF::EM_AARCH64: -      return "ELF64-aarch64"; +      return (IsLittleEndian ? "ELF64-aarch64-little" : "ELF64-aarch64-big");      case ELF::EM_PPC64:        return "ELF64-ppc64";      case ELF::EM_S390: @@ -938,6 +899,8 @@ unsigned ELFObjectFile<ELFT>::getArch() const {      default:        report_fatal_error("Invalid ELFCLASS!");      } +  case ELF::EM_PPC: +    return Triple::ppc;    case ELF::EM_PPC64:      return IsLittleEndian ? Triple::ppc64le : Triple::ppc64;    case ELF::EM_S390: @@ -954,73 +917,34 @@ unsigned ELFObjectFile<ELFT>::getArch() const {    }  } -/// FIXME: Maybe we should have a base ElfObjectFile that is not a template -/// and make these member functions? +template <class ELFT> +std::pair<symbol_iterator, symbol_iterator> +ELFObjectFile<ELFT>::getELFDynamicSymbolIterators() const { +  return std::make_pair(dynamic_symbol_begin(), dynamic_symbol_end()); +} + +template <class ELFT> bool ELFObjectFile<ELFT>::isRelocatableObject() const { +  return EF.getHeader()->e_type == ELF::ET_REL; +} +  inline std::error_code getELFRelocationAddend(const RelocationRef R,                                                int64_t &Addend) {    const ObjectFile *Obj = R.getObjectFile();    DataRefImpl DRI = R.getRawDataRefImpl(); -  // Little-endian 32-bit -  if (const ELF32LEObjectFile *ELFObj = dyn_cast<ELF32LEObjectFile>(Obj)) -    return ELFObj->getRelocationAddend(DRI, Addend); - -  // Big-endian 32-bit -  if (const ELF32BEObjectFile *ELFObj = dyn_cast<ELF32BEObjectFile>(Obj)) -    return ELFObj->getRelocationAddend(DRI, Addend); - -  // Little-endian 64-bit -  if (const ELF64LEObjectFile *ELFObj = dyn_cast<ELF64LEObjectFile>(Obj)) -    return ELFObj->getRelocationAddend(DRI, Addend); - -  // Big-endian 64-bit -  if (const ELF64BEObjectFile *ELFObj = dyn_cast<ELF64BEObjectFile>(Obj)) -    return ELFObj->getRelocationAddend(DRI, Addend); - -  llvm_unreachable("Object passed to getELFRelocationAddend() is not ELF"); +  return cast<ELFObjectFileBase>(Obj)->getRelocationAddend(DRI, Addend);  }  inline std::pair<symbol_iterator, symbol_iterator> -getELFDynamicSymbolIterators(SymbolicFile *Obj) { -  if (const ELF32LEObjectFile *ELF = dyn_cast<ELF32LEObjectFile>(Obj)) -    return std::make_pair(ELF->dynamic_symbol_begin(), -                          ELF->dynamic_symbol_end()); -  if (const ELF64LEObjectFile *ELF = dyn_cast<ELF64LEObjectFile>(Obj)) -    return std::make_pair(ELF->dynamic_symbol_begin(), -                          ELF->dynamic_symbol_end()); -  if (const ELF32BEObjectFile *ELF = dyn_cast<ELF32BEObjectFile>(Obj)) -    return std::make_pair(ELF->dynamic_symbol_begin(), -                          ELF->dynamic_symbol_end()); -  if (const ELF64BEObjectFile *ELF = cast<ELF64BEObjectFile>(Obj)) -    return std::make_pair(ELF->dynamic_symbol_begin(), -                          ELF->dynamic_symbol_end()); - -  llvm_unreachable( -      "Object passed to getELFDynamicSymbolIterators() is not ELF"); +getELFDynamicSymbolIterators(const SymbolicFile *Obj) { +  return cast<ELFObjectFileBase>(Obj)->getELFDynamicSymbolIterators();  } -/// This is a generic interface for retrieving GNU symbol version -/// information from an ELFObjectFile.  inline std::error_code GetELFSymbolVersion(const ObjectFile *Obj,                                             const SymbolRef &Sym,                                             StringRef &Version,                                             bool &IsDefault) { -  // Little-endian 32-bit -  if (const ELF32LEObjectFile *ELFObj = dyn_cast<ELF32LEObjectFile>(Obj)) -    return ELFObj->getSymbolVersion(Sym, Version, IsDefault); - -  // Big-endian 32-bit -  if (const ELF32BEObjectFile *ELFObj = dyn_cast<ELF32BEObjectFile>(Obj)) -    return ELFObj->getSymbolVersion(Sym, Version, IsDefault); - -  // Little-endian 64-bit -  if (const ELF64LEObjectFile *ELFObj = dyn_cast<ELF64LEObjectFile>(Obj)) -    return ELFObj->getSymbolVersion(Sym, Version, IsDefault); - -  // Big-endian 64-bit -  if (const ELF64BEObjectFile *ELFObj = dyn_cast<ELF64BEObjectFile>(Obj)) -    return ELFObj->getSymbolVersion(Sym, Version, IsDefault); - -  llvm_unreachable("Object passed to GetELFSymbolVersion() is not ELF"); +  return cast<ELFObjectFileBase>(Obj) +      ->getSymbolVersion(Sym, Version, IsDefault);  }  }  } diff --git a/include/llvm/Object/ELFTypes.h b/include/llvm/Object/ELFTypes.h index 84b6031..4bc0c7c 100644 --- a/include/llvm/Object/ELFTypes.h +++ b/include/llvm/Object/ELFTypes.h @@ -7,8 +7,8 @@  //  //===----------------------------------------------------------------------===// -#ifndef LLVM_OBJECT_ELF_TYPES_H -#define LLVM_OBJECT_ELF_TYPES_H +#ifndef LLVM_OBJECT_ELFTYPES_H +#define LLVM_OBJECT_ELFTYPES_H  #include "llvm/Support/AlignOf.h"  #include "llvm/Support/DataTypes.h" @@ -176,6 +176,7 @@ struct Elf_Sym_Base<ELFType<TargetEndianness, MaxAlign, true> > {  template <class ELFT>  struct Elf_Sym_Impl : Elf_Sym_Base<ELFT> {    using Elf_Sym_Base<ELFT>::st_info; +  using Elf_Sym_Base<ELFT>::st_other;    // These accessors and mutators correspond to the ELF32_ST_BIND,    // ELF32_ST_TYPE, and ELF32_ST_INFO macros defined in the ELF specification: @@ -186,6 +187,9 @@ struct Elf_Sym_Impl : Elf_Sym_Base<ELFT> {    void setBindingAndType(unsigned char b, unsigned char t) {      st_info = (b << 4) + (t & 0x0f);    } + +  /// Access to the STV_xxx flag stored in the first two bits of st_other. +  unsigned char getVisibility() const { return st_other & 0x3; }  };  /// Elf_Versym: This is the structure of entries in the SHT_GNU_versym section diff --git a/include/llvm/Object/ELFYAML.h b/include/llvm/Object/ELFYAML.h index fc8cc95..687611d 100644 --- a/include/llvm/Object/ELFYAML.h +++ b/include/llvm/Object/ELFYAML.h @@ -45,6 +45,7 @@ LLVM_YAML_STRONG_TYPEDEF(uint8_t, ELF_REL)  LLVM_YAML_STRONG_TYPEDEF(uint64_t, ELF_SHF)  LLVM_YAML_STRONG_TYPEDEF(uint8_t, ELF_STT)  LLVM_YAML_STRONG_TYPEDEF(uint8_t, ELF_STV) +LLVM_YAML_STRONG_TYPEDEF(uint8_t, ELF_STO)  // For now, hardcode 64 bits everywhere that 32 or 64 would be needed  // since 64-bit can hold 32-bit values too. @@ -63,7 +64,7 @@ struct Symbol {    StringRef Section;    llvm::yaml::Hex64 Value;    llvm::yaml::Hex64 Size; -  ELF_STV Visibility; +  uint8_t Other;  };  struct LocalGlobalWeakSymbols {    std::vector<Symbol> Local; @@ -175,6 +176,11 @@ struct ScalarEnumerationTraits<ELFYAML::ELF_STV> {  };  template <> +struct ScalarBitSetTraits<ELFYAML::ELF_STO> { +  static void bitset(IO &IO, ELFYAML::ELF_STO &Value); +}; + +template <>  struct ScalarEnumerationTraits<ELFYAML::ELF_REL> {    static void enumeration(IO &IO, ELFYAML::ELF_REL &Value);  }; diff --git a/include/llvm/Object/Error.h b/include/llvm/Object/Error.h index 701da12..90c2bd7 100644 --- a/include/llvm/Object/Error.h +++ b/include/llvm/Object/Error.h @@ -26,7 +26,8 @@ enum class object_error {    arch_not_found,    invalid_file_type,    parse_failed, -  unexpected_eof +  unexpected_eof, +  bitcode_section_not_found,  };  inline std::error_code make_error_code(object_error e) { diff --git a/include/llvm/Object/IRObjectFile.h b/include/llvm/Object/IRObjectFile.h index b33cc26..b650d5d 100644 --- a/include/llvm/Object/IRObjectFile.h +++ b/include/llvm/Object/IRObjectFile.h @@ -11,8 +11,8 @@  //  //===----------------------------------------------------------------------===// -#ifndef LLVM_OBJECT_IR_OBJECT_FILE_H -#define LLVM_OBJECT_IR_OBJECT_FILE_H +#ifndef LLVM_OBJECT_IROBJECTFILE_H +#define LLVM_OBJECT_IROBJECTFILE_H  #include "llvm/Object/SymbolicFile.h" @@ -22,13 +22,15 @@ class Module;  class GlobalValue;  namespace object { +class ObjectFile; +  class IRObjectFile : public SymbolicFile {    std::unique_ptr<Module> M;    std::unique_ptr<Mangler> Mang;    std::vector<std::pair<std::string, uint32_t>> AsmSymbols;  public: -  IRObjectFile(std::unique_ptr<MemoryBuffer> Object, std::unique_ptr<Module> M); +  IRObjectFile(MemoryBufferRef Object, std::unique_ptr<Module> M);    ~IRObjectFile();    void moveSymbolNext(DataRefImpl &Symb) const override;    std::error_code printSymbolName(raw_ostream &OS, @@ -49,9 +51,18 @@ public:      return v->isIR();    } -  static ErrorOr<IRObjectFile *> -  createIRObjectFile(std::unique_ptr<MemoryBuffer> Object, -                     LLVMContext &Context); +  /// \brief Finds and returns bitcode embedded in the given object file, or an +  /// error code if not found. +  static ErrorOr<MemoryBufferRef> findBitcodeInObject(const ObjectFile &Obj); + +  /// \brief Finds and returns bitcode in the given memory buffer (which may +  /// be either a bitcode file or a native object file with embedded bitcode), +  /// or an error code if not found. +  static ErrorOr<MemoryBufferRef> +  findBitcodeInMemBuffer(MemoryBufferRef Object); + +  static ErrorOr<std::unique_ptr<IRObjectFile>> +  createIRObjectFile(MemoryBufferRef Object, LLVMContext &Context);  };  }  } diff --git a/include/llvm/Object/MachO.h b/include/llvm/Object/MachO.h index e93ebb8..768cda6 100644 --- a/include/llvm/Object/MachO.h +++ b/include/llvm/Object/MachO.h @@ -49,6 +49,141 @@ public:  };  typedef content_iterator<DiceRef> dice_iterator; +/// ExportEntry encapsulates the current-state-of-the-walk used when doing a +/// non-recursive walk of the trie data structure.  This allows you to iterate +/// across all exported symbols using: +///      for (const llvm::object::ExportEntry &AnExport : Obj->exports()) { +///      } +class ExportEntry { +public: +  ExportEntry(ArrayRef<uint8_t> Trie); + +  StringRef name() const; +  uint64_t flags() const; +  uint64_t address() const; +  uint64_t other() const; +  StringRef otherName() const; +  uint32_t nodeOffset() const; + +  bool operator==(const ExportEntry &) const; + +  void moveNext(); + +private: +  friend class MachOObjectFile; +  void moveToFirst(); +  void moveToEnd(); +  uint64_t readULEB128(const uint8_t *&p); +  void pushDownUntilBottom(); +  void pushNode(uint64_t Offset); + +  // Represents a node in the mach-o exports trie. +  struct NodeState { +    NodeState(const uint8_t *Ptr); +    const uint8_t *Start; +    const uint8_t *Current; +    uint64_t Flags; +    uint64_t Address; +    uint64_t Other; +    const char *ImportName; +    unsigned ChildCount; +    unsigned NextChildIndex; +    unsigned ParentStringLength; +    bool IsExportNode; +  }; + +  ArrayRef<uint8_t> Trie; +  SmallString<256> CumulativeString; +  SmallVector<NodeState, 16> Stack; +  bool Malformed; +  bool Done; +}; +typedef content_iterator<ExportEntry> export_iterator; + +/// MachORebaseEntry encapsulates the current state in the decompression of    +/// rebasing opcodes. This allows you to iterate through the compressed table of +/// rebasing using: +///    for (const llvm::object::MachORebaseEntry &Entry : Obj->rebaseTable()) { +///    } +class MachORebaseEntry { +public: +  MachORebaseEntry(ArrayRef<uint8_t> opcodes, bool is64Bit); + +  uint32_t segmentIndex() const; +  uint64_t segmentOffset() const; +  StringRef typeName() const; + +  bool operator==(const MachORebaseEntry &) const; + +  void moveNext(); +   +private: +  friend class MachOObjectFile; +  void moveToFirst(); +  void moveToEnd(); +  uint64_t readULEB128(); + +  ArrayRef<uint8_t> Opcodes; +  const uint8_t *Ptr; +  uint64_t SegmentOffset; +  uint32_t SegmentIndex; +  uint64_t RemainingLoopCount; +  uint64_t AdvanceAmount; +  uint8_t  RebaseType; +  uint8_t  PointerSize; +  bool     Malformed; +  bool     Done; +}; +typedef content_iterator<MachORebaseEntry> rebase_iterator; + +/// MachOBindEntry encapsulates the current state in the decompression of +/// binding opcodes. This allows you to iterate through the compressed table of +/// bindings using: +///    for (const llvm::object::MachOBindEntry &Entry : Obj->bindTable()) { +///    } +class MachOBindEntry { +public: +  enum class Kind { Regular, Lazy, Weak }; + +  MachOBindEntry(ArrayRef<uint8_t> Opcodes, bool is64Bit, MachOBindEntry::Kind); + +  uint32_t segmentIndex() const; +  uint64_t segmentOffset() const; +  StringRef typeName() const; +  StringRef symbolName() const; +  uint32_t flags() const; +  int64_t addend() const; +  int ordinal() const; + +  bool operator==(const MachOBindEntry &) const; + +  void moveNext(); + +private: +  friend class MachOObjectFile; +  void moveToFirst(); +  void moveToEnd(); +  uint64_t readULEB128(); +  int64_t readSLEB128(); + +  ArrayRef<uint8_t> Opcodes; +  const uint8_t *Ptr; +  uint64_t SegmentOffset; +  uint32_t SegmentIndex; +  StringRef SymbolName; +  int      Ordinal; +  uint32_t Flags; +  int64_t  Addend; +  uint64_t RemainingLoopCount; +  uint64_t AdvanceAmount; +  uint8_t  BindType; +  uint8_t  PointerSize; +  Kind     TableKind; +  bool     Malformed; +  bool     Done; +}; +typedef content_iterator<MachOBindEntry> bind_iterator; +  class MachOObjectFile : public ObjectFile {  public:    struct LoadCommandInfo { @@ -56,8 +191,8 @@ public:      MachO::load_command C; // The command itself.    }; -  MachOObjectFile(std::unique_ptr<MemoryBuffer> Object, bool IsLittleEndian, -                  bool Is64Bits, std::error_code &EC); +  MachOObjectFile(MemoryBufferRef Object, bool IsLittleEndian, bool Is64Bits, +                  std::error_code &EC);    void moveSymbolNext(DataRefImpl &Symb) const override;    std::error_code getSymbolName(DataRefImpl Symb, @@ -80,24 +215,19 @@ public:    void moveSectionNext(DataRefImpl &Sec) const override;    std::error_code getSectionName(DataRefImpl Sec,                                   StringRef &Res) const override; -  std::error_code getSectionAddress(DataRefImpl Sec, -                                    uint64_t &Res) const override; -  std::error_code getSectionSize(DataRefImpl Sec, uint64_t &Res) const override; +  uint64_t getSectionAddress(DataRefImpl Sec) const override; +  uint64_t getSectionSize(DataRefImpl Sec) const override;    std::error_code getSectionContents(DataRefImpl Sec,                                       StringRef &Res) const override; -  std::error_code getSectionAlignment(DataRefImpl Sec, -                                      uint64_t &Res) const override; -  std::error_code isSectionText(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionData(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionBSS(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionRequiredForExecution(DataRefImpl Sec, -                                                bool &Res) const override; -  std::error_code isSectionVirtual(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionZeroInit(DataRefImpl Sec, bool &Res) const override; -  std::error_code isSectionReadOnlyData(DataRefImpl Sec, -                                        bool &Res) const override; -  std::error_code sectionContainsSymbol(DataRefImpl Sec, DataRefImpl Symb, -                                        bool &Result) const override; +  uint64_t getSectionAlignment(DataRefImpl Sec) const override; +  bool isSectionText(DataRefImpl Sec) const override; +  bool isSectionData(DataRefImpl Sec) const override; +  bool isSectionBSS(DataRefImpl Sec) const override; +  bool isSectionRequiredForExecution(DataRefImpl Sec) const override; +  bool isSectionVirtual(DataRefImpl Sec) const override; +  bool isSectionZeroInit(DataRefImpl Sec) const override; +  bool isSectionReadOnlyData(DataRefImpl Sec) const override; +  bool sectionContainsSymbol(DataRefImpl Sec, DataRefImpl Symb) const override;    relocation_iterator section_rel_begin(DataRefImpl Sec) const override;    relocation_iterator section_rel_end(DataRefImpl Sec) const override; @@ -118,13 +248,8 @@ public:    std::error_code getRelocationHidden(DataRefImpl Rel,                                        bool &Result) const override; -  std::error_code getLibraryNext(DataRefImpl LibData, -                                 LibraryRef &Res) const override; -  std::error_code getLibraryPath(DataRefImpl LibData, -                                 StringRef &Res) const override; -    // MachO specific. -  std::error_code getLibraryShortNameByIndex(unsigned Index, StringRef &Res); +  std::error_code getLibraryShortNameByIndex(unsigned Index, StringRef &) const;    // TODO: Would be useful to have an iterator based version    // of the load command interface too. @@ -138,21 +263,45 @@ public:    section_iterator section_begin() const override;    section_iterator section_end() const override; -  library_iterator needed_library_begin() const override; -  library_iterator needed_library_end() const override; -    uint8_t getBytesInAddress() const override;    StringRef getFileFormatName() const override;    unsigned getArch() const override; - -  StringRef getLoadName() const override; +  Triple getArch(const char **McpuDefault, Triple *ThumbTriple) const;    relocation_iterator section_rel_begin(unsigned Index) const;    relocation_iterator section_rel_end(unsigned Index) const;    dice_iterator begin_dices() const;    dice_iterator end_dices() const; +   +  /// For use iterating over all exported symbols. +  iterator_range<export_iterator> exports() const; +   +  /// For use examining a trie not in a MachOObjectFile. +  static iterator_range<export_iterator> exports(ArrayRef<uint8_t> Trie); + +  /// For use iterating over all rebase table entries. +  iterator_range<rebase_iterator> rebaseTable() const; + +  /// For use examining rebase opcodes not in a MachOObjectFile. +  static iterator_range<rebase_iterator> rebaseTable(ArrayRef<uint8_t> Opcodes, +                                                     bool is64); + +  /// For use iterating over all bind table entries. +  iterator_range<bind_iterator> bindTable() const; + +  /// For use iterating over all lazy bind table entries. +  iterator_range<bind_iterator> lazyBindTable() const; + +  /// For use iterating over all lazy bind table entries. +  iterator_range<bind_iterator> weakBindTable() const; + +  /// For use examining bind opcodes not in a MachOObjectFile. +  static iterator_range<bind_iterator> bindTable(ArrayRef<uint8_t> Opcodes, +                                                 bool is64, +                                                 MachOBindEntry::Kind); +    // In a MachO file, sections have a segment name. This is used in the .o    // files. They have a single segment, but this field specifies which segment @@ -173,6 +322,8 @@ public:                                      const MachO::any_relocation_info &RE) const;    uint32_t getScatteredRelocationValue(                                      const MachO::any_relocation_info &RE) const; +  uint32_t getScatteredRelocationType( +                                    const MachO::any_relocation_info &RE) const;    unsigned getAnyRelocationAddress(const MachO::any_relocation_info &RE) const;    unsigned getAnyRelocationPCRel(const MachO::any_relocation_info &RE) const;    unsigned getAnyRelocationLength(const MachO::any_relocation_info &RE) const; @@ -203,6 +354,16 @@ public:    getVersionMinLoadCommand(const LoadCommandInfo &L) const;    MachO::dylib_command    getDylibIDLoadCommand(const LoadCommandInfo &L) const; +  MachO::dyld_info_command +  getDyldInfoLoadCommand(const LoadCommandInfo &L) const; +  MachO::dylinker_command +  getDylinkerCommand(const LoadCommandInfo &L) const; +  MachO::uuid_command +  getUuidCommand(const LoadCommandInfo &L) const; +  MachO::source_version_command +  getSourceVersionCommand(const LoadCommandInfo &L) const; +  MachO::entry_point_command +  getEntryPointCommand(const LoadCommandInfo &L) const;    MachO::any_relocation_info getRelocation(DataRefImpl Rel) const;    MachO::data_in_code_entry getDice(DataRefImpl Rel) const; @@ -216,6 +377,12 @@ public:    MachO::symtab_command getSymtabLoadCommand() const;    MachO::dysymtab_command getDysymtabLoadCommand() const;    MachO::linkedit_data_command getDataInCodeLoadCommand() const; +  ArrayRef<uint8_t> getDyldInfoRebaseOpcodes() const; +  ArrayRef<uint8_t> getDyldInfoBindOpcodes() const; +  ArrayRef<uint8_t> getDyldInfoWeakBindOpcodes() const; +  ArrayRef<uint8_t> getDyldInfoLazyBindOpcodes() const; +  ArrayRef<uint8_t> getDyldInfoExportsTrie() const; +  ArrayRef<uint8_t> getUuid() const;    StringRef getStringTableData() const;    bool is64Bit() const; @@ -225,26 +392,36 @@ public:                                           StringRef &Suffix);    static Triple::ArchType getArch(uint32_t CPUType); -  static Triple getArch(uint32_t CPUType, uint32_t CPUSubType); -  static Triple getArch(StringRef ArchFlag); +  static Triple getArch(uint32_t CPUType, uint32_t CPUSubType, +                        const char **McpuDefault = nullptr); +  static Triple getThumbArch(uint32_t CPUType, uint32_t CPUSubType, +                             const char **McpuDefault = nullptr); +  static Triple getArch(uint32_t CPUType, uint32_t CPUSubType, +                        const char **McpuDefault, Triple *ThumbTriple); +  static bool isValidArch(StringRef ArchFlag);    static Triple getHostArch(); +  bool isRelocatableObject() const override; + +  bool hasPageZeroSegment() const { return HasPageZeroSegment; } +    static bool classof(const Binary *v) {      return v->isMachO();    } -  const char *getSectionPointer(DataRefImpl Rel) const; -  private: -  typedef SmallVector<const char *, 1> SectionList; +  typedef SmallVector<const char*, 1> SectionList;    SectionList Sections; -  typedef SmallVector<const char *, 1> LibraryList; +  typedef SmallVector<const char*, 1> LibraryList;    LibraryList Libraries;    typedef SmallVector<StringRef, 1> LibraryShortName; -  LibraryShortName LibrariesShortNames; +  mutable LibraryShortName LibrariesShortNames;    const char *SymtabLoadCmd;    const char *DysymtabLoadCmd;    const char *DataInCodeLoadCmd; +  const char *DyldInfoLoadCmd; +  const char *UuidLoadCmd; +  bool HasPageZeroSegment;  };  /// DiceRef diff --git a/include/llvm/Object/MachOUniversal.h b/include/llvm/Object/MachOUniversal.h index e6677f5..46cf3fb 100644 --- a/include/llvm/Object/MachOUniversal.h +++ b/include/llvm/Object/MachOUniversal.h @@ -25,8 +25,6 @@  namespace llvm {  namespace object { -class ObjectFile; -  class MachOUniversalBinary : public Binary {    virtual void anchor(); @@ -58,7 +56,7 @@ public:        return T.getArchName();      } -    ErrorOr<std::unique_ptr<ObjectFile>> getAsObjectFile() const; +    ErrorOr<std::unique_ptr<MachOObjectFile>> getAsObjectFile() const;      std::error_code getAsArchive(std::unique_ptr<Archive> &Result) const;    }; @@ -84,10 +82,9 @@ public:      }    }; -  MachOUniversalBinary(std::unique_ptr<MemoryBuffer> Source, -                       std::error_code &ec); -  static ErrorOr<MachOUniversalBinary *> -  create(std::unique_ptr<MemoryBuffer> Source); +  MachOUniversalBinary(MemoryBufferRef Souce, std::error_code &EC); +  static ErrorOr<std::unique_ptr<MachOUniversalBinary>> +  create(MemoryBufferRef Source);    object_iterator begin_objects() const {      return ObjectForArch(this, 0); @@ -103,7 +100,7 @@ public:      return V->isMachOUniversalBinary();    } -  ErrorOr<std::unique_ptr<ObjectFile>> +  ErrorOr<std::unique_ptr<MachOObjectFile>>    getObjectForArch(Triple::ArchType Arch) const;  }; diff --git a/include/llvm/Object/ObjectFile.h b/include/llvm/Object/ObjectFile.h index 646abf8..68b873a 100644 --- a/include/llvm/Object/ObjectFile.h +++ b/include/llvm/Object/ObjectFile.h @@ -27,6 +27,8 @@ namespace llvm {  namespace object {  class ObjectFile; +class COFFObjectFile; +class MachOObjectFile;  class SymbolRef;  class symbol_iterator; @@ -93,23 +95,22 @@ public:    void moveNext();    std::error_code getName(StringRef &Result) const; -  std::error_code getAddress(uint64_t &Result) const; -  std::error_code getSize(uint64_t &Result) const; +  uint64_t getAddress() const; +  uint64_t getSize() const;    std::error_code getContents(StringRef &Result) const;    /// @brief Get the alignment of this section as the actual value (not log 2). -  std::error_code getAlignment(uint64_t &Result) const; +  uint64_t getAlignment() const; -  // FIXME: Move to the normalization layer when it's created. -  std::error_code isText(bool &Result) const; -  std::error_code isData(bool &Result) const; -  std::error_code isBSS(bool &Result) const; -  std::error_code isRequiredForExecution(bool &Result) const; -  std::error_code isVirtual(bool &Result) const; -  std::error_code isZeroInit(bool &Result) const; -  std::error_code isReadOnlyData(bool &Result) const; +  bool isText() const; +  bool isData() const; +  bool isBSS() const; +  bool isRequiredForExecution() const; +  bool isVirtual() const; +  bool isZeroInit() const; +  bool isReadOnlyData() const; -  std::error_code containsSymbol(SymbolRef S, bool &Result) const; +  bool containsSymbol(SymbolRef S) const;    relocation_iterator relocation_begin() const;    relocation_iterator relocation_end() const; @@ -149,6 +150,7 @@ public:    std::error_code getAlignment(uint32_t &Result) const;    std::error_code getSize(uint64_t &Result) const;    std::error_code getType(SymbolRef::Type &Result) const; +  std::error_code getOther(uint8_t &Result) const;    /// @brief Get section this symbol is defined in reference to. Result is    /// end_sections() if it is undefined or is an absolute symbol. @@ -175,30 +177,6 @@ public:    }  }; -/// LibraryRef - This is a value type class that represents a single library in -/// the list of libraries needed by a shared or dynamic object. -class LibraryRef { -  friend class SectionRef; -  DataRefImpl LibraryPimpl; -  const ObjectFile *OwningObject; - -public: -  LibraryRef() : OwningObject(nullptr) { } - -  LibraryRef(DataRefImpl LibraryP, const ObjectFile *Owner); - -  bool operator==(const LibraryRef &Other) const; -  bool operator<(const LibraryRef &Other) const; - -  std::error_code getNext(LibraryRef &Result) const; - -  // Get the path to this library, as stored in the object file. -  std::error_code getPath(StringRef &Result) const; - -  DataRefImpl getRawDataRefImpl() const; -}; -typedef content_iterator<LibraryRef> library_iterator; -  /// ObjectFile - This class is the base class for all object file types.  /// Concrete instances of this object are created by createObjectFile, which  /// figures out which type to create. @@ -208,10 +186,10 @@ class ObjectFile : public SymbolicFile {    ObjectFile(const ObjectFile &other) LLVM_DELETED_FUNCTION;  protected: -  ObjectFile(unsigned int Type, std::unique_ptr<MemoryBuffer> Source); +  ObjectFile(unsigned int Type, MemoryBufferRef Source);    const uint8_t *base() const { -    return reinterpret_cast<const uint8_t *>(Data->getBufferStart()); +    return reinterpret_cast<const uint8_t *>(Data.getBufferStart());    }    // These functions are for SymbolRef to call internally. The main goal of @@ -237,35 +215,31 @@ protected:                                          SymbolRef::Type &Res) const = 0;    virtual std::error_code getSymbolSection(DataRefImpl Symb,                                             section_iterator &Res) const = 0; +  virtual std::error_code getSymbolOther(DataRefImpl Symb, +                                         uint8_t &Res) const { +    return object_error::invalid_file_type; +  }    // Same as above for SectionRef.    friend class SectionRef;    virtual void moveSectionNext(DataRefImpl &Sec) const = 0;    virtual std::error_code getSectionName(DataRefImpl Sec,                                           StringRef &Res) const = 0; -  virtual std::error_code getSectionAddress(DataRefImpl Sec, -                                            uint64_t &Res) const = 0; -  virtual std::error_code getSectionSize(DataRefImpl Sec, -                                         uint64_t &Res) const = 0; +  virtual uint64_t getSectionAddress(DataRefImpl Sec) const = 0; +  virtual uint64_t getSectionSize(DataRefImpl Sec) const = 0;    virtual std::error_code getSectionContents(DataRefImpl Sec,                                               StringRef &Res) const = 0; -  virtual std::error_code getSectionAlignment(DataRefImpl Sec, -                                              uint64_t &Res) const = 0; -  virtual std::error_code isSectionText(DataRefImpl Sec, bool &Res) const = 0; -  virtual std::error_code isSectionData(DataRefImpl Sec, bool &Res) const = 0; -  virtual std::error_code isSectionBSS(DataRefImpl Sec, bool &Res) const = 0; -  virtual std::error_code isSectionRequiredForExecution(DataRefImpl Sec, -                                                        bool &Res) const = 0; +  virtual uint64_t getSectionAlignment(DataRefImpl Sec) const = 0; +  virtual bool isSectionText(DataRefImpl Sec) const = 0; +  virtual bool isSectionData(DataRefImpl Sec) const = 0; +  virtual bool isSectionBSS(DataRefImpl Sec) const = 0; +  virtual bool isSectionRequiredForExecution(DataRefImpl Sec) const = 0;    // A section is 'virtual' if its contents aren't present in the object image. -  virtual std::error_code isSectionVirtual(DataRefImpl Sec, -                                           bool &Res) const = 0; -  virtual std::error_code isSectionZeroInit(DataRefImpl Sec, -                                            bool &Res) const = 0; -  virtual std::error_code isSectionReadOnlyData(DataRefImpl Sec, -                                                bool &Res) const = 0; -  virtual std::error_code sectionContainsSymbol(DataRefImpl Sec, -                                                DataRefImpl Symb, -                                                bool &Result) const = 0; +  virtual bool isSectionVirtual(DataRefImpl Sec) const = 0; +  virtual bool isSectionZeroInit(DataRefImpl Sec) const = 0; +  virtual bool isSectionReadOnlyData(DataRefImpl Sec) const = 0; +  virtual bool sectionContainsSymbol(DataRefImpl Sec, +                                     DataRefImpl Symb) const = 0;    virtual relocation_iterator section_rel_begin(DataRefImpl Sec) const = 0;    virtual relocation_iterator section_rel_end(DataRefImpl Sec) const = 0;    virtual section_iterator getRelocatedSection(DataRefImpl Sec) const; @@ -292,13 +266,6 @@ protected:      return object_error::success;    } -  // Same for LibraryRef -  friend class LibraryRef; -  virtual std::error_code getLibraryNext(DataRefImpl Lib, -                                         LibraryRef &Res) const = 0; -  virtual std::error_code getLibraryPath(DataRefImpl Lib, -                                         StringRef &Res) const = 0; -  public:    typedef iterator_range<symbol_iterator> symbol_iterator_range;    symbol_iterator_range symbols() const { @@ -313,9 +280,6 @@ public:      return section_iterator_range(section_begin(), section_end());    } -  virtual library_iterator needed_library_begin() const = 0; -  virtual library_iterator needed_library_end() const = 0; -    /// @brief The number of bytes used to represent an address in this object    ///        file format.    virtual uint8_t getBytesInAddress() const = 0; @@ -323,21 +287,26 @@ public:    virtual StringRef getFileFormatName() const = 0;    virtual /* Triple::ArchType */ unsigned getArch() const = 0; -  /// For shared objects, returns the name which this object should be -  /// loaded from at runtime. This corresponds to DT_SONAME on ELF and -  /// LC_ID_DYLIB (install name) on MachO. -  virtual StringRef getLoadName() const = 0; +  /// Returns platform-specific object flags, if any. +  virtual std::error_code getPlatformFlags(unsigned &Result) const { +    Result = 0; +    return object_error::invalid_file_type; +  } + +  /// True if this is a relocatable object (.o/.obj). +  virtual bool isRelocatableObject() const = 0;    /// @returns Pointer to ObjectFile subclass to handle this type of object.    /// @param ObjectPath The path to the object file. ObjectPath.isObject must    ///        return true.    /// @brief Create ObjectFile from path. -  static ErrorOr<ObjectFile *> createObjectFile(StringRef ObjectPath); -  static ErrorOr<ObjectFile *> -  createObjectFile(std::unique_ptr<MemoryBuffer> &Object, -                   sys::fs::file_magic Type); -  static ErrorOr<ObjectFile *> -  createObjectFile(std::unique_ptr<MemoryBuffer> &Object) { +  static ErrorOr<OwningBinary<ObjectFile>> +  createObjectFile(StringRef ObjectPath); + +  static ErrorOr<std::unique_ptr<ObjectFile>> +  createObjectFile(MemoryBufferRef Object, sys::fs::file_magic Type); +  static ErrorOr<std::unique_ptr<ObjectFile>> +  createObjectFile(MemoryBufferRef Object) {      return createObjectFile(Object, sys::fs::file_magic::unknown);    } @@ -346,13 +315,14 @@ public:      return v->isObject();    } -public: -  static ErrorOr<ObjectFile *> -  createCOFFObjectFile(std::unique_ptr<MemoryBuffer> Object); -  static ErrorOr<ObjectFile *> -  createELFObjectFile(std::unique_ptr<MemoryBuffer> &Object); -  static ErrorOr<ObjectFile *> -  createMachOObjectFile(std::unique_ptr<MemoryBuffer> &Object); +  static ErrorOr<std::unique_ptr<COFFObjectFile>> +  createCOFFObjectFile(MemoryBufferRef Object); + +  static ErrorOr<std::unique_ptr<ObjectFile>> +  createELFObjectFile(MemoryBufferRef Object); + +  static ErrorOr<std::unique_ptr<MachOObjectFile>> +  createMachOObjectFile(MemoryBufferRef Object);  };  // Inline function definitions. @@ -383,6 +353,10 @@ inline std::error_code SymbolRef::getType(SymbolRef::Type &Result) const {    return getObject()->getSymbolType(getRawDataRefImpl(), Result);  } +inline std::error_code SymbolRef::getOther(uint8_t &Result) const { +  return getObject()->getSymbolOther(getRawDataRefImpl(), Result); +} +  inline const ObjectFile *SymbolRef::getObject() const {    const SymbolicFile *O = BasicSymbolRef::getObject();    return cast<ObjectFile>(O); @@ -415,54 +389,53 @@ inline std::error_code SectionRef::getName(StringRef &Result) const {    return OwningObject->getSectionName(SectionPimpl, Result);  } -inline std::error_code SectionRef::getAddress(uint64_t &Result) const { -  return OwningObject->getSectionAddress(SectionPimpl, Result); +inline uint64_t SectionRef::getAddress() const { +  return OwningObject->getSectionAddress(SectionPimpl);  } -inline std::error_code SectionRef::getSize(uint64_t &Result) const { -  return OwningObject->getSectionSize(SectionPimpl, Result); +inline uint64_t SectionRef::getSize() const { +  return OwningObject->getSectionSize(SectionPimpl);  }  inline std::error_code SectionRef::getContents(StringRef &Result) const {    return OwningObject->getSectionContents(SectionPimpl, Result);  } -inline std::error_code SectionRef::getAlignment(uint64_t &Result) const { -  return OwningObject->getSectionAlignment(SectionPimpl, Result); +inline uint64_t SectionRef::getAlignment() const { +  return OwningObject->getSectionAlignment(SectionPimpl);  } -inline std::error_code SectionRef::isText(bool &Result) const { -  return OwningObject->isSectionText(SectionPimpl, Result); +inline bool SectionRef::isText() const { +  return OwningObject->isSectionText(SectionPimpl);  } -inline std::error_code SectionRef::isData(bool &Result) const { -  return OwningObject->isSectionData(SectionPimpl, Result); +inline bool SectionRef::isData() const { +  return OwningObject->isSectionData(SectionPimpl);  } -inline std::error_code SectionRef::isBSS(bool &Result) const { -  return OwningObject->isSectionBSS(SectionPimpl, Result); +inline bool SectionRef::isBSS() const { +  return OwningObject->isSectionBSS(SectionPimpl);  } -inline std::error_code SectionRef::isRequiredForExecution(bool &Result) const { -  return OwningObject->isSectionRequiredForExecution(SectionPimpl, Result); +inline bool SectionRef::isRequiredForExecution() const { +  return OwningObject->isSectionRequiredForExecution(SectionPimpl);  } -inline std::error_code SectionRef::isVirtual(bool &Result) const { -  return OwningObject->isSectionVirtual(SectionPimpl, Result); +inline bool SectionRef::isVirtual() const { +  return OwningObject->isSectionVirtual(SectionPimpl);  } -inline std::error_code SectionRef::isZeroInit(bool &Result) const { -  return OwningObject->isSectionZeroInit(SectionPimpl, Result); +inline bool SectionRef::isZeroInit() const { +  return OwningObject->isSectionZeroInit(SectionPimpl);  } -inline std::error_code SectionRef::isReadOnlyData(bool &Result) const { -  return OwningObject->isSectionReadOnlyData(SectionPimpl, Result); +inline bool SectionRef::isReadOnlyData() const { +  return OwningObject->isSectionReadOnlyData(SectionPimpl);  } -inline std::error_code SectionRef::containsSymbol(SymbolRef S, -                                                  bool &Result) const { +inline bool SectionRef::containsSymbol(SymbolRef S) const {    return OwningObject->sectionContainsSymbol(SectionPimpl, -                                             S.getRawDataRefImpl(), Result); +                                             S.getRawDataRefImpl());  }  inline relocation_iterator SectionRef::relocation_begin() const { @@ -533,26 +506,6 @@ inline const ObjectFile *RelocationRef::getObjectFile() const {    return OwningObject;  } -// Inline function definitions. -inline LibraryRef::LibraryRef(DataRefImpl LibraryP, const ObjectFile *Owner) -  : LibraryPimpl(LibraryP) -  , OwningObject(Owner) {} - -inline bool LibraryRef::operator==(const LibraryRef &Other) const { -  return LibraryPimpl == Other.LibraryPimpl; -} - -inline bool LibraryRef::operator<(const LibraryRef &Other) const { -  return LibraryPimpl < Other.LibraryPimpl; -} - -inline std::error_code LibraryRef::getNext(LibraryRef &Result) const { -  return OwningObject->getLibraryNext(LibraryPimpl, Result); -} - -inline std::error_code LibraryRef::getPath(StringRef &Result) const { -  return OwningObject->getLibraryPath(LibraryPimpl, Result); -}  } // end namespace object  } // end namespace llvm diff --git a/include/llvm/Object/RelocVisitor.h b/include/llvm/Object/RelocVisitor.h index 5ca2450..91eafd5 100644 --- a/include/llvm/Object/RelocVisitor.h +++ b/include/llvm/Object/RelocVisitor.h @@ -17,6 +17,7 @@  #define LLVM_OBJECT_RELOCVISITOR_H  #include "llvm/ADT/StringRef.h" +#include "llvm/Object/COFF.h"  #include "llvm/Object/ELFObjectFile.h"  #include "llvm/Object/ObjectFile.h"  #include "llvm/Support/Debug.h" @@ -40,22 +41,39 @@ struct RelocToApply {  /// @brief Base class for object file relocation visitors.  class RelocVisitor {  public: -  explicit RelocVisitor(StringRef FileFormat) -    : FileFormat(FileFormat), HasError(false) {} +  explicit RelocVisitor(const ObjectFile &Obj) +    : ObjToVisit(Obj), HasError(false) {}    // TODO: Should handle multiple applied relocations via either passing in the    // previously computed value or just count paired relocations as a single    // visit. -  RelocToApply visit(uint32_t RelocType, RelocationRef R, uint64_t SecAddr = 0, -                     uint64_t Value = 0) { -    if (FileFormat == "ELF64-x86-64") { -      switch (RelocType) { +  RelocToApply visit(uint32_t RelocType, RelocationRef R, uint64_t Value = 0) { +    if (isa<ELFObjectFileBase>(ObjToVisit)) +      return visitELF(RelocType, R, Value); +    if (isa<COFFObjectFile>(ObjToVisit)) +      return visitCOFF(RelocType, R, Value); + +    HasError = true; +    return RelocToApply(); +  } + +  bool error() { return HasError; } + +private: +  const ObjectFile &ObjToVisit; +  bool HasError; + +  RelocToApply visitELF(uint32_t RelocType, RelocationRef R, uint64_t Value) { +    if (ObjToVisit.getBytesInAddress() == 8) { // 64-bit object file +      switch (ObjToVisit.getArch()) { +      case Triple::x86_64: +        switch (RelocType) {          case llvm::ELF::R_X86_64_NONE:            return visitELF_X86_64_NONE(R);          case llvm::ELF::R_X86_64_64:            return visitELF_X86_64_64(R, Value);          case llvm::ELF::R_X86_64_PC32: -          return visitELF_X86_64_PC32(R, Value, SecAddr); +          return visitELF_X86_64_PC32(R, Value);          case llvm::ELF::R_X86_64_32:            return visitELF_X86_64_32(R, Value);          case llvm::ELF::R_X86_64_32S: @@ -63,116 +81,147 @@ public:          default:            HasError = true;            return RelocToApply(); -      } -    } else if (FileFormat == "ELF32-i386") { -      switch (RelocType) { -      case llvm::ELF::R_386_NONE: -        return visitELF_386_NONE(R); -      case llvm::ELF::R_386_32: -        return visitELF_386_32(R, Value); -      case llvm::ELF::R_386_PC32: -        return visitELF_386_PC32(R, Value, SecAddr); -      default: -        HasError = true; -        return RelocToApply(); -      } -    } else if (FileFormat == "ELF64-ppc64") { -      switch (RelocType) { -      case llvm::ELF::R_PPC64_ADDR32: -        return visitELF_PPC64_ADDR32(R, Value); -      case llvm::ELF::R_PPC64_ADDR64: -        return visitELF_PPC64_ADDR64(R, Value); -      default: -        HasError = true; -        return RelocToApply(); -      } -    } else if (FileFormat == "ELF32-ppc") { -      switch (RelocType) { -      case llvm::ELF::R_PPC_ADDR32: -        return visitELF_PPC_ADDR32(R, Value); -      default: -        HasError = true; -        return RelocToApply(); -      } -    } else if (FileFormat == "ELF32-mips") { -      switch (RelocType) { -      case llvm::ELF::R_MIPS_32: -        return visitELF_MIPS_32(R, Value); -      default: -        HasError = true; -        return RelocToApply(); -      } -    } else if (FileFormat == "ELF64-mips") { -      switch (RelocType) { -      case llvm::ELF::R_MIPS_32: -        return visitELF_MIPS_32(R, Value); -      case llvm::ELF::R_MIPS_64: -        return visitELF_MIPS_64(R, Value); -      default: -        HasError = true; -        return RelocToApply(); -      } -    } else if (FileFormat == "ELF64-aarch64") { -      switch (RelocType) { -      case llvm::ELF::R_AARCH64_ABS32: -        return visitELF_AARCH64_ABS32(R, Value); -      case llvm::ELF::R_AARCH64_ABS64: -        return visitELF_AARCH64_ABS64(R, Value); -      default: -        HasError = true; -        return RelocToApply(); -      } -    } else if (FileFormat == "ELF64-s390") { -      switch (RelocType) { -      case llvm::ELF::R_390_32: -        return visitELF_390_32(R, Value); -      case llvm::ELF::R_390_64: -        return visitELF_390_64(R, Value); +        } +      case Triple::aarch64: +        switch (RelocType) { +        case llvm::ELF::R_AARCH64_ABS32: +          return visitELF_AARCH64_ABS32(R, Value); +        case llvm::ELF::R_AARCH64_ABS64: +          return visitELF_AARCH64_ABS64(R, Value); +        default: +          HasError = true; +          return RelocToApply(); +        } +      case Triple::mips64el: +      case Triple::mips64: +        switch (RelocType) { +        case llvm::ELF::R_MIPS_32: +          return visitELF_MIPS_32(R, Value); +        case llvm::ELF::R_MIPS_64: +          return visitELF_MIPS_64(R, Value); +        default: +          HasError = true; +          return RelocToApply(); +        } +      case Triple::ppc64le: +      case Triple::ppc64: +        switch (RelocType) { +        case llvm::ELF::R_PPC64_ADDR32: +          return visitELF_PPC64_ADDR32(R, Value); +        case llvm::ELF::R_PPC64_ADDR64: +          return visitELF_PPC64_ADDR64(R, Value); +        default: +          HasError = true; +          return RelocToApply(); +        } +      case Triple::systemz: +        switch (RelocType) { +        case llvm::ELF::R_390_32: +          return visitELF_390_32(R, Value); +        case llvm::ELF::R_390_64: +          return visitELF_390_64(R, Value); +        default: +          HasError = true; +          return RelocToApply(); +        } +      case Triple::sparcv9: +        switch (RelocType) { +        case llvm::ELF::R_SPARC_32: +        case llvm::ELF::R_SPARC_UA32: +          return visitELF_SPARCV9_32(R, Value); +        case llvm::ELF::R_SPARC_64: +        case llvm::ELF::R_SPARC_UA64: +          return visitELF_SPARCV9_64(R, Value); +        default: +          HasError = true; +          return RelocToApply(); +        }        default:          HasError = true;          return RelocToApply();        } -    } else if (FileFormat == "ELF32-sparc") { -      switch (RelocType) { -      case llvm::ELF::R_SPARC_32: -      case llvm::ELF::R_SPARC_UA32: -        return visitELF_SPARC_32(R, Value); +    } else if (ObjToVisit.getBytesInAddress() == 4) { // 32-bit object file +      switch (ObjToVisit.getArch()) { +      case Triple::x86: +        switch (RelocType) { +        case llvm::ELF::R_386_NONE: +          return visitELF_386_NONE(R); +        case llvm::ELF::R_386_32: +          return visitELF_386_32(R, Value); +        case llvm::ELF::R_386_PC32: +          return visitELF_386_PC32(R, Value); +        default: +          HasError = true; +          return RelocToApply(); +        } +      case Triple::ppc: +        switch (RelocType) { +        case llvm::ELF::R_PPC_ADDR32: +          return visitELF_PPC_ADDR32(R, Value); +        default: +          HasError = true; +          return RelocToApply(); +        } +      case Triple::arm: +      case Triple::armeb: +        switch (RelocType) { +        default: +          HasError = true; +          return RelocToApply(); +        case llvm::ELF::R_ARM_ABS32: +          return visitELF_ARM_ABS32(R, Value); +        } +      case Triple::mipsel: +      case Triple::mips: +        switch (RelocType) { +        case llvm::ELF::R_MIPS_32: +          return visitELF_MIPS_32(R, Value); +        default: +          HasError = true; +          return RelocToApply(); +        } +      case Triple::sparc: +        switch (RelocType) { +        case llvm::ELF::R_SPARC_32: +        case llvm::ELF::R_SPARC_UA32: +          return visitELF_SPARC_32(R, Value); +        default: +          HasError = true; +          return RelocToApply(); +        }        default:          HasError = true;          return RelocToApply();        } -    } else if (FileFormat == "ELF64-sparc") { +    } else { +      report_fatal_error("Invalid word size in object file"); +    } +  } + +  RelocToApply visitCOFF(uint32_t RelocType, RelocationRef R, uint64_t Value) { +    switch (ObjToVisit.getArch()) { +    case Triple::x86:        switch (RelocType) { -      case llvm::ELF::R_SPARC_32: -      case llvm::ELF::R_SPARC_UA32: -        return visitELF_SPARCV9_32(R, Value); -      case llvm::ELF::R_SPARC_64: -      case llvm::ELF::R_SPARC_UA64: -        return visitELF_SPARCV9_64(R, Value); -      default: -        HasError = true; -        return RelocToApply(); +      case COFF::IMAGE_REL_I386_SECREL: +        return visitCOFF_I386_SECREL(R, Value); +      case COFF::IMAGE_REL_I386_DIR32: +        return visitCOFF_I386_DIR32(R, Value);        } -    } else if (FileFormat == "ELF32-arm") { +      break; +    case Triple::x86_64:        switch (RelocType) { -      default: -        HasError = true; -        return RelocToApply(); -      case llvm::ELF::R_ARM_ABS32: -        return visitELF_ARM_ABS32(R, Value); +      case COFF::IMAGE_REL_AMD64_SECREL: +        return visitCOFF_AMD64_SECREL(R, Value); +      case COFF::IMAGE_REL_AMD64_ADDR64: +        return visitCOFF_AMD64_ADDR64(R, Value);        } +      break;      }      HasError = true;      return RelocToApply();    } -  bool error() { return HasError; } - -private: -  StringRef FileFormat; -  bool HasError; - -  int64_t getAddend32LE(RelocationRef R) { +  int64_t getELFAddend32LE(RelocationRef R) {      const ELF32LEObjectFile *Obj = cast<ELF32LEObjectFile>(R.getObjectFile());      DataRefImpl DRI = R.getRawDataRefImpl();      int64_t Addend; @@ -180,7 +229,7 @@ private:      return Addend;    } -  int64_t getAddend64LE(RelocationRef R) { +  int64_t getELFAddend64LE(RelocationRef R) {      const ELF64LEObjectFile *Obj = cast<ELF64LEObjectFile>(R.getObjectFile());      DataRefImpl DRI = R.getRawDataRefImpl();      int64_t Addend; @@ -188,7 +237,7 @@ private:      return Addend;    } -  int64_t getAddend32BE(RelocationRef R) { +  int64_t getELFAddend32BE(RelocationRef R) {      const ELF32BEObjectFile *Obj = cast<ELF32BEObjectFile>(R.getObjectFile());      DataRefImpl DRI = R.getRawDataRefImpl();      int64_t Addend; @@ -196,7 +245,7 @@ private:      return Addend;    } -  int64_t getAddend64BE(RelocationRef R) { +  int64_t getELFAddend64BE(RelocationRef R) {      const ELF64BEObjectFile *Obj = cast<ELF64BEObjectFile>(R.getObjectFile());      DataRefImpl DRI = R.getRawDataRefImpl();      int64_t Addend; @@ -213,13 +262,12 @@ private:    // Ideally the Addend here will be the addend in the data for    // the relocation. It's not actually the case for Rel relocations.    RelocToApply visitELF_386_32(RelocationRef R, uint64_t Value) { -    int64_t Addend = getAddend32LE(R); +    int64_t Addend = getELFAddend32LE(R);      return RelocToApply(Value + Addend, 4);    } -  RelocToApply visitELF_386_PC32(RelocationRef R, uint64_t Value, -                                 uint64_t SecAddr) { -    int64_t Addend = getAddend32LE(R); +  RelocToApply visitELF_386_PC32(RelocationRef R, uint64_t Value) { +    int64_t Addend = getELFAddend32LE(R);      uint64_t Address;      R.getOffset(Address);      return RelocToApply(Value + Addend - Address, 4); @@ -230,23 +278,22 @@ private:      return RelocToApply(0, 0);    }    RelocToApply visitELF_X86_64_64(RelocationRef R, uint64_t Value) { -    int64_t Addend = getAddend64LE(R); +    int64_t Addend = getELFAddend64LE(R);      return RelocToApply(Value + Addend, 8);    } -  RelocToApply visitELF_X86_64_PC32(RelocationRef R, uint64_t Value, -                                    uint64_t SecAddr) { -    int64_t Addend = getAddend64LE(R); +  RelocToApply visitELF_X86_64_PC32(RelocationRef R, uint64_t Value) { +    int64_t Addend = getELFAddend64LE(R);      uint64_t Address;      R.getOffset(Address);      return RelocToApply(Value + Addend - Address, 4);    }    RelocToApply visitELF_X86_64_32(RelocationRef R, uint64_t Value) { -    int64_t Addend = getAddend64LE(R); +    int64_t Addend = getELFAddend64LE(R);      uint32_t Res = (Value + Addend) & 0xFFFFFFFF;      return RelocToApply(Res, 4);    }    RelocToApply visitELF_X86_64_32S(RelocationRef R, uint64_t Value) { -    int64_t Addend = getAddend64LE(R); +    int64_t Addend = getELFAddend64LE(R);      int32_t Res = (Value + Addend) & 0xFFFFFFFF;      return RelocToApply(Res, 4);    } @@ -266,7 +313,7 @@ private:    /// PPC32 ELF    RelocToApply visitELF_PPC_ADDR32(RelocationRef R, uint64_t Value) { -    int64_t Addend = getAddend32BE(R); +    int64_t Addend = getELFAddend32BE(R);      uint32_t Res = (Value + Addend) & 0xFFFFFFFF;      return RelocToApply(Res, 4);    } @@ -288,7 +335,8 @@ private:    // AArch64 ELF    RelocToApply visitELF_AARCH64_ABS32(RelocationRef R, uint64_t Value) { -    int64_t Addend = getAddend64LE(R); +    int64_t Addend; +    getELFRelocationAddend(R, Addend);      int64_t Res =  Value + Addend;      // Overflow check allows for both signed and unsigned interpretation. @@ -299,13 +347,14 @@ private:    }    RelocToApply visitELF_AARCH64_ABS64(RelocationRef R, uint64_t Value) { -    int64_t Addend = getAddend64LE(R); +    int64_t Addend; +    getELFRelocationAddend(R, Addend);      return RelocToApply(Value + Addend, 8);    }    // SystemZ ELF    RelocToApply visitELF_390_32(RelocationRef R, uint64_t Value) { -    int64_t Addend = getAddend64BE(R); +    int64_t Addend = getELFAddend64BE(R);      int64_t Res = Value + Addend;      // Overflow check allows for both signed and unsigned interpretation. @@ -316,30 +365,54 @@ private:    }    RelocToApply visitELF_390_64(RelocationRef R, uint64_t Value) { -    int64_t Addend = getAddend64BE(R); +    int64_t Addend = getELFAddend64BE(R);      return RelocToApply(Value + Addend, 8);    }    RelocToApply visitELF_SPARC_32(RelocationRef R, uint32_t Value) { -    int32_t Addend = getAddend32BE(R); +    int32_t Addend = getELFAddend32BE(R);      return RelocToApply(Value + Addend, 4);    }    RelocToApply visitELF_SPARCV9_32(RelocationRef R, uint64_t Value) { -    int32_t Addend = getAddend64BE(R); +    int32_t Addend = getELFAddend64BE(R);      return RelocToApply(Value + Addend, 4);    }    RelocToApply visitELF_SPARCV9_64(RelocationRef R, uint64_t Value) { -    int64_t Addend = getAddend64BE(R); +    int64_t Addend = getELFAddend64BE(R);      return RelocToApply(Value + Addend, 8);    }    RelocToApply visitELF_ARM_ABS32(RelocationRef R, uint64_t Value) { -    int64_t Addend = getAddend32LE(R); -    return RelocToApply(Value + Addend, 4); +    int64_t Addend; +    getELFRelocationAddend(R, Addend); +    int64_t Res = Value + Addend; + +    // Overflow check allows for both signed and unsigned interpretation. +    if (Res < INT32_MIN || Res > UINT32_MAX) +      HasError = true; + +    return RelocToApply(static_cast<uint32_t>(Res), 4);    } +  /// I386 COFF +  RelocToApply visitCOFF_I386_SECREL(RelocationRef R, uint64_t Value) { +    return RelocToApply(static_cast<uint32_t>(Value), /*Width=*/4); +  } + +  RelocToApply visitCOFF_I386_DIR32(RelocationRef R, uint64_t Value) { +    return RelocToApply(static_cast<uint32_t>(Value), /*Width=*/4); +  } + +  /// AMD64 COFF +  RelocToApply visitCOFF_AMD64_SECREL(RelocationRef R, uint64_t Value) { +    return RelocToApply(static_cast<uint32_t>(Value), /*Width=*/4); +  } + +  RelocToApply visitCOFF_AMD64_ADDR64(RelocationRef R, uint64_t Value) { +    return RelocToApply(Value, /*Width=*/8); +  }  };  } diff --git a/include/llvm/Object/SymbolicFile.h b/include/llvm/Object/SymbolicFile.h index 77eef4a..435799a 100644 --- a/include/llvm/Object/SymbolicFile.h +++ b/include/llvm/Object/SymbolicFile.h @@ -11,8 +11,8 @@  //  //===----------------------------------------------------------------------===// -#ifndef LLVM_OBJECT_SYMBOLIC_FILE_H -#define LLVM_OBJECT_SYMBOLIC_FILE_H +#ifndef LLVM_OBJECT_SYMBOLICFILE_H +#define LLVM_OBJECT_SYMBOLICFILE_H  #include "llvm/Object/Binary.h" @@ -87,8 +87,9 @@ public:      SF_Absolute = 1U << 3,       // Absolute symbol      SF_Common = 1U << 4,         // Symbol has common linkage      SF_Indirect = 1U << 5,       // Symbol is an alias to another symbol -    SF_FormatSpecific = 1U << 6  // Specific to the object file format +    SF_FormatSpecific = 1U << 6, // Specific to the object file format                                   // (e.g. section symbols) +    SF_Thumb = 1U << 7           // Thumb symbol in a 32-bit ARM binary    };    BasicSymbolRef() : OwningObject(nullptr) { } @@ -115,7 +116,7 @@ const uint64_t UnknownAddressOrSize = ~0ULL;  class SymbolicFile : public Binary {  public:    virtual ~SymbolicFile(); -  SymbolicFile(unsigned int Type, std::unique_ptr<MemoryBuffer> Source); +  SymbolicFile(unsigned int Type, MemoryBufferRef Source);    // virtual interface.    virtual void moveSymbolNext(DataRefImpl &Symb) const = 0; @@ -142,15 +143,16 @@ public:    }    // construction aux. -  static ErrorOr<SymbolicFile *> -  createSymbolicFile(std::unique_ptr<MemoryBuffer> &Object, -                     sys::fs::file_magic Type, LLVMContext *Context); +  static ErrorOr<std::unique_ptr<SymbolicFile>> +  createSymbolicFile(MemoryBufferRef Object, sys::fs::file_magic Type, +                     LLVMContext *Context); -  static ErrorOr<SymbolicFile *> -  createSymbolicFile(std::unique_ptr<MemoryBuffer> &Object) { +  static ErrorOr<std::unique_ptr<SymbolicFile>> +  createSymbolicFile(MemoryBufferRef Object) {      return createSymbolicFile(Object, sys::fs::file_magic::unknown, nullptr);    } -  static ErrorOr<SymbolicFile *> createSymbolicFile(StringRef ObjectPath); +  static ErrorOr<OwningBinary<SymbolicFile>> +  createSymbolicFile(StringRef ObjectPath);    static inline bool classof(const Binary *v) {      return v->isSymbolic(); | 
