| //===- Chunks.h -------------------------------------------------*- C++ -*-===// |
| // |
| // The LLVM Linker |
| // |
| // This file is distributed under the University of Illinois Open Source |
| // License. See LICENSE.TXT for details. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #ifndef LLD_COFF_CHUNKS_H |
| #define LLD_COFF_CHUNKS_H |
| |
| #include "Config.h" |
| #include "InputFiles.h" |
| #include "lld/Common/LLVM.h" |
| #include "llvm/ADT/ArrayRef.h" |
| #include "llvm/ADT/iterator.h" |
| #include "llvm/ADT/iterator_range.h" |
| #include "llvm/MC/StringTableBuilder.h" |
| #include "llvm/Object/COFF.h" |
| #include <utility> |
| #include <vector> |
| |
| namespace lld { |
| namespace coff { |
| |
| using llvm::COFF::ImportDirectoryTableEntry; |
| using llvm::object::COFFSymbolRef; |
| using llvm::object::SectionRef; |
| using llvm::object::coff_relocation; |
| using llvm::object::coff_section; |
| |
| class Baserel; |
| class Defined; |
| class DefinedImportData; |
| class DefinedRegular; |
| class ObjFile; |
| class OutputSection; |
| class Symbol; |
| |
| // Mask for permissions (discardable, writable, readable, executable, etc). |
| const uint32_t PermMask = 0xFE000000; |
| |
| // Mask for section types (code, data, bss). |
| const uint32_t TypeMask = 0x000000E0; |
| |
| // A Chunk represents a chunk of data that will occupy space in the |
| // output (if the resolver chose that). It may or may not be backed by |
| // a section of an input file. It could be linker-created data, or |
| // doesn't even have actual data (if common or bss). |
| class Chunk { |
| public: |
| enum Kind { SectionKind, OtherKind }; |
| Kind kind() const { return ChunkKind; } |
| virtual ~Chunk() = default; |
| |
| // Returns the size of this chunk (even if this is a common or BSS.) |
| virtual size_t getSize() const = 0; |
| |
| // Write this chunk to a mmap'ed file, assuming Buf is pointing to |
| // beginning of the file. Because this function may use RVA values |
| // of other chunks for relocations, you need to set them properly |
| // before calling this function. |
| virtual void writeTo(uint8_t *Buf) const {} |
| |
| // Called by the writer after an RVA is assigned, but before calling |
| // getSize(). |
| virtual void finalizeContents() {} |
| |
| // The writer sets and uses the addresses. |
| uint64_t getRVA() const { return RVA; } |
| void setRVA(uint64_t V) { RVA = V; } |
| |
| // Returns true if this has non-zero data. BSS chunks return |
| // false. If false is returned, the space occupied by this chunk |
| // will be filled with zeros. |
| virtual bool hasData() const { return true; } |
| |
| // Returns readable/writable/executable bits. |
| virtual uint32_t getOutputCharacteristics() const { return 0; } |
| |
| // Returns the section name if this is a section chunk. |
| // It is illegal to call this function on non-section chunks. |
| virtual StringRef getSectionName() const { |
| llvm_unreachable("unimplemented getSectionName"); |
| } |
| |
| // An output section has pointers to chunks in the section, and each |
| // chunk has a back pointer to an output section. |
| void setOutputSection(OutputSection *O) { Out = O; } |
| OutputSection *getOutputSection() const { return Out; } |
| |
| // Windows-specific. |
| // Collect all locations that contain absolute addresses for base relocations. |
| virtual void getBaserels(std::vector<Baserel> *Res) {} |
| |
| // Returns a human-readable name of this chunk. Chunks are unnamed chunks of |
| // bytes, so this is used only for logging or debugging. |
| virtual StringRef getDebugName() { return ""; } |
| |
| // The alignment of this chunk. The writer uses the value. |
| uint32_t Alignment = 1; |
| |
| protected: |
| Chunk(Kind K = OtherKind) : ChunkKind(K) {} |
| const Kind ChunkKind; |
| |
| // The RVA of this chunk in the output. The writer sets a value. |
| uint64_t RVA = 0; |
| |
| // The output section for this chunk. |
| OutputSection *Out = nullptr; |
| |
| public: |
| // The offset from beginning of the output section. The writer sets a value. |
| uint64_t OutputSectionOff = 0; |
| }; |
| |
| // A chunk corresponding a section of an input file. |
| class SectionChunk final : public Chunk { |
| // Identical COMDAT Folding feature accesses section internal data. |
| friend class ICF; |
| |
| public: |
| class symbol_iterator : public llvm::iterator_adaptor_base< |
| symbol_iterator, const coff_relocation *, |
| std::random_access_iterator_tag, Symbol *> { |
| friend SectionChunk; |
| |
| ObjFile *File; |
| |
| symbol_iterator(ObjFile *File, const coff_relocation *I) |
| : symbol_iterator::iterator_adaptor_base(I), File(File) {} |
| |
| public: |
| symbol_iterator() = default; |
| |
| Symbol *operator*() const { return File->getSymbol(I->SymbolTableIndex); } |
| }; |
| |
| SectionChunk(ObjFile *File, const coff_section *Header); |
| static bool classof(const Chunk *C) { return C->kind() == SectionKind; } |
| size_t getSize() const override { return Header->SizeOfRawData; } |
| ArrayRef<uint8_t> getContents() const; |
| void writeTo(uint8_t *Buf) const override; |
| bool hasData() const override; |
| uint32_t getOutputCharacteristics() const override; |
| StringRef getSectionName() const override { return SectionName; } |
| void getBaserels(std::vector<Baserel> *Res) override; |
| bool isCOMDAT() const; |
| void applyRelX64(uint8_t *Off, uint16_t Type, OutputSection *OS, uint64_t S, |
| uint64_t P) const; |
| void applyRelX86(uint8_t *Off, uint16_t Type, OutputSection *OS, uint64_t S, |
| uint64_t P) const; |
| void applyRelARM(uint8_t *Off, uint16_t Type, OutputSection *OS, uint64_t S, |
| uint64_t P) const; |
| void applyRelARM64(uint8_t *Off, uint16_t Type, OutputSection *OS, uint64_t S, |
| uint64_t P) const; |
| |
| // Called if the garbage collector decides to not include this chunk |
| // in a final output. It's supposed to print out a log message to stdout. |
| void printDiscardedMessage() const; |
| |
| // Adds COMDAT associative sections to this COMDAT section. A chunk |
| // and its children are treated as a group by the garbage collector. |
| void addAssociative(SectionChunk *Child); |
| |
| StringRef getDebugName() override; |
| |
| // Returns true if the chunk was not dropped by GC. |
| bool isLive() { return Live; } |
| |
| // Used by the garbage collector. |
| void markLive() { |
| assert(Config->DoGC && "should only mark things live from GC"); |
| assert(!isLive() && "Cannot mark an already live section!"); |
| Live = true; |
| } |
| |
| // True if this is a codeview debug info chunk. These will not be laid out in |
| // the image. Instead they will end up in the PDB, if one is requested. |
| bool isCodeView() const { |
| return SectionName == ".debug" || SectionName.startswith(".debug$"); |
| } |
| |
| // True if this is a DWARF debug info or exception handling chunk. |
| bool isDWARF() const { |
| return SectionName.startswith(".debug_") || SectionName == ".eh_frame"; |
| } |
| |
| // Allow iteration over the bodies of this chunk's relocated symbols. |
| llvm::iterator_range<symbol_iterator> symbols() const { |
| return llvm::make_range(symbol_iterator(File, Relocs.begin()), |
| symbol_iterator(File, Relocs.end())); |
| } |
| |
| // Allow iteration over the associated child chunks for this section. |
| ArrayRef<SectionChunk *> children() const { return AssocChildren; } |
| |
| // A pointer pointing to a replacement for this chunk. |
| // Initially it points to "this" object. If this chunk is merged |
| // with other chunk by ICF, it points to another chunk, |
| // and this chunk is considrered as dead. |
| SectionChunk *Repl; |
| |
| // The CRC of the contents as described in the COFF spec 4.5.5. |
| // Auxiliary Format 5: Section Definitions. Used for ICF. |
| uint32_t Checksum = 0; |
| |
| const coff_section *Header; |
| |
| // The file that this chunk was created from. |
| ObjFile *File; |
| |
| // The COMDAT leader symbol if this is a COMDAT chunk. |
| DefinedRegular *Sym = nullptr; |
| |
| ArrayRef<coff_relocation> Relocs; |
| |
| private: |
| StringRef SectionName; |
| std::vector<SectionChunk *> AssocChildren; |
| |
| // Used by the garbage collector. |
| bool Live; |
| |
| // Used for ICF (Identical COMDAT Folding) |
| void replace(SectionChunk *Other); |
| uint32_t Class[2] = {0, 0}; |
| }; |
| |
| // This class is used to implement an lld-specific feature (not implemented in |
| // MSVC) that minimizes the output size by finding string literals sharing tail |
| // parts and merging them. |
| // |
| // If string tail merging is enabled and a section is identified as containing a |
| // string literal, it is added to a MergeChunk with an appropriate alignment. |
| // The MergeChunk then tail merges the strings using the StringTableBuilder |
| // class and assigns RVAs and section offsets to each of the member chunks based |
| // on the offsets assigned by the StringTableBuilder. |
| class MergeChunk : public Chunk { |
| public: |
| MergeChunk(uint32_t Alignment); |
| static void addSection(SectionChunk *C); |
| void finalizeContents() override; |
| |
| uint32_t getOutputCharacteristics() const override; |
| StringRef getSectionName() const override { return ".rdata"; } |
| size_t getSize() const override; |
| void writeTo(uint8_t *Buf) const override; |
| |
| static std::map<uint32_t, MergeChunk *> Instances; |
| std::vector<SectionChunk *> Sections; |
| |
| private: |
| llvm::StringTableBuilder Builder; |
| }; |
| |
| // A chunk for common symbols. Common chunks don't have actual data. |
| class CommonChunk : public Chunk { |
| public: |
| CommonChunk(const COFFSymbolRef Sym); |
| size_t getSize() const override { return Sym.getValue(); } |
| bool hasData() const override { return false; } |
| uint32_t getOutputCharacteristics() const override; |
| StringRef getSectionName() const override { return ".bss"; } |
| |
| private: |
| const COFFSymbolRef Sym; |
| }; |
| |
| // A chunk for linker-created strings. |
| class StringChunk : public Chunk { |
| public: |
| explicit StringChunk(StringRef S) : Str(S) {} |
| size_t getSize() const override { return Str.size() + 1; } |
| void writeTo(uint8_t *Buf) const override; |
| |
| private: |
| StringRef Str; |
| }; |
| |
| static const uint8_t ImportThunkX86[] = { |
| 0xff, 0x25, 0x00, 0x00, 0x00, 0x00, // JMP *0x0 |
| }; |
| |
| static const uint8_t ImportThunkARM[] = { |
| 0x40, 0xf2, 0x00, 0x0c, // mov.w ip, #0 |
| 0xc0, 0xf2, 0x00, 0x0c, // mov.t ip, #0 |
| 0xdc, 0xf8, 0x00, 0xf0, // ldr.w pc, [ip] |
| }; |
| |
| static const uint8_t ImportThunkARM64[] = { |
| 0x10, 0x00, 0x00, 0x90, // adrp x16, #0 |
| 0x10, 0x02, 0x40, 0xf9, // ldr x16, [x16] |
| 0x00, 0x02, 0x1f, 0xd6, // br x16 |
| }; |
| |
| // Windows-specific. |
| // A chunk for DLL import jump table entry. In a final output, it's |
| // contents will be a JMP instruction to some __imp_ symbol. |
| class ImportThunkChunkX64 : public Chunk { |
| public: |
| explicit ImportThunkChunkX64(Defined *S); |
| size_t getSize() const override { return sizeof(ImportThunkX86); } |
| void writeTo(uint8_t *Buf) const override; |
| |
| private: |
| Defined *ImpSymbol; |
| }; |
| |
| class ImportThunkChunkX86 : public Chunk { |
| public: |
| explicit ImportThunkChunkX86(Defined *S) : ImpSymbol(S) {} |
| size_t getSize() const override { return sizeof(ImportThunkX86); } |
| void getBaserels(std::vector<Baserel> *Res) override; |
| void writeTo(uint8_t *Buf) const override; |
| |
| private: |
| Defined *ImpSymbol; |
| }; |
| |
| class ImportThunkChunkARM : public Chunk { |
| public: |
| explicit ImportThunkChunkARM(Defined *S) : ImpSymbol(S) {} |
| size_t getSize() const override { return sizeof(ImportThunkARM); } |
| void getBaserels(std::vector<Baserel> *Res) override; |
| void writeTo(uint8_t *Buf) const override; |
| |
| private: |
| Defined *ImpSymbol; |
| }; |
| |
| class ImportThunkChunkARM64 : public Chunk { |
| public: |
| explicit ImportThunkChunkARM64(Defined *S) : ImpSymbol(S) {} |
| size_t getSize() const override { return sizeof(ImportThunkARM64); } |
| void writeTo(uint8_t *Buf) const override; |
| |
| private: |
| Defined *ImpSymbol; |
| }; |
| |
| // Windows-specific. |
| // See comments for DefinedLocalImport class. |
| class LocalImportChunk : public Chunk { |
| public: |
| explicit LocalImportChunk(Defined *S) : Sym(S) { |
| Alignment = Config->is64() ? 8 : 4; |
| } |
| size_t getSize() const override; |
| void getBaserels(std::vector<Baserel> *Res) override; |
| void writeTo(uint8_t *Buf) const override; |
| |
| private: |
| Defined *Sym; |
| }; |
| |
| // Duplicate RVAs are not allowed in RVA tables, so unique symbols by chunk and |
| // offset into the chunk. Order does not matter as the RVA table will be sorted |
| // later. |
| struct ChunkAndOffset { |
| Chunk *InputChunk; |
| uint32_t Offset; |
| |
| struct DenseMapInfo { |
| static ChunkAndOffset getEmptyKey() { |
| return {llvm::DenseMapInfo<Chunk *>::getEmptyKey(), 0}; |
| } |
| static ChunkAndOffset getTombstoneKey() { |
| return {llvm::DenseMapInfo<Chunk *>::getTombstoneKey(), 0}; |
| } |
| static unsigned getHashValue(const ChunkAndOffset &CO) { |
| return llvm::DenseMapInfo<std::pair<Chunk *, uint32_t>>::getHashValue( |
| {CO.InputChunk, CO.Offset}); |
| } |
| static bool isEqual(const ChunkAndOffset &LHS, const ChunkAndOffset &RHS) { |
| return LHS.InputChunk == RHS.InputChunk && LHS.Offset == RHS.Offset; |
| } |
| }; |
| }; |
| |
| using SymbolRVASet = llvm::DenseSet<ChunkAndOffset>; |
| |
| // Table which contains symbol RVAs. Used for /safeseh and /guard:cf. |
| class RVATableChunk : public Chunk { |
| public: |
| explicit RVATableChunk(SymbolRVASet S) : Syms(std::move(S)) {} |
| size_t getSize() const override { return Syms.size() * 4; } |
| void writeTo(uint8_t *Buf) const override; |
| |
| private: |
| SymbolRVASet Syms; |
| }; |
| |
| // Windows-specific. |
| // This class represents a block in .reloc section. |
| // See the PE/COFF spec 5.6 for details. |
| class BaserelChunk : public Chunk { |
| public: |
| BaserelChunk(uint32_t Page, Baserel *Begin, Baserel *End); |
| size_t getSize() const override { return Data.size(); } |
| void writeTo(uint8_t *Buf) const override; |
| |
| private: |
| std::vector<uint8_t> Data; |
| }; |
| |
| class Baserel { |
| public: |
| Baserel(uint32_t V, uint8_t Ty) : RVA(V), Type(Ty) {} |
| explicit Baserel(uint32_t V) : Baserel(V, getDefaultType()) {} |
| uint8_t getDefaultType(); |
| |
| uint32_t RVA; |
| uint8_t Type; |
| }; |
| |
| void applyMOV32T(uint8_t *Off, uint32_t V); |
| void applyBranch24T(uint8_t *Off, int32_t V); |
| |
| } // namespace coff |
| } // namespace lld |
| |
| namespace llvm { |
| template <> |
| struct DenseMapInfo<lld::coff::ChunkAndOffset> |
| : lld::coff::ChunkAndOffset::DenseMapInfo {}; |
| } |
| |
| #endif |