xref: /freebsd/contrib/llvm-project/lld/COFF/Writer.cpp (revision fb03ea46eb853b2d128828e9d82882125bcc1657)
10b57cec5SDimitry Andric //===- Writer.cpp ---------------------------------------------------------===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric 
90b57cec5SDimitry Andric #include "Writer.h"
10349cc55cSDimitry Andric #include "COFFLinkerContext.h"
11e8d8bef9SDimitry Andric #include "CallGraphSort.h"
120b57cec5SDimitry Andric #include "Config.h"
130b57cec5SDimitry Andric #include "DLL.h"
140b57cec5SDimitry Andric #include "InputFiles.h"
155ffd83dbSDimitry Andric #include "LLDMapFile.h"
160b57cec5SDimitry Andric #include "MapFile.h"
170b57cec5SDimitry Andric #include "PDB.h"
180b57cec5SDimitry Andric #include "SymbolTable.h"
190b57cec5SDimitry Andric #include "Symbols.h"
200b57cec5SDimitry Andric #include "lld/Common/ErrorHandler.h"
210b57cec5SDimitry Andric #include "lld/Common/Memory.h"
220b57cec5SDimitry Andric #include "lld/Common/Timer.h"
230b57cec5SDimitry Andric #include "llvm/ADT/DenseMap.h"
240b57cec5SDimitry Andric #include "llvm/ADT/STLExtras.h"
25480093f4SDimitry Andric #include "llvm/ADT/StringSet.h"
260b57cec5SDimitry Andric #include "llvm/ADT/StringSwitch.h"
270b57cec5SDimitry Andric #include "llvm/Support/BinaryStreamReader.h"
280b57cec5SDimitry Andric #include "llvm/Support/Debug.h"
290b57cec5SDimitry Andric #include "llvm/Support/Endian.h"
300b57cec5SDimitry Andric #include "llvm/Support/FileOutputBuffer.h"
310b57cec5SDimitry Andric #include "llvm/Support/Parallel.h"
320b57cec5SDimitry Andric #include "llvm/Support/Path.h"
330b57cec5SDimitry Andric #include "llvm/Support/RandomNumberGenerator.h"
340b57cec5SDimitry Andric #include "llvm/Support/xxhash.h"
350b57cec5SDimitry Andric #include <algorithm>
360b57cec5SDimitry Andric #include <cstdio>
370b57cec5SDimitry Andric #include <map>
380b57cec5SDimitry Andric #include <memory>
390b57cec5SDimitry Andric #include <utility>
400b57cec5SDimitry Andric 
410b57cec5SDimitry Andric using namespace llvm;
420b57cec5SDimitry Andric using namespace llvm::COFF;
430b57cec5SDimitry Andric using namespace llvm::object;
440b57cec5SDimitry Andric using namespace llvm::support;
450b57cec5SDimitry Andric using namespace llvm::support::endian;
465ffd83dbSDimitry Andric using namespace lld;
475ffd83dbSDimitry Andric using namespace lld::coff;
480b57cec5SDimitry Andric 
490b57cec5SDimitry Andric /* To re-generate DOSProgram:
500b57cec5SDimitry Andric $ cat > /tmp/DOSProgram.asm
510b57cec5SDimitry Andric org 0
520b57cec5SDimitry Andric         ; Copy cs to ds.
530b57cec5SDimitry Andric         push cs
540b57cec5SDimitry Andric         pop ds
550b57cec5SDimitry Andric         ; Point ds:dx at the $-terminated string.
560b57cec5SDimitry Andric         mov dx, str
570b57cec5SDimitry Andric         ; Int 21/AH=09h: Write string to standard output.
580b57cec5SDimitry Andric         mov ah, 0x9
590b57cec5SDimitry Andric         int 0x21
600b57cec5SDimitry Andric         ; Int 21/AH=4Ch: Exit with return code (in AL).
610b57cec5SDimitry Andric         mov ax, 0x4C01
620b57cec5SDimitry Andric         int 0x21
630b57cec5SDimitry Andric str:
640b57cec5SDimitry Andric         db 'This program cannot be run in DOS mode.$'
650b57cec5SDimitry Andric align 8, db 0
660b57cec5SDimitry Andric $ nasm -fbin /tmp/DOSProgram.asm -o /tmp/DOSProgram.bin
670b57cec5SDimitry Andric $ xxd -i /tmp/DOSProgram.bin
680b57cec5SDimitry Andric */
// Raw bytes of the DOS stub program: 14 bytes of 16-bit code, the
// '$'-terminated message it prints, and zero padding. The grouping below
// follows the assembly listing in the comment above.
static unsigned char dosProgram[] = {
    // push cs; pop ds
    0x0e, 0x1f,
    // mov dx, 0x000e   (0x0e == 14, the offset of the message below)
    0xba, 0x0e, 0x00,
    // mov ah, 0x9; int 0x21
    0xb4, 0x09, 0xcd, 0x21,
    // mov ax, 0x4C01; int 0x21
    0xb8, 0x01, 0x4c, 0xcd, 0x21,
    // 'This program cannot be run in DOS mode.$'
    0x54, 0x68, 0x69, 0x73, 0x20,                   // "This "
    0x70, 0x72, 0x6f, 0x67, 0x72, 0x61, 0x6d, 0x20, // "program "
    0x63, 0x61, 0x6e, 0x6e, 0x6f, 0x74, 0x20,       // "cannot "
    0x62, 0x65, 0x20,                               // "be "
    0x72, 0x75, 0x6e, 0x20,                         // "run "
    0x69, 0x6e, 0x20,                               // "in "
    0x44, 0x4f, 0x53, 0x20,                         // "DOS "
    0x6d, 0x6f, 0x64, 0x65, 0x2e, 0x24,             // "mode.$"
    // Zero padding (the "align 8, db 0" of the listing).
    0x00, 0x00};
static_assert(sizeof(dosProgram) % 8 == 0,
              "DOSProgram size must be multiple of 8");
780b57cec5SDimitry Andric 
790b57cec5SDimitry Andric static const int dosStubSize = sizeof(dos_header) + sizeof(dosProgram);
800b57cec5SDimitry Andric static_assert(dosStubSize % 8 == 0, "DOSStub size must be multiple of 8");
810b57cec5SDimitry Andric 
820b57cec5SDimitry Andric static const int numberOfDataDirectory = 16;
830b57cec5SDimitry Andric 
840b57cec5SDimitry Andric namespace {
850b57cec5SDimitry Andric 
860b57cec5SDimitry Andric class DebugDirectoryChunk : public NonSectionChunk {
870b57cec5SDimitry Andric public:
88349cc55cSDimitry Andric   DebugDirectoryChunk(COFFLinkerContext &c,
89349cc55cSDimitry Andric                       const std::vector<std::pair<COFF::DebugType, Chunk *>> &r,
905ffd83dbSDimitry Andric                       bool writeRepro)
91349cc55cSDimitry Andric       : records(r), writeRepro(writeRepro), ctx(c) {}
920b57cec5SDimitry Andric 
930b57cec5SDimitry Andric   size_t getSize() const override {
940b57cec5SDimitry Andric     return (records.size() + int(writeRepro)) * sizeof(debug_directory);
950b57cec5SDimitry Andric   }
960b57cec5SDimitry Andric 
970b57cec5SDimitry Andric   void writeTo(uint8_t *b) const override {
980b57cec5SDimitry Andric     auto *d = reinterpret_cast<debug_directory *>(b);
990b57cec5SDimitry Andric 
1005ffd83dbSDimitry Andric     for (const std::pair<COFF::DebugType, Chunk *>& record : records) {
1015ffd83dbSDimitry Andric       Chunk *c = record.second;
102349cc55cSDimitry Andric       OutputSection *os = ctx.getOutputSection(c);
1035ffd83dbSDimitry Andric       uint64_t offs = os->getFileOff() + (c->getRVA() - os->getRVA());
1045ffd83dbSDimitry Andric       fillEntry(d, record.first, c->getSize(), c->getRVA(), offs);
1050b57cec5SDimitry Andric       ++d;
1060b57cec5SDimitry Andric     }
1070b57cec5SDimitry Andric 
1080b57cec5SDimitry Andric     if (writeRepro) {
1090b57cec5SDimitry Andric       // FIXME: The COFF spec allows either a 0-sized entry to just say
1100b57cec5SDimitry Andric       // "the timestamp field is really a hash", or a 4-byte size field
1110b57cec5SDimitry Andric       // followed by that many bytes containing a longer hash (with the
1120b57cec5SDimitry Andric       // lowest 4 bytes usually being the timestamp in little-endian order).
1130b57cec5SDimitry Andric       // Consider storing the full 8 bytes computed by xxHash64 here.
1140b57cec5SDimitry Andric       fillEntry(d, COFF::IMAGE_DEBUG_TYPE_REPRO, 0, 0, 0);
1150b57cec5SDimitry Andric     }
1160b57cec5SDimitry Andric   }
1170b57cec5SDimitry Andric 
1180b57cec5SDimitry Andric   void setTimeDateStamp(uint32_t timeDateStamp) {
1190b57cec5SDimitry Andric     for (support::ulittle32_t *tds : timeDateStamps)
1200b57cec5SDimitry Andric       *tds = timeDateStamp;
1210b57cec5SDimitry Andric   }
1220b57cec5SDimitry Andric 
1230b57cec5SDimitry Andric private:
1240b57cec5SDimitry Andric   void fillEntry(debug_directory *d, COFF::DebugType debugType, size_t size,
1250b57cec5SDimitry Andric                  uint64_t rva, uint64_t offs) const {
1260b57cec5SDimitry Andric     d->Characteristics = 0;
1270b57cec5SDimitry Andric     d->TimeDateStamp = 0;
1280b57cec5SDimitry Andric     d->MajorVersion = 0;
1290b57cec5SDimitry Andric     d->MinorVersion = 0;
1300b57cec5SDimitry Andric     d->Type = debugType;
1310b57cec5SDimitry Andric     d->SizeOfData = size;
1320b57cec5SDimitry Andric     d->AddressOfRawData = rva;
1330b57cec5SDimitry Andric     d->PointerToRawData = offs;
1340b57cec5SDimitry Andric 
1350b57cec5SDimitry Andric     timeDateStamps.push_back(&d->TimeDateStamp);
1360b57cec5SDimitry Andric   }
1370b57cec5SDimitry Andric 
1380b57cec5SDimitry Andric   mutable std::vector<support::ulittle32_t *> timeDateStamps;
1395ffd83dbSDimitry Andric   const std::vector<std::pair<COFF::DebugType, Chunk *>> &records;
1400b57cec5SDimitry Andric   bool writeRepro;
141349cc55cSDimitry Andric 
142349cc55cSDimitry Andric   COFFLinkerContext &ctx;
1430b57cec5SDimitry Andric };
1440b57cec5SDimitry Andric 
1450b57cec5SDimitry Andric class CVDebugRecordChunk : public NonSectionChunk {
1460b57cec5SDimitry Andric public:
1470b57cec5SDimitry Andric   size_t getSize() const override {
1480b57cec5SDimitry Andric     return sizeof(codeview::DebugInfo) + config->pdbAltPath.size() + 1;
1490b57cec5SDimitry Andric   }
1500b57cec5SDimitry Andric 
1510b57cec5SDimitry Andric   void writeTo(uint8_t *b) const override {
1520b57cec5SDimitry Andric     // Save off the DebugInfo entry to backfill the file signature (build id)
1530b57cec5SDimitry Andric     // in Writer::writeBuildId
1540b57cec5SDimitry Andric     buildId = reinterpret_cast<codeview::DebugInfo *>(b);
1550b57cec5SDimitry Andric 
1560b57cec5SDimitry Andric     // variable sized field (PDB Path)
1570b57cec5SDimitry Andric     char *p = reinterpret_cast<char *>(b + sizeof(*buildId));
1580b57cec5SDimitry Andric     if (!config->pdbAltPath.empty())
1590b57cec5SDimitry Andric       memcpy(p, config->pdbAltPath.data(), config->pdbAltPath.size());
1600b57cec5SDimitry Andric     p[config->pdbAltPath.size()] = '\0';
1610b57cec5SDimitry Andric   }
1620b57cec5SDimitry Andric 
1630b57cec5SDimitry Andric   mutable codeview::DebugInfo *buildId = nullptr;
1640b57cec5SDimitry Andric };
1650b57cec5SDimitry Andric 
1665ffd83dbSDimitry Andric class ExtendedDllCharacteristicsChunk : public NonSectionChunk {
1675ffd83dbSDimitry Andric public:
1685ffd83dbSDimitry Andric   ExtendedDllCharacteristicsChunk(uint32_t c) : characteristics(c) {}
1695ffd83dbSDimitry Andric 
1705ffd83dbSDimitry Andric   size_t getSize() const override { return 4; }
1715ffd83dbSDimitry Andric 
1725ffd83dbSDimitry Andric   void writeTo(uint8_t *buf) const override { write32le(buf, characteristics); }
1735ffd83dbSDimitry Andric 
1745ffd83dbSDimitry Andric   uint32_t characteristics = 0;
1755ffd83dbSDimitry Andric };
1765ffd83dbSDimitry Andric 
1770b57cec5SDimitry Andric // PartialSection represents a group of chunks that contribute to an
1780b57cec5SDimitry Andric // OutputSection. Collating a collection of PartialSections of same name and
1790b57cec5SDimitry Andric // characteristics constitutes the OutputSection.
1800b57cec5SDimitry Andric class PartialSectionKey {
1810b57cec5SDimitry Andric public:
1820b57cec5SDimitry Andric   StringRef name;
1830b57cec5SDimitry Andric   unsigned characteristics;
1840b57cec5SDimitry Andric 
1850b57cec5SDimitry Andric   bool operator<(const PartialSectionKey &other) const {
1860b57cec5SDimitry Andric     int c = name.compare(other.name);
1870b57cec5SDimitry Andric     if (c == 1)
1880b57cec5SDimitry Andric       return false;
1890b57cec5SDimitry Andric     if (c == 0)
1900b57cec5SDimitry Andric       return characteristics < other.characteristics;
1910b57cec5SDimitry Andric     return true;
1920b57cec5SDimitry Andric   }
1930b57cec5SDimitry Andric };
1940b57cec5SDimitry Andric 
1950b57cec5SDimitry Andric // The writer writes a SymbolTable result to a file.
1960b57cec5SDimitry Andric class Writer {
1970b57cec5SDimitry Andric public:
198349cc55cSDimitry Andric   Writer(COFFLinkerContext &c) : buffer(errorHandler().outputBuffer), ctx(c) {}
1990b57cec5SDimitry Andric   void run();
2000b57cec5SDimitry Andric 
2010b57cec5SDimitry Andric private:
2020b57cec5SDimitry Andric   void createSections();
2030b57cec5SDimitry Andric   void createMiscChunks();
2040b57cec5SDimitry Andric   void createImportTables();
2050b57cec5SDimitry Andric   void appendImportThunks();
2060b57cec5SDimitry Andric   void locateImportTables();
2070b57cec5SDimitry Andric   void createExportTable();
2080b57cec5SDimitry Andric   void mergeSections();
2090b57cec5SDimitry Andric   void removeUnusedSections();
2100b57cec5SDimitry Andric   void assignAddresses();
2110b57cec5SDimitry Andric   void finalizeAddresses();
2120b57cec5SDimitry Andric   void removeEmptySections();
2130b57cec5SDimitry Andric   void assignOutputSectionIndices();
2140b57cec5SDimitry Andric   void createSymbolAndStringTable();
2150b57cec5SDimitry Andric   void openFile(StringRef outputPath);
2160b57cec5SDimitry Andric   template <typename PEHeaderTy> void writeHeader();
2170b57cec5SDimitry Andric   void createSEHTable();
2180b57cec5SDimitry Andric   void createRuntimePseudoRelocs();
2190b57cec5SDimitry Andric   void insertCtorDtorSymbols();
2200b57cec5SDimitry Andric   void createGuardCFTables();
2210b57cec5SDimitry Andric   void markSymbolsForRVATable(ObjFile *file,
2220b57cec5SDimitry Andric                               ArrayRef<SectionChunk *> symIdxChunks,
2230b57cec5SDimitry Andric                               SymbolRVASet &tableSymbols);
224e8d8bef9SDimitry Andric   void getSymbolsFromSections(ObjFile *file,
225e8d8bef9SDimitry Andric                               ArrayRef<SectionChunk *> symIdxChunks,
226e8d8bef9SDimitry Andric                               std::vector<Symbol *> &symbols);
2270b57cec5SDimitry Andric   void maybeAddRVATable(SymbolRVASet tableSymbols, StringRef tableSym,
228fe6060f1SDimitry Andric                         StringRef countSym, bool hasFlag=false);
2290b57cec5SDimitry Andric   void setSectionPermissions();
2300b57cec5SDimitry Andric   void writeSections();
2310b57cec5SDimitry Andric   void writeBuildId();
232e8d8bef9SDimitry Andric   void sortSections();
2330b57cec5SDimitry Andric   void sortExceptionTable();
2340b57cec5SDimitry Andric   void sortCRTSectionChunks(std::vector<Chunk *> &chunks);
2350b57cec5SDimitry Andric   void addSyntheticIdata();
2360b57cec5SDimitry Andric   void fixPartialSectionChars(StringRef name, uint32_t chars);
2370b57cec5SDimitry Andric   bool fixGnuImportChunks();
238e8d8bef9SDimitry Andric   void fixTlsAlignment();
2390b57cec5SDimitry Andric   PartialSection *createPartialSection(StringRef name, uint32_t outChars);
2400b57cec5SDimitry Andric   PartialSection *findPartialSection(StringRef name, uint32_t outChars);
2410b57cec5SDimitry Andric 
2420b57cec5SDimitry Andric   llvm::Optional<coff_symbol16> createSymbol(Defined *d);
2430b57cec5SDimitry Andric   size_t addEntryToStringTable(StringRef str);
2440b57cec5SDimitry Andric 
2450b57cec5SDimitry Andric   OutputSection *findSection(StringRef name);
2460b57cec5SDimitry Andric   void addBaserels();
2470b57cec5SDimitry Andric   void addBaserelBlocks(std::vector<Baserel> &v);
2480b57cec5SDimitry Andric 
2490b57cec5SDimitry Andric   uint32_t getSizeOfInitializedData();
2500b57cec5SDimitry Andric 
2510b57cec5SDimitry Andric   std::unique_ptr<FileOutputBuffer> &buffer;
2520b57cec5SDimitry Andric   std::map<PartialSectionKey, PartialSection *> partialSections;
2530b57cec5SDimitry Andric   std::vector<char> strtab;
2540b57cec5SDimitry Andric   std::vector<llvm::object::coff_symbol16> outputSymtab;
2550b57cec5SDimitry Andric   IdataContents idata;
2560b57cec5SDimitry Andric   Chunk *importTableStart = nullptr;
2570b57cec5SDimitry Andric   uint64_t importTableSize = 0;
25885868e8aSDimitry Andric   Chunk *edataStart = nullptr;
25985868e8aSDimitry Andric   Chunk *edataEnd = nullptr;
2600b57cec5SDimitry Andric   Chunk *iatStart = nullptr;
2610b57cec5SDimitry Andric   uint64_t iatSize = 0;
2620b57cec5SDimitry Andric   DelayLoadContents delayIdata;
2630b57cec5SDimitry Andric   EdataContents edata;
2640b57cec5SDimitry Andric   bool setNoSEHCharacteristic = false;
265e8d8bef9SDimitry Andric   uint32_t tlsAlignment = 0;
2660b57cec5SDimitry Andric 
2670b57cec5SDimitry Andric   DebugDirectoryChunk *debugDirectory = nullptr;
2685ffd83dbSDimitry Andric   std::vector<std::pair<COFF::DebugType, Chunk *>> debugRecords;
2690b57cec5SDimitry Andric   CVDebugRecordChunk *buildId = nullptr;
2700b57cec5SDimitry Andric   ArrayRef<uint8_t> sectionTable;
2710b57cec5SDimitry Andric 
2720b57cec5SDimitry Andric   uint64_t fileSize;
2730b57cec5SDimitry Andric   uint32_t pointerToSymbolTable = 0;
2740b57cec5SDimitry Andric   uint64_t sizeOfImage;
2750b57cec5SDimitry Andric   uint64_t sizeOfHeaders;
2760b57cec5SDimitry Andric 
2770b57cec5SDimitry Andric   OutputSection *textSec;
2780b57cec5SDimitry Andric   OutputSection *rdataSec;
2790b57cec5SDimitry Andric   OutputSection *buildidSec;
2800b57cec5SDimitry Andric   OutputSection *dataSec;
2810b57cec5SDimitry Andric   OutputSection *pdataSec;
2820b57cec5SDimitry Andric   OutputSection *idataSec;
2830b57cec5SDimitry Andric   OutputSection *edataSec;
2840b57cec5SDimitry Andric   OutputSection *didatSec;
2850b57cec5SDimitry Andric   OutputSection *rsrcSec;
2860b57cec5SDimitry Andric   OutputSection *relocSec;
2870b57cec5SDimitry Andric   OutputSection *ctorsSec;
2880b57cec5SDimitry Andric   OutputSection *dtorsSec;
2890b57cec5SDimitry Andric 
2900b57cec5SDimitry Andric   // The first and last .pdata sections in the output file.
2910b57cec5SDimitry Andric   //
2920b57cec5SDimitry Andric   // We need to keep track of the location of .pdata in whichever section it
2930b57cec5SDimitry Andric   // gets merged into so that we can sort its contents and emit a correct data
2940b57cec5SDimitry Andric   // directory entry for the exception table. This is also the case for some
2950b57cec5SDimitry Andric   // other sections (such as .edata) but because the contents of those sections
2960b57cec5SDimitry Andric   // are entirely linker-generated we can keep track of their locations using
2970b57cec5SDimitry Andric   // the chunks that the linker creates. All .pdata chunks come from input
2980b57cec5SDimitry Andric   // files, so we need to keep track of them separately.
2990b57cec5SDimitry Andric   Chunk *firstPdata = nullptr;
3000b57cec5SDimitry Andric   Chunk *lastPdata;
301349cc55cSDimitry Andric 
302349cc55cSDimitry Andric   COFFLinkerContext &ctx;
3030b57cec5SDimitry Andric };
3040b57cec5SDimitry Andric } // anonymous namespace
3050b57cec5SDimitry Andric 
306349cc55cSDimitry Andric void lld::coff::writeResult(COFFLinkerContext &ctx) { Writer(ctx).run(); }
3070b57cec5SDimitry Andric 
3080b57cec5SDimitry Andric void OutputSection::addChunk(Chunk *c) {
3090b57cec5SDimitry Andric   chunks.push_back(c);
3100b57cec5SDimitry Andric }
3110b57cec5SDimitry Andric 
3120b57cec5SDimitry Andric void OutputSection::insertChunkAtStart(Chunk *c) {
3130b57cec5SDimitry Andric   chunks.insert(chunks.begin(), c);
3140b57cec5SDimitry Andric }
3150b57cec5SDimitry Andric 
3160b57cec5SDimitry Andric void OutputSection::setPermissions(uint32_t c) {
3170b57cec5SDimitry Andric   header.Characteristics &= ~permMask;
3180b57cec5SDimitry Andric   header.Characteristics |= c;
3190b57cec5SDimitry Andric }
3200b57cec5SDimitry Andric 
3210b57cec5SDimitry Andric void OutputSection::merge(OutputSection *other) {
3220b57cec5SDimitry Andric   chunks.insert(chunks.end(), other->chunks.begin(), other->chunks.end());
3230b57cec5SDimitry Andric   other->chunks.clear();
3240b57cec5SDimitry Andric   contribSections.insert(contribSections.end(), other->contribSections.begin(),
3250b57cec5SDimitry Andric                          other->contribSections.end());
3260b57cec5SDimitry Andric   other->contribSections.clear();
3270b57cec5SDimitry Andric }
3280b57cec5SDimitry Andric 
3290b57cec5SDimitry Andric // Write the section header to a given buffer.
3300b57cec5SDimitry Andric void OutputSection::writeHeaderTo(uint8_t *buf) {
3310b57cec5SDimitry Andric   auto *hdr = reinterpret_cast<coff_section *>(buf);
3320b57cec5SDimitry Andric   *hdr = header;
3330b57cec5SDimitry Andric   if (stringTableOff) {
3340b57cec5SDimitry Andric     // If name is too long, write offset into the string table as a name.
3350b57cec5SDimitry Andric     sprintf(hdr->Name, "/%d", stringTableOff);
3360b57cec5SDimitry Andric   } else {
3370b57cec5SDimitry Andric     assert(!config->debug || name.size() <= COFF::NameSize ||
3380b57cec5SDimitry Andric            (hdr->Characteristics & IMAGE_SCN_MEM_DISCARDABLE) == 0);
3390b57cec5SDimitry Andric     strncpy(hdr->Name, name.data(),
3400b57cec5SDimitry Andric             std::min(name.size(), (size_t)COFF::NameSize));
3410b57cec5SDimitry Andric   }
3420b57cec5SDimitry Andric }
3430b57cec5SDimitry Andric 
3440b57cec5SDimitry Andric void OutputSection::addContributingPartialSection(PartialSection *sec) {
3450b57cec5SDimitry Andric   contribSections.push_back(sec);
3460b57cec5SDimitry Andric }
3470b57cec5SDimitry Andric 
3480b57cec5SDimitry Andric // Check whether the target address S is in range from a relocation
3490b57cec5SDimitry Andric // of type relType at address P.
3500b57cec5SDimitry Andric static bool isInRange(uint16_t relType, uint64_t s, uint64_t p, int margin) {
3510b57cec5SDimitry Andric   if (config->machine == ARMNT) {
3520b57cec5SDimitry Andric     int64_t diff = AbsoluteDifference(s, p + 4) + margin;
3530b57cec5SDimitry Andric     switch (relType) {
3540b57cec5SDimitry Andric     case IMAGE_REL_ARM_BRANCH20T:
3550b57cec5SDimitry Andric       return isInt<21>(diff);
3560b57cec5SDimitry Andric     case IMAGE_REL_ARM_BRANCH24T:
3570b57cec5SDimitry Andric     case IMAGE_REL_ARM_BLX23T:
3580b57cec5SDimitry Andric       return isInt<25>(diff);
3590b57cec5SDimitry Andric     default:
3600b57cec5SDimitry Andric       return true;
3610b57cec5SDimitry Andric     }
3620b57cec5SDimitry Andric   } else if (config->machine == ARM64) {
3630b57cec5SDimitry Andric     int64_t diff = AbsoluteDifference(s, p) + margin;
3640b57cec5SDimitry Andric     switch (relType) {
3650b57cec5SDimitry Andric     case IMAGE_REL_ARM64_BRANCH26:
3660b57cec5SDimitry Andric       return isInt<28>(diff);
3670b57cec5SDimitry Andric     case IMAGE_REL_ARM64_BRANCH19:
3680b57cec5SDimitry Andric       return isInt<21>(diff);
3690b57cec5SDimitry Andric     case IMAGE_REL_ARM64_BRANCH14:
3700b57cec5SDimitry Andric       return isInt<16>(diff);
3710b57cec5SDimitry Andric     default:
3720b57cec5SDimitry Andric       return true;
3730b57cec5SDimitry Andric     }
3740b57cec5SDimitry Andric   } else {
3750b57cec5SDimitry Andric     llvm_unreachable("Unexpected architecture");
3760b57cec5SDimitry Andric   }
3770b57cec5SDimitry Andric }
3780b57cec5SDimitry Andric 
3790b57cec5SDimitry Andric // Return the last thunk for the given target if it is in range,
3800b57cec5SDimitry Andric // or create a new one.
3810b57cec5SDimitry Andric static std::pair<Defined *, bool>
3820b57cec5SDimitry Andric getThunk(DenseMap<uint64_t, Defined *> &lastThunks, Defined *target, uint64_t p,
3830b57cec5SDimitry Andric          uint16_t type, int margin) {
3840b57cec5SDimitry Andric   Defined *&lastThunk = lastThunks[target->getRVA()];
3850b57cec5SDimitry Andric   if (lastThunk && isInRange(type, lastThunk->getRVA(), p, margin))
3860b57cec5SDimitry Andric     return {lastThunk, false};
3870b57cec5SDimitry Andric   Chunk *c;
3880b57cec5SDimitry Andric   switch (config->machine) {
3890b57cec5SDimitry Andric   case ARMNT:
3900b57cec5SDimitry Andric     c = make<RangeExtensionThunkARM>(target);
3910b57cec5SDimitry Andric     break;
3920b57cec5SDimitry Andric   case ARM64:
3930b57cec5SDimitry Andric     c = make<RangeExtensionThunkARM64>(target);
3940b57cec5SDimitry Andric     break;
3950b57cec5SDimitry Andric   default:
3960b57cec5SDimitry Andric     llvm_unreachable("Unexpected architecture");
3970b57cec5SDimitry Andric   }
3980b57cec5SDimitry Andric   Defined *d = make<DefinedSynthetic>("", c);
3990b57cec5SDimitry Andric   lastThunk = d;
4000b57cec5SDimitry Andric   return {d, true};
4010b57cec5SDimitry Andric }
4020b57cec5SDimitry Andric 
4030b57cec5SDimitry Andric // This checks all relocations, and for any relocation which isn't in range
4040b57cec5SDimitry Andric // it adds a thunk after the section chunk that contains the relocation.
4050b57cec5SDimitry Andric // If the latest thunk for the specific target is in range, that is used
4060b57cec5SDimitry Andric // instead of creating a new thunk. All range checks are done with the
4070b57cec5SDimitry Andric // specified margin, to make sure that relocations that originally are in
4080b57cec5SDimitry Andric // range, but only barely, also get thunks - in case other added thunks makes
4090b57cec5SDimitry Andric // the target go out of range.
4100b57cec5SDimitry Andric //
4110b57cec5SDimitry Andric // After adding thunks, we verify that all relocations are in range (with
4120b57cec5SDimitry Andric // no extra margin requirements). If this failed, we restart (throwing away
4130b57cec5SDimitry Andric // the previously created thunks) and retry with a wider margin.
4140b57cec5SDimitry Andric static bool createThunks(OutputSection *os, int margin) {
4150b57cec5SDimitry Andric   bool addressesChanged = false;
4160b57cec5SDimitry Andric   DenseMap<uint64_t, Defined *> lastThunks;
4170b57cec5SDimitry Andric   DenseMap<std::pair<ObjFile *, Defined *>, uint32_t> thunkSymtabIndices;
4180b57cec5SDimitry Andric   size_t thunksSize = 0;
4190b57cec5SDimitry Andric   // Recheck Chunks.size() each iteration, since we can insert more
4200b57cec5SDimitry Andric   // elements into it.
4210b57cec5SDimitry Andric   for (size_t i = 0; i != os->chunks.size(); ++i) {
4220b57cec5SDimitry Andric     SectionChunk *sc = dyn_cast_or_null<SectionChunk>(os->chunks[i]);
4230b57cec5SDimitry Andric     if (!sc)
4240b57cec5SDimitry Andric       continue;
4250b57cec5SDimitry Andric     size_t thunkInsertionSpot = i + 1;
4260b57cec5SDimitry Andric 
4270b57cec5SDimitry Andric     // Try to get a good enough estimate of where new thunks will be placed.
4280b57cec5SDimitry Andric     // Offset this by the size of the new thunks added so far, to make the
4290b57cec5SDimitry Andric     // estimate slightly better.
4300b57cec5SDimitry Andric     size_t thunkInsertionRVA = sc->getRVA() + sc->getSize() + thunksSize;
4310b57cec5SDimitry Andric     ObjFile *file = sc->file;
4320b57cec5SDimitry Andric     std::vector<std::pair<uint32_t, uint32_t>> relocReplacements;
4330b57cec5SDimitry Andric     ArrayRef<coff_relocation> originalRelocs =
4340b57cec5SDimitry Andric         file->getCOFFObj()->getRelocations(sc->header);
4350b57cec5SDimitry Andric     for (size_t j = 0, e = originalRelocs.size(); j < e; ++j) {
4360b57cec5SDimitry Andric       const coff_relocation &rel = originalRelocs[j];
4370b57cec5SDimitry Andric       Symbol *relocTarget = file->getSymbol(rel.SymbolTableIndex);
4380b57cec5SDimitry Andric 
4390b57cec5SDimitry Andric       // The estimate of the source address P should be pretty accurate,
4400b57cec5SDimitry Andric       // but we don't know whether the target Symbol address should be
4410b57cec5SDimitry Andric       // offset by thunksSize or not (or by some of thunksSize but not all of
4420b57cec5SDimitry Andric       // it), giving us some uncertainty once we have added one thunk.
4430b57cec5SDimitry Andric       uint64_t p = sc->getRVA() + rel.VirtualAddress + thunksSize;
4440b57cec5SDimitry Andric 
4450b57cec5SDimitry Andric       Defined *sym = dyn_cast_or_null<Defined>(relocTarget);
4460b57cec5SDimitry Andric       if (!sym)
4470b57cec5SDimitry Andric         continue;
4480b57cec5SDimitry Andric 
4490b57cec5SDimitry Andric       uint64_t s = sym->getRVA();
4500b57cec5SDimitry Andric 
4510b57cec5SDimitry Andric       if (isInRange(rel.Type, s, p, margin))
4520b57cec5SDimitry Andric         continue;
4530b57cec5SDimitry Andric 
4540b57cec5SDimitry Andric       // If the target isn't in range, hook it up to an existing or new
4550b57cec5SDimitry Andric       // thunk.
4560b57cec5SDimitry Andric       Defined *thunk;
4570b57cec5SDimitry Andric       bool wasNew;
4580b57cec5SDimitry Andric       std::tie(thunk, wasNew) = getThunk(lastThunks, sym, p, rel.Type, margin);
4590b57cec5SDimitry Andric       if (wasNew) {
4600b57cec5SDimitry Andric         Chunk *thunkChunk = thunk->getChunk();
4610b57cec5SDimitry Andric         thunkChunk->setRVA(
4620b57cec5SDimitry Andric             thunkInsertionRVA); // Estimate of where it will be located.
4630b57cec5SDimitry Andric         os->chunks.insert(os->chunks.begin() + thunkInsertionSpot, thunkChunk);
4640b57cec5SDimitry Andric         thunkInsertionSpot++;
4650b57cec5SDimitry Andric         thunksSize += thunkChunk->getSize();
4660b57cec5SDimitry Andric         thunkInsertionRVA += thunkChunk->getSize();
4670b57cec5SDimitry Andric         addressesChanged = true;
4680b57cec5SDimitry Andric       }
4690b57cec5SDimitry Andric 
4700b57cec5SDimitry Andric       // To redirect the relocation, add a symbol to the parent object file's
4710b57cec5SDimitry Andric       // symbol table, and replace the relocation symbol table index with the
4720b57cec5SDimitry Andric       // new index.
4730b57cec5SDimitry Andric       auto insertion = thunkSymtabIndices.insert({{file, thunk}, ~0U});
4740b57cec5SDimitry Andric       uint32_t &thunkSymbolIndex = insertion.first->second;
4750b57cec5SDimitry Andric       if (insertion.second)
4760b57cec5SDimitry Andric         thunkSymbolIndex = file->addRangeThunkSymbol(thunk);
4770b57cec5SDimitry Andric       relocReplacements.push_back({j, thunkSymbolIndex});
4780b57cec5SDimitry Andric     }
4790b57cec5SDimitry Andric 
4800b57cec5SDimitry Andric     // Get a writable copy of this section's relocations so they can be
4810b57cec5SDimitry Andric     // modified. If the relocations point into the object file, allocate new
4820b57cec5SDimitry Andric     // memory. Otherwise, this must be previously allocated memory that can be
4830b57cec5SDimitry Andric     // modified in place.
4840b57cec5SDimitry Andric     ArrayRef<coff_relocation> curRelocs = sc->getRelocs();
4850b57cec5SDimitry Andric     MutableArrayRef<coff_relocation> newRelocs;
4860b57cec5SDimitry Andric     if (originalRelocs.data() == curRelocs.data()) {
4870b57cec5SDimitry Andric       newRelocs = makeMutableArrayRef(
48804eeddc0SDimitry Andric           bAlloc().Allocate<coff_relocation>(originalRelocs.size()),
4890b57cec5SDimitry Andric           originalRelocs.size());
4900b57cec5SDimitry Andric     } else {
4910b57cec5SDimitry Andric       newRelocs = makeMutableArrayRef(
4920b57cec5SDimitry Andric           const_cast<coff_relocation *>(curRelocs.data()), curRelocs.size());
4930b57cec5SDimitry Andric     }
4940b57cec5SDimitry Andric 
4950b57cec5SDimitry Andric     // Copy each relocation, but replace the symbol table indices which need
4960b57cec5SDimitry Andric     // thunks.
4970b57cec5SDimitry Andric     auto nextReplacement = relocReplacements.begin();
4980b57cec5SDimitry Andric     auto endReplacement = relocReplacements.end();
4990b57cec5SDimitry Andric     for (size_t i = 0, e = originalRelocs.size(); i != e; ++i) {
5000b57cec5SDimitry Andric       newRelocs[i] = originalRelocs[i];
5010b57cec5SDimitry Andric       if (nextReplacement != endReplacement && nextReplacement->first == i) {
5020b57cec5SDimitry Andric         newRelocs[i].SymbolTableIndex = nextReplacement->second;
5030b57cec5SDimitry Andric         ++nextReplacement;
5040b57cec5SDimitry Andric       }
5050b57cec5SDimitry Andric     }
5060b57cec5SDimitry Andric 
5070b57cec5SDimitry Andric     sc->setRelocs(newRelocs);
5080b57cec5SDimitry Andric   }
5090b57cec5SDimitry Andric   return addressesChanged;
5100b57cec5SDimitry Andric }
5110b57cec5SDimitry Andric 
5120b57cec5SDimitry Andric // Verify that all relocations are in range, with no extra margin requirements.
5130b57cec5SDimitry Andric static bool verifyRanges(const std::vector<Chunk *> chunks) {
5140b57cec5SDimitry Andric   for (Chunk *c : chunks) {
5150b57cec5SDimitry Andric     SectionChunk *sc = dyn_cast_or_null<SectionChunk>(c);
5160b57cec5SDimitry Andric     if (!sc)
5170b57cec5SDimitry Andric       continue;
5180b57cec5SDimitry Andric 
5190b57cec5SDimitry Andric     ArrayRef<coff_relocation> relocs = sc->getRelocs();
5200b57cec5SDimitry Andric     for (size_t j = 0, e = relocs.size(); j < e; ++j) {
5210b57cec5SDimitry Andric       const coff_relocation &rel = relocs[j];
5220b57cec5SDimitry Andric       Symbol *relocTarget = sc->file->getSymbol(rel.SymbolTableIndex);
5230b57cec5SDimitry Andric 
5240b57cec5SDimitry Andric       Defined *sym = dyn_cast_or_null<Defined>(relocTarget);
5250b57cec5SDimitry Andric       if (!sym)
5260b57cec5SDimitry Andric         continue;
5270b57cec5SDimitry Andric 
5280b57cec5SDimitry Andric       uint64_t p = sc->getRVA() + rel.VirtualAddress;
5290b57cec5SDimitry Andric       uint64_t s = sym->getRVA();
5300b57cec5SDimitry Andric 
5310b57cec5SDimitry Andric       if (!isInRange(rel.Type, s, p, 0))
5320b57cec5SDimitry Andric         return false;
5330b57cec5SDimitry Andric     }
5340b57cec5SDimitry Andric   }
5350b57cec5SDimitry Andric   return true;
5360b57cec5SDimitry Andric }
5370b57cec5SDimitry Andric 
5380b57cec5SDimitry Andric // Assign addresses and add thunks if necessary.
5390b57cec5SDimitry Andric void Writer::finalizeAddresses() {
5400b57cec5SDimitry Andric   assignAddresses();
5410b57cec5SDimitry Andric   if (config->machine != ARMNT && config->machine != ARM64)
5420b57cec5SDimitry Andric     return;
5430b57cec5SDimitry Andric 
5440b57cec5SDimitry Andric   size_t origNumChunks = 0;
545349cc55cSDimitry Andric   for (OutputSection *sec : ctx.outputSections) {
5460b57cec5SDimitry Andric     sec->origChunks = sec->chunks;
5470b57cec5SDimitry Andric     origNumChunks += sec->chunks.size();
5480b57cec5SDimitry Andric   }
5490b57cec5SDimitry Andric 
5500b57cec5SDimitry Andric   int pass = 0;
5510b57cec5SDimitry Andric   int margin = 1024 * 100;
5520b57cec5SDimitry Andric   while (true) {
5530b57cec5SDimitry Andric     // First check whether we need thunks at all, or if the previous pass of
5540b57cec5SDimitry Andric     // adding them turned out ok.
5550b57cec5SDimitry Andric     bool rangesOk = true;
5560b57cec5SDimitry Andric     size_t numChunks = 0;
557349cc55cSDimitry Andric     for (OutputSection *sec : ctx.outputSections) {
5580b57cec5SDimitry Andric       if (!verifyRanges(sec->chunks)) {
5590b57cec5SDimitry Andric         rangesOk = false;
5600b57cec5SDimitry Andric         break;
5610b57cec5SDimitry Andric       }
5620b57cec5SDimitry Andric       numChunks += sec->chunks.size();
5630b57cec5SDimitry Andric     }
5640b57cec5SDimitry Andric     if (rangesOk) {
5650b57cec5SDimitry Andric       if (pass > 0)
5660b57cec5SDimitry Andric         log("Added " + Twine(numChunks - origNumChunks) + " thunks with " +
5670b57cec5SDimitry Andric             "margin " + Twine(margin) + " in " + Twine(pass) + " passes");
5680b57cec5SDimitry Andric       return;
5690b57cec5SDimitry Andric     }
5700b57cec5SDimitry Andric 
5710b57cec5SDimitry Andric     if (pass >= 10)
5720b57cec5SDimitry Andric       fatal("adding thunks hasn't converged after " + Twine(pass) + " passes");
5730b57cec5SDimitry Andric 
5740b57cec5SDimitry Andric     if (pass > 0) {
5750b57cec5SDimitry Andric       // If the previous pass didn't work out, reset everything back to the
5760b57cec5SDimitry Andric       // original conditions before retrying with a wider margin. This should
5770b57cec5SDimitry Andric       // ideally never happen under real circumstances.
578349cc55cSDimitry Andric       for (OutputSection *sec : ctx.outputSections)
5790b57cec5SDimitry Andric         sec->chunks = sec->origChunks;
5800b57cec5SDimitry Andric       margin *= 2;
5810b57cec5SDimitry Andric     }
5820b57cec5SDimitry Andric 
5830b57cec5SDimitry Andric     // Try adding thunks everywhere where it is needed, with a margin
5840b57cec5SDimitry Andric     // to avoid things going out of range due to the added thunks.
5850b57cec5SDimitry Andric     bool addressesChanged = false;
586349cc55cSDimitry Andric     for (OutputSection *sec : ctx.outputSections)
5870b57cec5SDimitry Andric       addressesChanged |= createThunks(sec, margin);
5880b57cec5SDimitry Andric     // If the verification above thought we needed thunks, we should have
5890b57cec5SDimitry Andric     // added some.
5900b57cec5SDimitry Andric     assert(addressesChanged);
591fe6060f1SDimitry Andric     (void)addressesChanged;
5920b57cec5SDimitry Andric 
5930b57cec5SDimitry Andric     // Recalculate the layout for the whole image (and verify the ranges at
5940b57cec5SDimitry Andric     // the start of the next round).
5950b57cec5SDimitry Andric     assignAddresses();
5960b57cec5SDimitry Andric 
5970b57cec5SDimitry Andric     pass++;
5980b57cec5SDimitry Andric   }
5990b57cec5SDimitry Andric }
6000b57cec5SDimitry Andric 
6010b57cec5SDimitry Andric // The main function of the writer.
6020b57cec5SDimitry Andric void Writer::run() {
603349cc55cSDimitry Andric   ScopedTimer t1(ctx.codeLayoutTimer);
6040b57cec5SDimitry Andric 
6050b57cec5SDimitry Andric   createImportTables();
6060b57cec5SDimitry Andric   createSections();
6070b57cec5SDimitry Andric   appendImportThunks();
608e8d8bef9SDimitry Andric   // Import thunks must be added before the Control Flow Guard tables are added.
609e8d8bef9SDimitry Andric   createMiscChunks();
6100b57cec5SDimitry Andric   createExportTable();
6110b57cec5SDimitry Andric   mergeSections();
6120b57cec5SDimitry Andric   removeUnusedSections();
6130b57cec5SDimitry Andric   finalizeAddresses();
6140b57cec5SDimitry Andric   removeEmptySections();
6150b57cec5SDimitry Andric   assignOutputSectionIndices();
6160b57cec5SDimitry Andric   setSectionPermissions();
6170b57cec5SDimitry Andric   createSymbolAndStringTable();
6180b57cec5SDimitry Andric 
6190b57cec5SDimitry Andric   if (fileSize > UINT32_MAX)
6200b57cec5SDimitry Andric     fatal("image size (" + Twine(fileSize) + ") " +
6210b57cec5SDimitry Andric         "exceeds maximum allowable size (" + Twine(UINT32_MAX) + ")");
6220b57cec5SDimitry Andric 
6230b57cec5SDimitry Andric   openFile(config->outputFile);
6240b57cec5SDimitry Andric   if (config->is64()) {
6250b57cec5SDimitry Andric     writeHeader<pe32plus_header>();
6260b57cec5SDimitry Andric   } else {
6270b57cec5SDimitry Andric     writeHeader<pe32_header>();
6280b57cec5SDimitry Andric   }
6290b57cec5SDimitry Andric   writeSections();
6300b57cec5SDimitry Andric   sortExceptionTable();
6310b57cec5SDimitry Andric 
632e8d8bef9SDimitry Andric   // Fix up the alignment in the TLS Directory's characteristic field,
633e8d8bef9SDimitry Andric   // if a specific alignment value is needed
634e8d8bef9SDimitry Andric   if (tlsAlignment)
635e8d8bef9SDimitry Andric     fixTlsAlignment();
636e8d8bef9SDimitry Andric 
6370b57cec5SDimitry Andric   t1.stop();
6380b57cec5SDimitry Andric 
6390b57cec5SDimitry Andric   if (!config->pdbPath.empty() && config->debug) {
6400b57cec5SDimitry Andric     assert(buildId);
641349cc55cSDimitry Andric     createPDB(ctx, sectionTable, buildId->buildId);
6420b57cec5SDimitry Andric   }
6430b57cec5SDimitry Andric   writeBuildId();
6440b57cec5SDimitry Andric 
645349cc55cSDimitry Andric   writeLLDMapFile(ctx);
646349cc55cSDimitry Andric   writeMapFile(ctx);
6470b57cec5SDimitry Andric 
6480b57cec5SDimitry Andric   if (errorCount())
6490b57cec5SDimitry Andric     return;
6500b57cec5SDimitry Andric 
651349cc55cSDimitry Andric   ScopedTimer t2(ctx.outputCommitTimer);
6520b57cec5SDimitry Andric   if (auto e = buffer->commit())
6530b57cec5SDimitry Andric     fatal("failed to write the output file: " + toString(std::move(e)));
6540b57cec5SDimitry Andric }
6550b57cec5SDimitry Andric 
6560b57cec5SDimitry Andric static StringRef getOutputSectionName(StringRef name) {
6570b57cec5SDimitry Andric   StringRef s = name.split('$').first;
6580b57cec5SDimitry Andric 
6590b57cec5SDimitry Andric   // Treat a later period as a separator for MinGW, for sections like
6600b57cec5SDimitry Andric   // ".ctors.01234".
6610b57cec5SDimitry Andric   return s.substr(0, s.find('.', 1));
6620b57cec5SDimitry Andric }
6630b57cec5SDimitry Andric 
6640b57cec5SDimitry Andric // For /order.
6650b57cec5SDimitry Andric static void sortBySectionOrder(std::vector<Chunk *> &chunks) {
6660b57cec5SDimitry Andric   auto getPriority = [](const Chunk *c) {
6670b57cec5SDimitry Andric     if (auto *sec = dyn_cast<SectionChunk>(c))
6680b57cec5SDimitry Andric       if (sec->sym)
6690b57cec5SDimitry Andric         return config->order.lookup(sec->sym->getName());
6700b57cec5SDimitry Andric     return 0;
6710b57cec5SDimitry Andric   };
6720b57cec5SDimitry Andric 
6730b57cec5SDimitry Andric   llvm::stable_sort(chunks, [=](const Chunk *a, const Chunk *b) {
6740b57cec5SDimitry Andric     return getPriority(a) < getPriority(b);
6750b57cec5SDimitry Andric   });
6760b57cec5SDimitry Andric }
6770b57cec5SDimitry Andric 
6780b57cec5SDimitry Andric // Change the characteristics of existing PartialSections that belong to the
6790b57cec5SDimitry Andric // section Name to Chars.
6800b57cec5SDimitry Andric void Writer::fixPartialSectionChars(StringRef name, uint32_t chars) {
6810b57cec5SDimitry Andric   for (auto it : partialSections) {
6820b57cec5SDimitry Andric     PartialSection *pSec = it.second;
6830b57cec5SDimitry Andric     StringRef curName = pSec->name;
6840b57cec5SDimitry Andric     if (!curName.consume_front(name) ||
6850b57cec5SDimitry Andric         (!curName.empty() && !curName.startswith("$")))
6860b57cec5SDimitry Andric       continue;
6870b57cec5SDimitry Andric     if (pSec->characteristics == chars)
6880b57cec5SDimitry Andric       continue;
6890b57cec5SDimitry Andric     PartialSection *destSec = createPartialSection(pSec->name, chars);
6900b57cec5SDimitry Andric     destSec->chunks.insert(destSec->chunks.end(), pSec->chunks.begin(),
6910b57cec5SDimitry Andric                            pSec->chunks.end());
6920b57cec5SDimitry Andric     pSec->chunks.clear();
6930b57cec5SDimitry Andric   }
6940b57cec5SDimitry Andric }
6950b57cec5SDimitry Andric 
6960b57cec5SDimitry Andric // Sort concrete section chunks from GNU import libraries.
6970b57cec5SDimitry Andric //
6980b57cec5SDimitry Andric // GNU binutils doesn't use short import files, but instead produces import
6990b57cec5SDimitry Andric // libraries that consist of object files, with section chunks for the .idata$*
7000b57cec5SDimitry Andric // sections. These are linked just as regular static libraries. Each import
7010b57cec5SDimitry Andric // library consists of one header object, one object file for every imported
7020b57cec5SDimitry Andric // symbol, and one trailer object. In order for the .idata tables/lists to
7030b57cec5SDimitry Andric // be formed correctly, the section chunks within each .idata$* section need
7040b57cec5SDimitry Andric // to be grouped by library, and sorted alphabetically within each library
7050b57cec5SDimitry Andric // (which makes sure the header comes first and the trailer last).
7060b57cec5SDimitry Andric bool Writer::fixGnuImportChunks() {
7070b57cec5SDimitry Andric   uint32_t rdata = IMAGE_SCN_CNT_INITIALIZED_DATA | IMAGE_SCN_MEM_READ;
7080b57cec5SDimitry Andric 
7090b57cec5SDimitry Andric   // Make sure all .idata$* section chunks are mapped as RDATA in order to
7100b57cec5SDimitry Andric   // be sorted into the same sections as our own synthesized .idata chunks.
7110b57cec5SDimitry Andric   fixPartialSectionChars(".idata", rdata);
7120b57cec5SDimitry Andric 
7130b57cec5SDimitry Andric   bool hasIdata = false;
7140b57cec5SDimitry Andric   // Sort all .idata$* chunks, grouping chunks from the same library,
7150b57cec5SDimitry Andric   // with alphabetical ordering of the object fils within a library.
7160b57cec5SDimitry Andric   for (auto it : partialSections) {
7170b57cec5SDimitry Andric     PartialSection *pSec = it.second;
7180b57cec5SDimitry Andric     if (!pSec->name.startswith(".idata"))
7190b57cec5SDimitry Andric       continue;
7200b57cec5SDimitry Andric 
7210b57cec5SDimitry Andric     if (!pSec->chunks.empty())
7220b57cec5SDimitry Andric       hasIdata = true;
7230b57cec5SDimitry Andric     llvm::stable_sort(pSec->chunks, [&](Chunk *s, Chunk *t) {
7240b57cec5SDimitry Andric       SectionChunk *sc1 = dyn_cast_or_null<SectionChunk>(s);
7250b57cec5SDimitry Andric       SectionChunk *sc2 = dyn_cast_or_null<SectionChunk>(t);
7260b57cec5SDimitry Andric       if (!sc1 || !sc2) {
7270b57cec5SDimitry Andric         // if SC1, order them ascending. If SC2 or both null,
7280b57cec5SDimitry Andric         // S is not less than T.
7290b57cec5SDimitry Andric         return sc1 != nullptr;
7300b57cec5SDimitry Andric       }
7310b57cec5SDimitry Andric       // Make a string with "libraryname/objectfile" for sorting, achieving
7320b57cec5SDimitry Andric       // both grouping by library and sorting of objects within a library,
7330b57cec5SDimitry Andric       // at once.
7340b57cec5SDimitry Andric       std::string key1 =
7350b57cec5SDimitry Andric           (sc1->file->parentName + "/" + sc1->file->getName()).str();
7360b57cec5SDimitry Andric       std::string key2 =
7370b57cec5SDimitry Andric           (sc2->file->parentName + "/" + sc2->file->getName()).str();
7380b57cec5SDimitry Andric       return key1 < key2;
7390b57cec5SDimitry Andric     });
7400b57cec5SDimitry Andric   }
7410b57cec5SDimitry Andric   return hasIdata;
7420b57cec5SDimitry Andric }
7430b57cec5SDimitry Andric 
7440b57cec5SDimitry Andric // Add generated idata chunks, for imported symbols and DLLs, and a
7450b57cec5SDimitry Andric // terminator in .idata$2.
7460b57cec5SDimitry Andric void Writer::addSyntheticIdata() {
7470b57cec5SDimitry Andric   uint32_t rdata = IMAGE_SCN_CNT_INITIALIZED_DATA | IMAGE_SCN_MEM_READ;
7480b57cec5SDimitry Andric   idata.create();
7490b57cec5SDimitry Andric 
7500b57cec5SDimitry Andric   // Add the .idata content in the right section groups, to allow
7510b57cec5SDimitry Andric   // chunks from other linked in object files to be grouped together.
7520b57cec5SDimitry Andric   // See Microsoft PE/COFF spec 5.4 for details.
7530b57cec5SDimitry Andric   auto add = [&](StringRef n, std::vector<Chunk *> &v) {
7540b57cec5SDimitry Andric     PartialSection *pSec = createPartialSection(n, rdata);
7550b57cec5SDimitry Andric     pSec->chunks.insert(pSec->chunks.end(), v.begin(), v.end());
7560b57cec5SDimitry Andric   };
7570b57cec5SDimitry Andric 
7580b57cec5SDimitry Andric   // The loader assumes a specific order of data.
7590b57cec5SDimitry Andric   // Add each type in the correct order.
7600b57cec5SDimitry Andric   add(".idata$2", idata.dirs);
7610b57cec5SDimitry Andric   add(".idata$4", idata.lookups);
7620b57cec5SDimitry Andric   add(".idata$5", idata.addresses);
76385868e8aSDimitry Andric   if (!idata.hints.empty())
7640b57cec5SDimitry Andric     add(".idata$6", idata.hints);
7650b57cec5SDimitry Andric   add(".idata$7", idata.dllNames);
7660b57cec5SDimitry Andric }
7670b57cec5SDimitry Andric 
7680b57cec5SDimitry Andric // Locate the first Chunk and size of the import directory list and the
7690b57cec5SDimitry Andric // IAT.
7700b57cec5SDimitry Andric void Writer::locateImportTables() {
7710b57cec5SDimitry Andric   uint32_t rdata = IMAGE_SCN_CNT_INITIALIZED_DATA | IMAGE_SCN_MEM_READ;
7720b57cec5SDimitry Andric 
7730b57cec5SDimitry Andric   if (PartialSection *importDirs = findPartialSection(".idata$2", rdata)) {
7740b57cec5SDimitry Andric     if (!importDirs->chunks.empty())
7750b57cec5SDimitry Andric       importTableStart = importDirs->chunks.front();
7760b57cec5SDimitry Andric     for (Chunk *c : importDirs->chunks)
7770b57cec5SDimitry Andric       importTableSize += c->getSize();
7780b57cec5SDimitry Andric   }
7790b57cec5SDimitry Andric 
7800b57cec5SDimitry Andric   if (PartialSection *importAddresses = findPartialSection(".idata$5", rdata)) {
7810b57cec5SDimitry Andric     if (!importAddresses->chunks.empty())
7820b57cec5SDimitry Andric       iatStart = importAddresses->chunks.front();
7830b57cec5SDimitry Andric     for (Chunk *c : importAddresses->chunks)
7840b57cec5SDimitry Andric       iatSize += c->getSize();
7850b57cec5SDimitry Andric   }
7860b57cec5SDimitry Andric }
7870b57cec5SDimitry Andric 
7880b57cec5SDimitry Andric // Return whether a SectionChunk's suffix (the dollar and any trailing
7890b57cec5SDimitry Andric // suffix) should be removed and sorted into the main suffixless
7900b57cec5SDimitry Andric // PartialSection.
7910b57cec5SDimitry Andric static bool shouldStripSectionSuffix(SectionChunk *sc, StringRef name) {
7920b57cec5SDimitry Andric   // On MinGW, comdat groups are formed by putting the comdat group name
7930b57cec5SDimitry Andric   // after the '$' in the section name. For .eh_frame$<symbol>, that must
7940b57cec5SDimitry Andric   // still be sorted before the .eh_frame trailer from crtend.o, thus just
7950b57cec5SDimitry Andric   // strip the section name trailer. For other sections, such as
7960b57cec5SDimitry Andric   // .tls$$<symbol> (where non-comdat .tls symbols are otherwise stored in
7970b57cec5SDimitry Andric   // ".tls$"), they must be strictly sorted after .tls. And for the
7980b57cec5SDimitry Andric   // hypothetical case of comdat .CRT$XCU, we definitely need to keep the
7990b57cec5SDimitry Andric   // suffix for sorting. Thus, to play it safe, only strip the suffix for
8000b57cec5SDimitry Andric   // the standard sections.
8010b57cec5SDimitry Andric   if (!config->mingw)
8020b57cec5SDimitry Andric     return false;
8030b57cec5SDimitry Andric   if (!sc || !sc->isCOMDAT())
8040b57cec5SDimitry Andric     return false;
8050b57cec5SDimitry Andric   return name.startswith(".text$") || name.startswith(".data$") ||
8060b57cec5SDimitry Andric          name.startswith(".rdata$") || name.startswith(".pdata$") ||
8070b57cec5SDimitry Andric          name.startswith(".xdata$") || name.startswith(".eh_frame$");
8080b57cec5SDimitry Andric }
8090b57cec5SDimitry Andric 
810e8d8bef9SDimitry Andric void Writer::sortSections() {
811e8d8bef9SDimitry Andric   if (!config->callGraphProfile.empty()) {
812349cc55cSDimitry Andric     DenseMap<const SectionChunk *, int> order =
813349cc55cSDimitry Andric         computeCallGraphProfileOrder(ctx);
814e8d8bef9SDimitry Andric     for (auto it : order) {
815e8d8bef9SDimitry Andric       if (DefinedRegular *sym = it.first->sym)
816e8d8bef9SDimitry Andric         config->order[sym->getName()] = it.second;
817e8d8bef9SDimitry Andric     }
818e8d8bef9SDimitry Andric   }
819e8d8bef9SDimitry Andric   if (!config->order.empty())
820e8d8bef9SDimitry Andric     for (auto it : partialSections)
821e8d8bef9SDimitry Andric       sortBySectionOrder(it.second->chunks);
822e8d8bef9SDimitry Andric }
823e8d8bef9SDimitry Andric 
8240b57cec5SDimitry Andric // Create output section objects and add them to OutputSections.
8250b57cec5SDimitry Andric void Writer::createSections() {
8260b57cec5SDimitry Andric   // First, create the builtin sections.
8270b57cec5SDimitry Andric   const uint32_t data = IMAGE_SCN_CNT_INITIALIZED_DATA;
8280b57cec5SDimitry Andric   const uint32_t bss = IMAGE_SCN_CNT_UNINITIALIZED_DATA;
8290b57cec5SDimitry Andric   const uint32_t code = IMAGE_SCN_CNT_CODE;
8300b57cec5SDimitry Andric   const uint32_t discardable = IMAGE_SCN_MEM_DISCARDABLE;
8310b57cec5SDimitry Andric   const uint32_t r = IMAGE_SCN_MEM_READ;
8320b57cec5SDimitry Andric   const uint32_t w = IMAGE_SCN_MEM_WRITE;
8330b57cec5SDimitry Andric   const uint32_t x = IMAGE_SCN_MEM_EXECUTE;
8340b57cec5SDimitry Andric 
8350b57cec5SDimitry Andric   SmallDenseMap<std::pair<StringRef, uint32_t>, OutputSection *> sections;
8360b57cec5SDimitry Andric   auto createSection = [&](StringRef name, uint32_t outChars) {
8370b57cec5SDimitry Andric     OutputSection *&sec = sections[{name, outChars}];
8380b57cec5SDimitry Andric     if (!sec) {
8390b57cec5SDimitry Andric       sec = make<OutputSection>(name, outChars);
840349cc55cSDimitry Andric       ctx.outputSections.push_back(sec);
8410b57cec5SDimitry Andric     }
8420b57cec5SDimitry Andric     return sec;
8430b57cec5SDimitry Andric   };
8440b57cec5SDimitry Andric 
8450b57cec5SDimitry Andric   // Try to match the section order used by link.exe.
8460b57cec5SDimitry Andric   textSec = createSection(".text", code | r | x);
8470b57cec5SDimitry Andric   createSection(".bss", bss | r | w);
8480b57cec5SDimitry Andric   rdataSec = createSection(".rdata", data | r);
8490b57cec5SDimitry Andric   buildidSec = createSection(".buildid", data | r);
8500b57cec5SDimitry Andric   dataSec = createSection(".data", data | r | w);
8510b57cec5SDimitry Andric   pdataSec = createSection(".pdata", data | r);
8520b57cec5SDimitry Andric   idataSec = createSection(".idata", data | r);
8530b57cec5SDimitry Andric   edataSec = createSection(".edata", data | r);
8540b57cec5SDimitry Andric   didatSec = createSection(".didat", data | r);
8550b57cec5SDimitry Andric   rsrcSec = createSection(".rsrc", data | r);
8560b57cec5SDimitry Andric   relocSec = createSection(".reloc", data | discardable | r);
8570b57cec5SDimitry Andric   ctorsSec = createSection(".ctors", data | r | w);
8580b57cec5SDimitry Andric   dtorsSec = createSection(".dtors", data | r | w);
8590b57cec5SDimitry Andric 
8600b57cec5SDimitry Andric   // Then bin chunks by name and output characteristics.
861349cc55cSDimitry Andric   for (Chunk *c : ctx.symtab.getChunks()) {
8620b57cec5SDimitry Andric     auto *sc = dyn_cast<SectionChunk>(c);
8630b57cec5SDimitry Andric     if (sc && !sc->live) {
8640b57cec5SDimitry Andric       if (config->verbose)
8650b57cec5SDimitry Andric         sc->printDiscardedMessage();
8660b57cec5SDimitry Andric       continue;
8670b57cec5SDimitry Andric     }
8680b57cec5SDimitry Andric     StringRef name = c->getSectionName();
8690b57cec5SDimitry Andric     if (shouldStripSectionSuffix(sc, name))
8700b57cec5SDimitry Andric       name = name.split('$').first;
871e8d8bef9SDimitry Andric 
872e8d8bef9SDimitry Andric     if (name.startswith(".tls"))
873e8d8bef9SDimitry Andric       tlsAlignment = std::max(tlsAlignment, c->getAlignment());
874e8d8bef9SDimitry Andric 
8750b57cec5SDimitry Andric     PartialSection *pSec = createPartialSection(name,
8760b57cec5SDimitry Andric                                                 c->getOutputCharacteristics());
8770b57cec5SDimitry Andric     pSec->chunks.push_back(c);
8780b57cec5SDimitry Andric   }
8790b57cec5SDimitry Andric 
8800b57cec5SDimitry Andric   fixPartialSectionChars(".rsrc", data | r);
88185868e8aSDimitry Andric   fixPartialSectionChars(".edata", data | r);
8820b57cec5SDimitry Andric   // Even in non MinGW cases, we might need to link against GNU import
8830b57cec5SDimitry Andric   // libraries.
8840b57cec5SDimitry Andric   bool hasIdata = fixGnuImportChunks();
8850b57cec5SDimitry Andric   if (!idata.empty())
8860b57cec5SDimitry Andric     hasIdata = true;
8870b57cec5SDimitry Andric 
8880b57cec5SDimitry Andric   if (hasIdata)
8890b57cec5SDimitry Andric     addSyntheticIdata();
8900b57cec5SDimitry Andric 
891e8d8bef9SDimitry Andric   sortSections();
8920b57cec5SDimitry Andric 
8930b57cec5SDimitry Andric   if (hasIdata)
8940b57cec5SDimitry Andric     locateImportTables();
8950b57cec5SDimitry Andric 
8960b57cec5SDimitry Andric   // Then create an OutputSection for each section.
8970b57cec5SDimitry Andric   // '$' and all following characters in input section names are
8980b57cec5SDimitry Andric   // discarded when determining output section. So, .text$foo
8990b57cec5SDimitry Andric   // contributes to .text, for example. See PE/COFF spec 3.2.
9000b57cec5SDimitry Andric   for (auto it : partialSections) {
9010b57cec5SDimitry Andric     PartialSection *pSec = it.second;
9020b57cec5SDimitry Andric     StringRef name = getOutputSectionName(pSec->name);
9030b57cec5SDimitry Andric     uint32_t outChars = pSec->characteristics;
9040b57cec5SDimitry Andric 
9050b57cec5SDimitry Andric     if (name == ".CRT") {
9060b57cec5SDimitry Andric       // In link.exe, there is a special case for the I386 target where .CRT
9070b57cec5SDimitry Andric       // sections are treated as if they have output characteristics DATA | R if
9080b57cec5SDimitry Andric       // their characteristics are DATA | R | W. This implements the same
9090b57cec5SDimitry Andric       // special case for all architectures.
9100b57cec5SDimitry Andric       outChars = data | r;
9110b57cec5SDimitry Andric 
9120b57cec5SDimitry Andric       log("Processing section " + pSec->name + " -> " + name);
9130b57cec5SDimitry Andric 
9140b57cec5SDimitry Andric       sortCRTSectionChunks(pSec->chunks);
9150b57cec5SDimitry Andric     }
9160b57cec5SDimitry Andric 
9170b57cec5SDimitry Andric     OutputSection *sec = createSection(name, outChars);
9180b57cec5SDimitry Andric     for (Chunk *c : pSec->chunks)
9190b57cec5SDimitry Andric       sec->addChunk(c);
9200b57cec5SDimitry Andric 
9210b57cec5SDimitry Andric     sec->addContributingPartialSection(pSec);
9220b57cec5SDimitry Andric   }
9230b57cec5SDimitry Andric 
9240b57cec5SDimitry Andric   // Finally, move some output sections to the end.
9250b57cec5SDimitry Andric   auto sectionOrder = [&](const OutputSection *s) {
9260b57cec5SDimitry Andric     // Move DISCARDABLE (or non-memory-mapped) sections to the end of file
9270b57cec5SDimitry Andric     // because the loader cannot handle holes. Stripping can remove other
9280b57cec5SDimitry Andric     // discardable ones than .reloc, which is first of them (created early).
929*fb03ea46SDimitry Andric     if (s->header.Characteristics & IMAGE_SCN_MEM_DISCARDABLE) {
930*fb03ea46SDimitry Andric       // Move discardable sections named .debug_ to the end, after other
931*fb03ea46SDimitry Andric       // discardable sections. Stripping only removes the sections named
932*fb03ea46SDimitry Andric       // .debug_* - thus try to avoid leaving holes after stripping.
933*fb03ea46SDimitry Andric       if (s->name.startswith(".debug_"))
934*fb03ea46SDimitry Andric         return 3;
9350b57cec5SDimitry Andric       return 2;
936*fb03ea46SDimitry Andric     }
9370b57cec5SDimitry Andric     // .rsrc should come at the end of the non-discardable sections because its
9380b57cec5SDimitry Andric     // size may change by the Win32 UpdateResources() function, causing
9390b57cec5SDimitry Andric     // subsequent sections to move (see https://crbug.com/827082).
9400b57cec5SDimitry Andric     if (s == rsrcSec)
9410b57cec5SDimitry Andric       return 1;
9420b57cec5SDimitry Andric     return 0;
9430b57cec5SDimitry Andric   };
944349cc55cSDimitry Andric   llvm::stable_sort(ctx.outputSections,
9450b57cec5SDimitry Andric                     [&](const OutputSection *s, const OutputSection *t) {
9460b57cec5SDimitry Andric                       return sectionOrder(s) < sectionOrder(t);
9470b57cec5SDimitry Andric                     });
9480b57cec5SDimitry Andric }
9490b57cec5SDimitry Andric 
9500b57cec5SDimitry Andric void Writer::createMiscChunks() {
951349cc55cSDimitry Andric   for (MergeChunk *p : ctx.mergeChunkInstances) {
9520b57cec5SDimitry Andric     if (p) {
9530b57cec5SDimitry Andric       p->finalizeContents();
9540b57cec5SDimitry Andric       rdataSec->addChunk(p);
9550b57cec5SDimitry Andric     }
9560b57cec5SDimitry Andric   }
9570b57cec5SDimitry Andric 
9580b57cec5SDimitry Andric   // Create thunks for locally-dllimported symbols.
959349cc55cSDimitry Andric   if (!ctx.symtab.localImportChunks.empty()) {
960349cc55cSDimitry Andric     for (Chunk *c : ctx.symtab.localImportChunks)
9610b57cec5SDimitry Andric       rdataSec->addChunk(c);
9620b57cec5SDimitry Andric   }
9630b57cec5SDimitry Andric 
9640b57cec5SDimitry Andric   // Create Debug Information Chunks
9650b57cec5SDimitry Andric   OutputSection *debugInfoSec = config->mingw ? buildidSec : rdataSec;
9665ffd83dbSDimitry Andric   if (config->debug || config->repro || config->cetCompat) {
967349cc55cSDimitry Andric     debugDirectory =
968349cc55cSDimitry Andric         make<DebugDirectoryChunk>(ctx, debugRecords, config->repro);
9695ffd83dbSDimitry Andric     debugDirectory->setAlignment(4);
9700b57cec5SDimitry Andric     debugInfoSec->addChunk(debugDirectory);
9710b57cec5SDimitry Andric   }
9720b57cec5SDimitry Andric 
9730b57cec5SDimitry Andric   if (config->debug) {
9740b57cec5SDimitry Andric     // Make a CVDebugRecordChunk even when /DEBUG:CV is not specified.  We
9750b57cec5SDimitry Andric     // output a PDB no matter what, and this chunk provides the only means of
9760b57cec5SDimitry Andric     // allowing a debugger to match a PDB and an executable.  So we need it even
9770b57cec5SDimitry Andric     // if we're ultimately not going to write CodeView data to the PDB.
9780b57cec5SDimitry Andric     buildId = make<CVDebugRecordChunk>();
9795ffd83dbSDimitry Andric     debugRecords.push_back({COFF::IMAGE_DEBUG_TYPE_CODEVIEW, buildId});
9805ffd83dbSDimitry Andric   }
9810b57cec5SDimitry Andric 
9825ffd83dbSDimitry Andric   if (config->cetCompat) {
983e8d8bef9SDimitry Andric     debugRecords.push_back({COFF::IMAGE_DEBUG_TYPE_EX_DLLCHARACTERISTICS,
9845ffd83dbSDimitry Andric                             make<ExtendedDllCharacteristicsChunk>(
985e8d8bef9SDimitry Andric                                 IMAGE_DLL_CHARACTERISTICS_EX_CET_COMPAT)});
9865ffd83dbSDimitry Andric   }
9875ffd83dbSDimitry Andric 
988e8d8bef9SDimitry Andric   // Align and add each chunk referenced by the debug data directory.
989e8d8bef9SDimitry Andric   for (std::pair<COFF::DebugType, Chunk *> r : debugRecords) {
990e8d8bef9SDimitry Andric     r.second->setAlignment(4);
9915ffd83dbSDimitry Andric     debugInfoSec->addChunk(r.second);
9920b57cec5SDimitry Andric   }
9930b57cec5SDimitry Andric 
9940b57cec5SDimitry Andric   // Create SEH table. x86-only.
9950b57cec5SDimitry Andric   if (config->safeSEH)
9960b57cec5SDimitry Andric     createSEHTable();
9970b57cec5SDimitry Andric 
9980b57cec5SDimitry Andric   // Create /guard:cf tables if requested.
9990b57cec5SDimitry Andric   if (config->guardCF != GuardCFLevel::Off)
10000b57cec5SDimitry Andric     createGuardCFTables();
10010b57cec5SDimitry Andric 
10025ffd83dbSDimitry Andric   if (config->autoImport)
10030b57cec5SDimitry Andric     createRuntimePseudoRelocs();
10040b57cec5SDimitry Andric 
10055ffd83dbSDimitry Andric   if (config->mingw)
10060b57cec5SDimitry Andric     insertCtorDtorSymbols();
10070b57cec5SDimitry Andric }
10080b57cec5SDimitry Andric 
10090b57cec5SDimitry Andric // Create .idata section for the DLL-imported symbol table.
10100b57cec5SDimitry Andric // The format of this section is inherently Windows-specific.
10110b57cec5SDimitry Andric // IdataContents class abstracted away the details for us,
10120b57cec5SDimitry Andric // so we just let it create chunks and add them to the section.
10130b57cec5SDimitry Andric void Writer::createImportTables() {
10140b57cec5SDimitry Andric   // Initialize DLLOrder so that import entries are ordered in
10150b57cec5SDimitry Andric   // the same order as in the command line. (That affects DLL
10160b57cec5SDimitry Andric   // initialization order, and this ordering is MSVC-compatible.)
1017349cc55cSDimitry Andric   for (ImportFile *file : ctx.importFileInstances) {
10180b57cec5SDimitry Andric     if (!file->live)
10190b57cec5SDimitry Andric       continue;
10200b57cec5SDimitry Andric 
10210b57cec5SDimitry Andric     std::string dll = StringRef(file->dllName).lower();
10220b57cec5SDimitry Andric     if (config->dllOrder.count(dll) == 0)
10230b57cec5SDimitry Andric       config->dllOrder[dll] = config->dllOrder.size();
10240b57cec5SDimitry Andric 
10250b57cec5SDimitry Andric     if (file->impSym && !isa<DefinedImportData>(file->impSym))
10260b57cec5SDimitry Andric       fatal(toString(*file->impSym) + " was replaced");
10270b57cec5SDimitry Andric     DefinedImportData *impSym = cast_or_null<DefinedImportData>(file->impSym);
10280b57cec5SDimitry Andric     if (config->delayLoads.count(StringRef(file->dllName).lower())) {
10290b57cec5SDimitry Andric       if (!file->thunkSym)
10300b57cec5SDimitry Andric         fatal("cannot delay-load " + toString(file) +
10310b57cec5SDimitry Andric               " due to import of data: " + toString(*impSym));
10320b57cec5SDimitry Andric       delayIdata.add(impSym);
10330b57cec5SDimitry Andric     } else {
10340b57cec5SDimitry Andric       idata.add(impSym);
10350b57cec5SDimitry Andric     }
10360b57cec5SDimitry Andric   }
10370b57cec5SDimitry Andric }
10380b57cec5SDimitry Andric 
10390b57cec5SDimitry Andric void Writer::appendImportThunks() {
1040349cc55cSDimitry Andric   if (ctx.importFileInstances.empty())
10410b57cec5SDimitry Andric     return;
10420b57cec5SDimitry Andric 
1043349cc55cSDimitry Andric   for (ImportFile *file : ctx.importFileInstances) {
10440b57cec5SDimitry Andric     if (!file->live)
10450b57cec5SDimitry Andric       continue;
10460b57cec5SDimitry Andric 
10470b57cec5SDimitry Andric     if (!file->thunkSym)
10480b57cec5SDimitry Andric       continue;
10490b57cec5SDimitry Andric 
10500b57cec5SDimitry Andric     if (!isa<DefinedImportThunk>(file->thunkSym))
10510b57cec5SDimitry Andric       fatal(toString(*file->thunkSym) + " was replaced");
10520b57cec5SDimitry Andric     DefinedImportThunk *thunk = cast<DefinedImportThunk>(file->thunkSym);
10530b57cec5SDimitry Andric     if (file->thunkLive)
10540b57cec5SDimitry Andric       textSec->addChunk(thunk->getChunk());
10550b57cec5SDimitry Andric   }
10560b57cec5SDimitry Andric 
10570b57cec5SDimitry Andric   if (!delayIdata.empty()) {
10580b57cec5SDimitry Andric     Defined *helper = cast<Defined>(config->delayLoadHelper);
1059349cc55cSDimitry Andric     delayIdata.create(ctx, helper);
10600b57cec5SDimitry Andric     for (Chunk *c : delayIdata.getChunks())
10610b57cec5SDimitry Andric       didatSec->addChunk(c);
10620b57cec5SDimitry Andric     for (Chunk *c : delayIdata.getDataChunks())
10630b57cec5SDimitry Andric       dataSec->addChunk(c);
10640b57cec5SDimitry Andric     for (Chunk *c : delayIdata.getCodeChunks())
10650b57cec5SDimitry Andric       textSec->addChunk(c);
10660b57cec5SDimitry Andric   }
10670b57cec5SDimitry Andric }
10680b57cec5SDimitry Andric 
10690b57cec5SDimitry Andric void Writer::createExportTable() {
107085868e8aSDimitry Andric   if (!edataSec->chunks.empty()) {
107185868e8aSDimitry Andric     // Allow using a custom built export table from input object files, instead
107285868e8aSDimitry Andric     // of having the linker synthesize the tables.
107385868e8aSDimitry Andric     if (config->hadExplicitExports)
107485868e8aSDimitry Andric       warn("literal .edata sections override exports");
107585868e8aSDimitry Andric   } else if (!config->exports.empty()) {
10760b57cec5SDimitry Andric     for (Chunk *c : edata.chunks)
10770b57cec5SDimitry Andric       edataSec->addChunk(c);
10780b57cec5SDimitry Andric   }
107985868e8aSDimitry Andric   if (!edataSec->chunks.empty()) {
108085868e8aSDimitry Andric     edataStart = edataSec->chunks.front();
108185868e8aSDimitry Andric     edataEnd = edataSec->chunks.back();
108285868e8aSDimitry Andric   }
1083fe6060f1SDimitry Andric   // Warn on exported deleting destructor.
1084fe6060f1SDimitry Andric   for (auto e : config->exports)
1085fe6060f1SDimitry Andric     if (e.sym && e.sym->getName().startswith("??_G"))
1086fe6060f1SDimitry Andric       warn("export of deleting dtor: " + toString(*e.sym));
108785868e8aSDimitry Andric }
10880b57cec5SDimitry Andric 
10890b57cec5SDimitry Andric void Writer::removeUnusedSections() {
10900b57cec5SDimitry Andric   // Remove sections that we can be sure won't get content, to avoid
10910b57cec5SDimitry Andric   // allocating space for their section headers.
10920b57cec5SDimitry Andric   auto isUnused = [this](OutputSection *s) {
10930b57cec5SDimitry Andric     if (s == relocSec)
10940b57cec5SDimitry Andric       return false; // This section is populated later.
10950b57cec5SDimitry Andric     // MergeChunks have zero size at this point, as their size is finalized
10960b57cec5SDimitry Andric     // later. Only remove sections that have no Chunks at all.
10970b57cec5SDimitry Andric     return s->chunks.empty();
10980b57cec5SDimitry Andric   };
1099349cc55cSDimitry Andric   llvm::erase_if(ctx.outputSections, isUnused);
11000b57cec5SDimitry Andric }
11010b57cec5SDimitry Andric 
11020b57cec5SDimitry Andric // The Windows loader doesn't seem to like empty sections,
11030b57cec5SDimitry Andric // so we remove them if any.
11040b57cec5SDimitry Andric void Writer::removeEmptySections() {
11050b57cec5SDimitry Andric   auto isEmpty = [](OutputSection *s) { return s->getVirtualSize() == 0; };
1106349cc55cSDimitry Andric   llvm::erase_if(ctx.outputSections, isEmpty);
11070b57cec5SDimitry Andric }
11080b57cec5SDimitry Andric 
11090b57cec5SDimitry Andric void Writer::assignOutputSectionIndices() {
11100b57cec5SDimitry Andric   // Assign final output section indices, and assign each chunk to its output
11110b57cec5SDimitry Andric   // section.
11120b57cec5SDimitry Andric   uint32_t idx = 1;
1113349cc55cSDimitry Andric   for (OutputSection *os : ctx.outputSections) {
11140b57cec5SDimitry Andric     os->sectionIndex = idx;
11150b57cec5SDimitry Andric     for (Chunk *c : os->chunks)
11160b57cec5SDimitry Andric       c->setOutputSectionIdx(idx);
11170b57cec5SDimitry Andric     ++idx;
11180b57cec5SDimitry Andric   }
11190b57cec5SDimitry Andric 
11200b57cec5SDimitry Andric   // Merge chunks are containers of chunks, so assign those an output section
11210b57cec5SDimitry Andric   // too.
1122349cc55cSDimitry Andric   for (MergeChunk *mc : ctx.mergeChunkInstances)
11230b57cec5SDimitry Andric     if (mc)
11240b57cec5SDimitry Andric       for (SectionChunk *sc : mc->sections)
11250b57cec5SDimitry Andric         if (sc && sc->live)
11260b57cec5SDimitry Andric           sc->setOutputSectionIdx(mc->getOutputSectionIdx());
11270b57cec5SDimitry Andric }
11280b57cec5SDimitry Andric 
11290b57cec5SDimitry Andric size_t Writer::addEntryToStringTable(StringRef str) {
11300b57cec5SDimitry Andric   assert(str.size() > COFF::NameSize);
11310b57cec5SDimitry Andric   size_t offsetOfEntry = strtab.size() + 4; // +4 for the size field
11320b57cec5SDimitry Andric   strtab.insert(strtab.end(), str.begin(), str.end());
11330b57cec5SDimitry Andric   strtab.push_back('\0');
11340b57cec5SDimitry Andric   return offsetOfEntry;
11350b57cec5SDimitry Andric }
11360b57cec5SDimitry Andric 
11370b57cec5SDimitry Andric Optional<coff_symbol16> Writer::createSymbol(Defined *def) {
11380b57cec5SDimitry Andric   coff_symbol16 sym;
11390b57cec5SDimitry Andric   switch (def->kind()) {
11400b57cec5SDimitry Andric   case Symbol::DefinedAbsoluteKind:
11410b57cec5SDimitry Andric     sym.Value = def->getRVA();
11420b57cec5SDimitry Andric     sym.SectionNumber = IMAGE_SYM_ABSOLUTE;
11430b57cec5SDimitry Andric     break;
11440b57cec5SDimitry Andric   case Symbol::DefinedSyntheticKind:
11450b57cec5SDimitry Andric     // Relative symbols are unrepresentable in a COFF symbol table.
11460b57cec5SDimitry Andric     return None;
11470b57cec5SDimitry Andric   default: {
11480b57cec5SDimitry Andric     // Don't write symbols that won't be written to the output to the symbol
11490b57cec5SDimitry Andric     // table.
11500b57cec5SDimitry Andric     Chunk *c = def->getChunk();
11510b57cec5SDimitry Andric     if (!c)
11520b57cec5SDimitry Andric       return None;
1153349cc55cSDimitry Andric     OutputSection *os = ctx.getOutputSection(c);
11540b57cec5SDimitry Andric     if (!os)
11550b57cec5SDimitry Andric       return None;
11560b57cec5SDimitry Andric 
11570b57cec5SDimitry Andric     sym.Value = def->getRVA() - os->getRVA();
11580b57cec5SDimitry Andric     sym.SectionNumber = os->sectionIndex;
11590b57cec5SDimitry Andric     break;
11600b57cec5SDimitry Andric   }
11610b57cec5SDimitry Andric   }
11620b57cec5SDimitry Andric 
11630b57cec5SDimitry Andric   // Symbols that are runtime pseudo relocations don't point to the actual
11640b57cec5SDimitry Andric   // symbol data itself (as they are imported), but points to the IAT entry
11650b57cec5SDimitry Andric   // instead. Avoid emitting them to the symbol table, as they can confuse
11660b57cec5SDimitry Andric   // debuggers.
11670b57cec5SDimitry Andric   if (def->isRuntimePseudoReloc)
11680b57cec5SDimitry Andric     return None;
11690b57cec5SDimitry Andric 
11700b57cec5SDimitry Andric   StringRef name = def->getName();
11710b57cec5SDimitry Andric   if (name.size() > COFF::NameSize) {
11720b57cec5SDimitry Andric     sym.Name.Offset.Zeroes = 0;
11730b57cec5SDimitry Andric     sym.Name.Offset.Offset = addEntryToStringTable(name);
11740b57cec5SDimitry Andric   } else {
11750b57cec5SDimitry Andric     memset(sym.Name.ShortName, 0, COFF::NameSize);
11760b57cec5SDimitry Andric     memcpy(sym.Name.ShortName, name.data(), name.size());
11770b57cec5SDimitry Andric   }
11780b57cec5SDimitry Andric 
11790b57cec5SDimitry Andric   if (auto *d = dyn_cast<DefinedCOFF>(def)) {
11800b57cec5SDimitry Andric     COFFSymbolRef ref = d->getCOFFSymbol();
11810b57cec5SDimitry Andric     sym.Type = ref.getType();
11820b57cec5SDimitry Andric     sym.StorageClass = ref.getStorageClass();
11830b57cec5SDimitry Andric   } else {
11840b57cec5SDimitry Andric     sym.Type = IMAGE_SYM_TYPE_NULL;
11850b57cec5SDimitry Andric     sym.StorageClass = IMAGE_SYM_CLASS_EXTERNAL;
11860b57cec5SDimitry Andric   }
11870b57cec5SDimitry Andric   sym.NumberOfAuxSymbols = 0;
11880b57cec5SDimitry Andric   return sym;
11890b57cec5SDimitry Andric }
11900b57cec5SDimitry Andric 
11910b57cec5SDimitry Andric void Writer::createSymbolAndStringTable() {
11920b57cec5SDimitry Andric   // PE/COFF images are limited to 8 byte section names. Longer names can be
11930b57cec5SDimitry Andric   // supported by writing a non-standard string table, but this string table is
11940b57cec5SDimitry Andric   // not mapped at runtime and the long names will therefore be inaccessible.
11950b57cec5SDimitry Andric   // link.exe always truncates section names to 8 bytes, whereas binutils always
11960b57cec5SDimitry Andric   // preserves long section names via the string table. LLD adopts a hybrid
11970b57cec5SDimitry Andric   // solution where discardable sections have long names preserved and
11980b57cec5SDimitry Andric   // non-discardable sections have their names truncated, to ensure that any
11990b57cec5SDimitry Andric   // section which is mapped at runtime also has its name mapped at runtime.
1200349cc55cSDimitry Andric   for (OutputSection *sec : ctx.outputSections) {
12010b57cec5SDimitry Andric     if (sec->name.size() <= COFF::NameSize)
12020b57cec5SDimitry Andric       continue;
12030b57cec5SDimitry Andric     if ((sec->header.Characteristics & IMAGE_SCN_MEM_DISCARDABLE) == 0)
12040b57cec5SDimitry Andric       continue;
1205480093f4SDimitry Andric     if (config->warnLongSectionNames) {
1206480093f4SDimitry Andric       warn("section name " + sec->name +
1207480093f4SDimitry Andric            " is longer than 8 characters and will use a non-standard string "
1208480093f4SDimitry Andric            "table");
1209480093f4SDimitry Andric     }
12100b57cec5SDimitry Andric     sec->setStringTableOff(addEntryToStringTable(sec->name));
12110b57cec5SDimitry Andric   }
12120b57cec5SDimitry Andric 
12130b57cec5SDimitry Andric   if (config->debugDwarf || config->debugSymtab) {
1214349cc55cSDimitry Andric     for (ObjFile *file : ctx.objFileInstances) {
12150b57cec5SDimitry Andric       for (Symbol *b : file->getSymbols()) {
12160b57cec5SDimitry Andric         auto *d = dyn_cast_or_null<Defined>(b);
12170b57cec5SDimitry Andric         if (!d || d->writtenToSymtab)
12180b57cec5SDimitry Andric           continue;
12190b57cec5SDimitry Andric         d->writtenToSymtab = true;
12204824e7fdSDimitry Andric         if (auto *dc = dyn_cast_or_null<DefinedCOFF>(d)) {
12214824e7fdSDimitry Andric           COFFSymbolRef symRef = dc->getCOFFSymbol();
12224824e7fdSDimitry Andric           if (symRef.isSectionDefinition() ||
12234824e7fdSDimitry Andric               symRef.getStorageClass() == COFF::IMAGE_SYM_CLASS_LABEL)
12244824e7fdSDimitry Andric             continue;
12254824e7fdSDimitry Andric         }
12260b57cec5SDimitry Andric 
12270b57cec5SDimitry Andric         if (Optional<coff_symbol16> sym = createSymbol(d))
12280b57cec5SDimitry Andric           outputSymtab.push_back(*sym);
12290b57cec5SDimitry Andric       }
12300b57cec5SDimitry Andric     }
12310b57cec5SDimitry Andric   }
12320b57cec5SDimitry Andric 
12330b57cec5SDimitry Andric   if (outputSymtab.empty() && strtab.empty())
12340b57cec5SDimitry Andric     return;
12350b57cec5SDimitry Andric 
12360b57cec5SDimitry Andric   // We position the symbol table to be adjacent to the end of the last section.
12370b57cec5SDimitry Andric   uint64_t fileOff = fileSize;
12380b57cec5SDimitry Andric   pointerToSymbolTable = fileOff;
12390b57cec5SDimitry Andric   fileOff += outputSymtab.size() * sizeof(coff_symbol16);
12400b57cec5SDimitry Andric   fileOff += 4 + strtab.size();
12410b57cec5SDimitry Andric   fileSize = alignTo(fileOff, config->fileAlign);
12420b57cec5SDimitry Andric }
12430b57cec5SDimitry Andric 
12440b57cec5SDimitry Andric void Writer::mergeSections() {
12450b57cec5SDimitry Andric   if (!pdataSec->chunks.empty()) {
12460b57cec5SDimitry Andric     firstPdata = pdataSec->chunks.front();
12470b57cec5SDimitry Andric     lastPdata = pdataSec->chunks.back();
12480b57cec5SDimitry Andric   }
12490b57cec5SDimitry Andric 
12500b57cec5SDimitry Andric   for (auto &p : config->merge) {
12510b57cec5SDimitry Andric     StringRef toName = p.second;
12520b57cec5SDimitry Andric     if (p.first == toName)
12530b57cec5SDimitry Andric       continue;
12540b57cec5SDimitry Andric     StringSet<> names;
125504eeddc0SDimitry Andric     while (true) {
12560b57cec5SDimitry Andric       if (!names.insert(toName).second)
12570b57cec5SDimitry Andric         fatal("/merge: cycle found for section '" + p.first + "'");
12580b57cec5SDimitry Andric       auto i = config->merge.find(toName);
12590b57cec5SDimitry Andric       if (i == config->merge.end())
12600b57cec5SDimitry Andric         break;
12610b57cec5SDimitry Andric       toName = i->second;
12620b57cec5SDimitry Andric     }
12630b57cec5SDimitry Andric     OutputSection *from = findSection(p.first);
12640b57cec5SDimitry Andric     OutputSection *to = findSection(toName);
12650b57cec5SDimitry Andric     if (!from)
12660b57cec5SDimitry Andric       continue;
12670b57cec5SDimitry Andric     if (!to) {
12680b57cec5SDimitry Andric       from->name = toName;
12690b57cec5SDimitry Andric       continue;
12700b57cec5SDimitry Andric     }
12710b57cec5SDimitry Andric     to->merge(from);
12720b57cec5SDimitry Andric   }
12730b57cec5SDimitry Andric }
12740b57cec5SDimitry Andric 
12750b57cec5SDimitry Andric // Visits all sections to assign incremental, non-overlapping RVAs and
12760b57cec5SDimitry Andric // file offsets.
12770b57cec5SDimitry Andric void Writer::assignAddresses() {
12780b57cec5SDimitry Andric   sizeOfHeaders = dosStubSize + sizeof(PEMagic) + sizeof(coff_file_header) +
12790b57cec5SDimitry Andric                   sizeof(data_directory) * numberOfDataDirectory +
1280349cc55cSDimitry Andric                   sizeof(coff_section) * ctx.outputSections.size();
12810b57cec5SDimitry Andric   sizeOfHeaders +=
12820b57cec5SDimitry Andric       config->is64() ? sizeof(pe32plus_header) : sizeof(pe32_header);
12830b57cec5SDimitry Andric   sizeOfHeaders = alignTo(sizeOfHeaders, config->fileAlign);
12840b57cec5SDimitry Andric   fileSize = sizeOfHeaders;
12850b57cec5SDimitry Andric 
12860b57cec5SDimitry Andric   // The first page is kept unmapped.
12870b57cec5SDimitry Andric   uint64_t rva = alignTo(sizeOfHeaders, config->align);
12880b57cec5SDimitry Andric 
1289349cc55cSDimitry Andric   for (OutputSection *sec : ctx.outputSections) {
12900b57cec5SDimitry Andric     if (sec == relocSec)
12910b57cec5SDimitry Andric       addBaserels();
12920b57cec5SDimitry Andric     uint64_t rawSize = 0, virtualSize = 0;
12930b57cec5SDimitry Andric     sec->header.VirtualAddress = rva;
12940b57cec5SDimitry Andric 
12950b57cec5SDimitry Andric     // If /FUNCTIONPADMIN is used, functions are padded in order to create a
12960b57cec5SDimitry Andric     // hotpatchable image.
12970b57cec5SDimitry Andric     const bool isCodeSection =
12980b57cec5SDimitry Andric         (sec->header.Characteristics & IMAGE_SCN_CNT_CODE) &&
12990b57cec5SDimitry Andric         (sec->header.Characteristics & IMAGE_SCN_MEM_READ) &&
13000b57cec5SDimitry Andric         (sec->header.Characteristics & IMAGE_SCN_MEM_EXECUTE);
13010b57cec5SDimitry Andric     uint32_t padding = isCodeSection ? config->functionPadMin : 0;
13020b57cec5SDimitry Andric 
13030b57cec5SDimitry Andric     for (Chunk *c : sec->chunks) {
13040b57cec5SDimitry Andric       if (padding && c->isHotPatchable())
13050b57cec5SDimitry Andric         virtualSize += padding;
13060b57cec5SDimitry Andric       virtualSize = alignTo(virtualSize, c->getAlignment());
13070b57cec5SDimitry Andric       c->setRVA(rva + virtualSize);
13080b57cec5SDimitry Andric       virtualSize += c->getSize();
13090b57cec5SDimitry Andric       if (c->hasData)
13100b57cec5SDimitry Andric         rawSize = alignTo(virtualSize, config->fileAlign);
13110b57cec5SDimitry Andric     }
13120b57cec5SDimitry Andric     if (virtualSize > UINT32_MAX)
13130b57cec5SDimitry Andric       error("section larger than 4 GiB: " + sec->name);
13140b57cec5SDimitry Andric     sec->header.VirtualSize = virtualSize;
13150b57cec5SDimitry Andric     sec->header.SizeOfRawData = rawSize;
13160b57cec5SDimitry Andric     if (rawSize != 0)
13170b57cec5SDimitry Andric       sec->header.PointerToRawData = fileSize;
13180b57cec5SDimitry Andric     rva += alignTo(virtualSize, config->align);
13190b57cec5SDimitry Andric     fileSize += alignTo(rawSize, config->fileAlign);
13200b57cec5SDimitry Andric   }
13210b57cec5SDimitry Andric   sizeOfImage = alignTo(rva, config->align);
13220b57cec5SDimitry Andric 
13230b57cec5SDimitry Andric   // Assign addresses to sections in MergeChunks.
1324349cc55cSDimitry Andric   for (MergeChunk *mc : ctx.mergeChunkInstances)
13250b57cec5SDimitry Andric     if (mc)
13260b57cec5SDimitry Andric       mc->assignSubsectionRVAs();
13270b57cec5SDimitry Andric }
13280b57cec5SDimitry Andric 
13290b57cec5SDimitry Andric template <typename PEHeaderTy> void Writer::writeHeader() {
13300b57cec5SDimitry Andric   // Write DOS header. For backwards compatibility, the first part of a PE/COFF
13310b57cec5SDimitry Andric   // executable consists of an MS-DOS MZ executable. If the executable is run
13320b57cec5SDimitry Andric   // under DOS, that program gets run (usually to just print an error message).
13330b57cec5SDimitry Andric   // When run under Windows, the loader looks at AddressOfNewExeHeader and uses
13340b57cec5SDimitry Andric   // the PE header instead.
13350b57cec5SDimitry Andric   uint8_t *buf = buffer->getBufferStart();
13360b57cec5SDimitry Andric   auto *dos = reinterpret_cast<dos_header *>(buf);
13370b57cec5SDimitry Andric   buf += sizeof(dos_header);
13380b57cec5SDimitry Andric   dos->Magic[0] = 'M';
13390b57cec5SDimitry Andric   dos->Magic[1] = 'Z';
13400b57cec5SDimitry Andric   dos->UsedBytesInTheLastPage = dosStubSize % 512;
13410b57cec5SDimitry Andric   dos->FileSizeInPages = divideCeil(dosStubSize, 512);
13420b57cec5SDimitry Andric   dos->HeaderSizeInParagraphs = sizeof(dos_header) / 16;
13430b57cec5SDimitry Andric 
13440b57cec5SDimitry Andric   dos->AddressOfRelocationTable = sizeof(dos_header);
13450b57cec5SDimitry Andric   dos->AddressOfNewExeHeader = dosStubSize;
13460b57cec5SDimitry Andric 
13470b57cec5SDimitry Andric   // Write DOS program.
13480b57cec5SDimitry Andric   memcpy(buf, dosProgram, sizeof(dosProgram));
13490b57cec5SDimitry Andric   buf += sizeof(dosProgram);
13500b57cec5SDimitry Andric 
13510b57cec5SDimitry Andric   // Write PE magic
13520b57cec5SDimitry Andric   memcpy(buf, PEMagic, sizeof(PEMagic));
13530b57cec5SDimitry Andric   buf += sizeof(PEMagic);
13540b57cec5SDimitry Andric 
13550b57cec5SDimitry Andric   // Write COFF header
13560b57cec5SDimitry Andric   auto *coff = reinterpret_cast<coff_file_header *>(buf);
13570b57cec5SDimitry Andric   buf += sizeof(*coff);
13580b57cec5SDimitry Andric   coff->Machine = config->machine;
1359349cc55cSDimitry Andric   coff->NumberOfSections = ctx.outputSections.size();
13600b57cec5SDimitry Andric   coff->Characteristics = IMAGE_FILE_EXECUTABLE_IMAGE;
13610b57cec5SDimitry Andric   if (config->largeAddressAware)
13620b57cec5SDimitry Andric     coff->Characteristics |= IMAGE_FILE_LARGE_ADDRESS_AWARE;
13630b57cec5SDimitry Andric   if (!config->is64())
13640b57cec5SDimitry Andric     coff->Characteristics |= IMAGE_FILE_32BIT_MACHINE;
13650b57cec5SDimitry Andric   if (config->dll)
13660b57cec5SDimitry Andric     coff->Characteristics |= IMAGE_FILE_DLL;
1367480093f4SDimitry Andric   if (config->driverUponly)
1368480093f4SDimitry Andric     coff->Characteristics |= IMAGE_FILE_UP_SYSTEM_ONLY;
13690b57cec5SDimitry Andric   if (!config->relocatable)
13700b57cec5SDimitry Andric     coff->Characteristics |= IMAGE_FILE_RELOCS_STRIPPED;
13710b57cec5SDimitry Andric   if (config->swaprunCD)
13720b57cec5SDimitry Andric     coff->Characteristics |= IMAGE_FILE_REMOVABLE_RUN_FROM_SWAP;
13730b57cec5SDimitry Andric   if (config->swaprunNet)
13740b57cec5SDimitry Andric     coff->Characteristics |= IMAGE_FILE_NET_RUN_FROM_SWAP;
13750b57cec5SDimitry Andric   coff->SizeOfOptionalHeader =
13760b57cec5SDimitry Andric       sizeof(PEHeaderTy) + sizeof(data_directory) * numberOfDataDirectory;
13770b57cec5SDimitry Andric 
13780b57cec5SDimitry Andric   // Write PE header
13790b57cec5SDimitry Andric   auto *pe = reinterpret_cast<PEHeaderTy *>(buf);
13800b57cec5SDimitry Andric   buf += sizeof(*pe);
13810b57cec5SDimitry Andric   pe->Magic = config->is64() ? PE32Header::PE32_PLUS : PE32Header::PE32;
13820b57cec5SDimitry Andric 
13830b57cec5SDimitry Andric   // If {Major,Minor}LinkerVersion is left at 0.0, then for some
13840b57cec5SDimitry Andric   // reason signing the resulting PE file with Authenticode produces a
13850b57cec5SDimitry Andric   // signature that fails to validate on Windows 7 (but is OK on 10).
13860b57cec5SDimitry Andric   // Set it to 14.0, which is what VS2015 outputs, and which avoids
13870b57cec5SDimitry Andric   // that problem.
13880b57cec5SDimitry Andric   pe->MajorLinkerVersion = 14;
13890b57cec5SDimitry Andric   pe->MinorLinkerVersion = 0;
13900b57cec5SDimitry Andric 
13910b57cec5SDimitry Andric   pe->ImageBase = config->imageBase;
13920b57cec5SDimitry Andric   pe->SectionAlignment = config->align;
13930b57cec5SDimitry Andric   pe->FileAlignment = config->fileAlign;
13940b57cec5SDimitry Andric   pe->MajorImageVersion = config->majorImageVersion;
13950b57cec5SDimitry Andric   pe->MinorImageVersion = config->minorImageVersion;
13960b57cec5SDimitry Andric   pe->MajorOperatingSystemVersion = config->majorOSVersion;
13970b57cec5SDimitry Andric   pe->MinorOperatingSystemVersion = config->minorOSVersion;
1398e8d8bef9SDimitry Andric   pe->MajorSubsystemVersion = config->majorSubsystemVersion;
1399e8d8bef9SDimitry Andric   pe->MinorSubsystemVersion = config->minorSubsystemVersion;
14000b57cec5SDimitry Andric   pe->Subsystem = config->subsystem;
14010b57cec5SDimitry Andric   pe->SizeOfImage = sizeOfImage;
14020b57cec5SDimitry Andric   pe->SizeOfHeaders = sizeOfHeaders;
14030b57cec5SDimitry Andric   if (!config->noEntry) {
14040b57cec5SDimitry Andric     Defined *entry = cast<Defined>(config->entry);
14050b57cec5SDimitry Andric     pe->AddressOfEntryPoint = entry->getRVA();
14060b57cec5SDimitry Andric     // Pointer to thumb code must have the LSB set, so adjust it.
14070b57cec5SDimitry Andric     if (config->machine == ARMNT)
14080b57cec5SDimitry Andric       pe->AddressOfEntryPoint |= 1;
14090b57cec5SDimitry Andric   }
14100b57cec5SDimitry Andric   pe->SizeOfStackReserve = config->stackReserve;
14110b57cec5SDimitry Andric   pe->SizeOfStackCommit = config->stackCommit;
14120b57cec5SDimitry Andric   pe->SizeOfHeapReserve = config->heapReserve;
14130b57cec5SDimitry Andric   pe->SizeOfHeapCommit = config->heapCommit;
14140b57cec5SDimitry Andric   if (config->appContainer)
14150b57cec5SDimitry Andric     pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_APPCONTAINER;
1416480093f4SDimitry Andric   if (config->driverWdm)
1417480093f4SDimitry Andric     pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_WDM_DRIVER;
14180b57cec5SDimitry Andric   if (config->dynamicBase)
14190b57cec5SDimitry Andric     pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_DYNAMIC_BASE;
14200b57cec5SDimitry Andric   if (config->highEntropyVA)
14210b57cec5SDimitry Andric     pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_HIGH_ENTROPY_VA;
14220b57cec5SDimitry Andric   if (!config->allowBind)
14230b57cec5SDimitry Andric     pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_NO_BIND;
14240b57cec5SDimitry Andric   if (config->nxCompat)
14250b57cec5SDimitry Andric     pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_NX_COMPAT;
14260b57cec5SDimitry Andric   if (!config->allowIsolation)
14270b57cec5SDimitry Andric     pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_NO_ISOLATION;
14280b57cec5SDimitry Andric   if (config->guardCF != GuardCFLevel::Off)
14290b57cec5SDimitry Andric     pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_GUARD_CF;
14300b57cec5SDimitry Andric   if (config->integrityCheck)
14310b57cec5SDimitry Andric     pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_FORCE_INTEGRITY;
1432979e22ffSDimitry Andric   if (setNoSEHCharacteristic || config->noSEH)
14330b57cec5SDimitry Andric     pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_NO_SEH;
14340b57cec5SDimitry Andric   if (config->terminalServerAware)
14350b57cec5SDimitry Andric     pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_TERMINAL_SERVER_AWARE;
14360b57cec5SDimitry Andric   pe->NumberOfRvaAndSize = numberOfDataDirectory;
14370b57cec5SDimitry Andric   if (textSec->getVirtualSize()) {
14380b57cec5SDimitry Andric     pe->BaseOfCode = textSec->getRVA();
14390b57cec5SDimitry Andric     pe->SizeOfCode = textSec->getRawSize();
14400b57cec5SDimitry Andric   }
14410b57cec5SDimitry Andric   pe->SizeOfInitializedData = getSizeOfInitializedData();
14420b57cec5SDimitry Andric 
14430b57cec5SDimitry Andric   // Write data directory
14440b57cec5SDimitry Andric   auto *dir = reinterpret_cast<data_directory *>(buf);
14450b57cec5SDimitry Andric   buf += sizeof(*dir) * numberOfDataDirectory;
144685868e8aSDimitry Andric   if (edataStart) {
144785868e8aSDimitry Andric     dir[EXPORT_TABLE].RelativeVirtualAddress = edataStart->getRVA();
144885868e8aSDimitry Andric     dir[EXPORT_TABLE].Size =
144985868e8aSDimitry Andric         edataEnd->getRVA() + edataEnd->getSize() - edataStart->getRVA();
14500b57cec5SDimitry Andric   }
14510b57cec5SDimitry Andric   if (importTableStart) {
14520b57cec5SDimitry Andric     dir[IMPORT_TABLE].RelativeVirtualAddress = importTableStart->getRVA();
14530b57cec5SDimitry Andric     dir[IMPORT_TABLE].Size = importTableSize;
14540b57cec5SDimitry Andric   }
14550b57cec5SDimitry Andric   if (iatStart) {
14560b57cec5SDimitry Andric     dir[IAT].RelativeVirtualAddress = iatStart->getRVA();
14570b57cec5SDimitry Andric     dir[IAT].Size = iatSize;
14580b57cec5SDimitry Andric   }
14590b57cec5SDimitry Andric   if (rsrcSec->getVirtualSize()) {
14600b57cec5SDimitry Andric     dir[RESOURCE_TABLE].RelativeVirtualAddress = rsrcSec->getRVA();
14610b57cec5SDimitry Andric     dir[RESOURCE_TABLE].Size = rsrcSec->getVirtualSize();
14620b57cec5SDimitry Andric   }
14630b57cec5SDimitry Andric   if (firstPdata) {
14640b57cec5SDimitry Andric     dir[EXCEPTION_TABLE].RelativeVirtualAddress = firstPdata->getRVA();
14650b57cec5SDimitry Andric     dir[EXCEPTION_TABLE].Size =
14660b57cec5SDimitry Andric         lastPdata->getRVA() + lastPdata->getSize() - firstPdata->getRVA();
14670b57cec5SDimitry Andric   }
14680b57cec5SDimitry Andric   if (relocSec->getVirtualSize()) {
14690b57cec5SDimitry Andric     dir[BASE_RELOCATION_TABLE].RelativeVirtualAddress = relocSec->getRVA();
14700b57cec5SDimitry Andric     dir[BASE_RELOCATION_TABLE].Size = relocSec->getVirtualSize();
14710b57cec5SDimitry Andric   }
1472349cc55cSDimitry Andric   if (Symbol *sym = ctx.symtab.findUnderscore("_tls_used")) {
14730b57cec5SDimitry Andric     if (Defined *b = dyn_cast<Defined>(sym)) {
14740b57cec5SDimitry Andric       dir[TLS_TABLE].RelativeVirtualAddress = b->getRVA();
14750b57cec5SDimitry Andric       dir[TLS_TABLE].Size = config->is64()
14760b57cec5SDimitry Andric                                 ? sizeof(object::coff_tls_directory64)
14770b57cec5SDimitry Andric                                 : sizeof(object::coff_tls_directory32);
14780b57cec5SDimitry Andric     }
14790b57cec5SDimitry Andric   }
14800b57cec5SDimitry Andric   if (debugDirectory) {
14810b57cec5SDimitry Andric     dir[DEBUG_DIRECTORY].RelativeVirtualAddress = debugDirectory->getRVA();
14820b57cec5SDimitry Andric     dir[DEBUG_DIRECTORY].Size = debugDirectory->getSize();
14830b57cec5SDimitry Andric   }
1484349cc55cSDimitry Andric   if (Symbol *sym = ctx.symtab.findUnderscore("_load_config_used")) {
14850b57cec5SDimitry Andric     if (auto *b = dyn_cast<DefinedRegular>(sym)) {
14860b57cec5SDimitry Andric       SectionChunk *sc = b->getChunk();
14870b57cec5SDimitry Andric       assert(b->getRVA() >= sc->getRVA());
14880b57cec5SDimitry Andric       uint64_t offsetInChunk = b->getRVA() - sc->getRVA();
14890b57cec5SDimitry Andric       if (!sc->hasData || offsetInChunk + 4 > sc->getSize())
14900b57cec5SDimitry Andric         fatal("_load_config_used is malformed");
14910b57cec5SDimitry Andric 
14920b57cec5SDimitry Andric       ArrayRef<uint8_t> secContents = sc->getContents();
14930b57cec5SDimitry Andric       uint32_t loadConfigSize =
14940b57cec5SDimitry Andric           *reinterpret_cast<const ulittle32_t *>(&secContents[offsetInChunk]);
14950b57cec5SDimitry Andric       if (offsetInChunk + loadConfigSize > sc->getSize())
14960b57cec5SDimitry Andric         fatal("_load_config_used is too large");
14970b57cec5SDimitry Andric       dir[LOAD_CONFIG_TABLE].RelativeVirtualAddress = b->getRVA();
14980b57cec5SDimitry Andric       dir[LOAD_CONFIG_TABLE].Size = loadConfigSize;
14990b57cec5SDimitry Andric     }
15000b57cec5SDimitry Andric   }
15010b57cec5SDimitry Andric   if (!delayIdata.empty()) {
15020b57cec5SDimitry Andric     dir[DELAY_IMPORT_DESCRIPTOR].RelativeVirtualAddress =
15030b57cec5SDimitry Andric         delayIdata.getDirRVA();
15040b57cec5SDimitry Andric     dir[DELAY_IMPORT_DESCRIPTOR].Size = delayIdata.getDirSize();
15050b57cec5SDimitry Andric   }
15060b57cec5SDimitry Andric 
15070b57cec5SDimitry Andric   // Write section table
1508349cc55cSDimitry Andric   for (OutputSection *sec : ctx.outputSections) {
15090b57cec5SDimitry Andric     sec->writeHeaderTo(buf);
15100b57cec5SDimitry Andric     buf += sizeof(coff_section);
15110b57cec5SDimitry Andric   }
15120b57cec5SDimitry Andric   sectionTable = ArrayRef<uint8_t>(
1513349cc55cSDimitry Andric       buf - ctx.outputSections.size() * sizeof(coff_section), buf);
15140b57cec5SDimitry Andric 
15150b57cec5SDimitry Andric   if (outputSymtab.empty() && strtab.empty())
15160b57cec5SDimitry Andric     return;
15170b57cec5SDimitry Andric 
15180b57cec5SDimitry Andric   coff->PointerToSymbolTable = pointerToSymbolTable;
15190b57cec5SDimitry Andric   uint32_t numberOfSymbols = outputSymtab.size();
15200b57cec5SDimitry Andric   coff->NumberOfSymbols = numberOfSymbols;
15210b57cec5SDimitry Andric   auto *symbolTable = reinterpret_cast<coff_symbol16 *>(
15220b57cec5SDimitry Andric       buffer->getBufferStart() + coff->PointerToSymbolTable);
15230b57cec5SDimitry Andric   for (size_t i = 0; i != numberOfSymbols; ++i)
15240b57cec5SDimitry Andric     symbolTable[i] = outputSymtab[i];
15250b57cec5SDimitry Andric   // Create the string table, it follows immediately after the symbol table.
15260b57cec5SDimitry Andric   // The first 4 bytes is length including itself.
15270b57cec5SDimitry Andric   buf = reinterpret_cast<uint8_t *>(&symbolTable[numberOfSymbols]);
15280b57cec5SDimitry Andric   write32le(buf, strtab.size() + 4);
15290b57cec5SDimitry Andric   if (!strtab.empty())
15300b57cec5SDimitry Andric     memcpy(buf + 4, strtab.data(), strtab.size());
15310b57cec5SDimitry Andric }
15320b57cec5SDimitry Andric 
15330b57cec5SDimitry Andric void Writer::openFile(StringRef path) {
15340b57cec5SDimitry Andric   buffer = CHECK(
15350b57cec5SDimitry Andric       FileOutputBuffer::create(path, fileSize, FileOutputBuffer::F_executable),
15360b57cec5SDimitry Andric       "failed to open " + path);
15370b57cec5SDimitry Andric }
15380b57cec5SDimitry Andric 
15390b57cec5SDimitry Andric void Writer::createSEHTable() {
15400b57cec5SDimitry Andric   SymbolRVASet handlers;
1541349cc55cSDimitry Andric   for (ObjFile *file : ctx.objFileInstances) {
15420b57cec5SDimitry Andric     if (!file->hasSafeSEH())
15430b57cec5SDimitry Andric       error("/safeseh: " + file->getName() + " is not compatible with SEH");
15440b57cec5SDimitry Andric     markSymbolsForRVATable(file, file->getSXDataChunks(), handlers);
15450b57cec5SDimitry Andric   }
15460b57cec5SDimitry Andric 
15470b57cec5SDimitry Andric   // Set the "no SEH" characteristic if there really were no handlers, or if
15480b57cec5SDimitry Andric   // there is no load config object to point to the table of handlers.
15490b57cec5SDimitry Andric   setNoSEHCharacteristic =
1550349cc55cSDimitry Andric       handlers.empty() || !ctx.symtab.findUnderscore("_load_config_used");
15510b57cec5SDimitry Andric 
15520b57cec5SDimitry Andric   maybeAddRVATable(std::move(handlers), "__safe_se_handler_table",
15530b57cec5SDimitry Andric                    "__safe_se_handler_count");
15540b57cec5SDimitry Andric }
15550b57cec5SDimitry Andric 
15560b57cec5SDimitry Andric // Add a symbol to an RVA set. Two symbols may have the same RVA, but an RVA set
15570b57cec5SDimitry Andric // cannot contain duplicates. Therefore, the set is uniqued by Chunk and the
15580b57cec5SDimitry Andric // symbol's offset into that Chunk.
15590b57cec5SDimitry Andric static void addSymbolToRVASet(SymbolRVASet &rvaSet, Defined *s) {
15600b57cec5SDimitry Andric   Chunk *c = s->getChunk();
15610b57cec5SDimitry Andric   if (auto *sc = dyn_cast<SectionChunk>(c))
15620b57cec5SDimitry Andric     c = sc->repl; // Look through ICF replacement.
15630b57cec5SDimitry Andric   uint32_t off = s->getRVA() - (c ? c->getRVA() : 0);
15640b57cec5SDimitry Andric   rvaSet.insert({c, off});
15650b57cec5SDimitry Andric }
15660b57cec5SDimitry Andric 
15670b57cec5SDimitry Andric // Given a symbol, add it to the GFIDs table if it is a live, defined, function
15680b57cec5SDimitry Andric // symbol in an executable section.
15690b57cec5SDimitry Andric static void maybeAddAddressTakenFunction(SymbolRVASet &addressTakenSyms,
15700b57cec5SDimitry Andric                                          Symbol *s) {
15710b57cec5SDimitry Andric   if (!s)
15720b57cec5SDimitry Andric     return;
15730b57cec5SDimitry Andric 
15740b57cec5SDimitry Andric   switch (s->kind()) {
15750b57cec5SDimitry Andric   case Symbol::DefinedLocalImportKind:
15760b57cec5SDimitry Andric   case Symbol::DefinedImportDataKind:
15770b57cec5SDimitry Andric     // Defines an __imp_ pointer, so it is data, so it is ignored.
15780b57cec5SDimitry Andric     break;
15790b57cec5SDimitry Andric   case Symbol::DefinedCommonKind:
15800b57cec5SDimitry Andric     // Common is always data, so it is ignored.
15810b57cec5SDimitry Andric     break;
15820b57cec5SDimitry Andric   case Symbol::DefinedAbsoluteKind:
15830b57cec5SDimitry Andric   case Symbol::DefinedSyntheticKind:
15840b57cec5SDimitry Andric     // Absolute is never code, synthetic generally isn't and usually isn't
15850b57cec5SDimitry Andric     // determinable.
15860b57cec5SDimitry Andric     break;
158785868e8aSDimitry Andric   case Symbol::LazyArchiveKind:
158885868e8aSDimitry Andric   case Symbol::LazyObjectKind:
1589fe6060f1SDimitry Andric   case Symbol::LazyDLLSymbolKind:
15900b57cec5SDimitry Andric   case Symbol::UndefinedKind:
15910b57cec5SDimitry Andric     // Undefined symbols resolve to zero, so they don't have an RVA. Lazy
15920b57cec5SDimitry Andric     // symbols shouldn't have relocations.
15930b57cec5SDimitry Andric     break;
15940b57cec5SDimitry Andric 
15950b57cec5SDimitry Andric   case Symbol::DefinedImportThunkKind:
15960b57cec5SDimitry Andric     // Thunks are always code, include them.
15970b57cec5SDimitry Andric     addSymbolToRVASet(addressTakenSyms, cast<Defined>(s));
15980b57cec5SDimitry Andric     break;
15990b57cec5SDimitry Andric 
16000b57cec5SDimitry Andric   case Symbol::DefinedRegularKind: {
16010b57cec5SDimitry Andric     // This is a regular, defined, symbol from a COFF file. Mark the symbol as
16020b57cec5SDimitry Andric     // address taken if the symbol type is function and it's in an executable
16030b57cec5SDimitry Andric     // section.
16040b57cec5SDimitry Andric     auto *d = cast<DefinedRegular>(s);
16050b57cec5SDimitry Andric     if (d->getCOFFSymbol().getComplexType() == COFF::IMAGE_SYM_DTYPE_FUNCTION) {
16060b57cec5SDimitry Andric       SectionChunk *sc = dyn_cast<SectionChunk>(d->getChunk());
16070b57cec5SDimitry Andric       if (sc && sc->live &&
16080b57cec5SDimitry Andric           sc->getOutputCharacteristics() & IMAGE_SCN_MEM_EXECUTE)
16090b57cec5SDimitry Andric         addSymbolToRVASet(addressTakenSyms, d);
16100b57cec5SDimitry Andric     }
16110b57cec5SDimitry Andric     break;
16120b57cec5SDimitry Andric   }
16130b57cec5SDimitry Andric   }
16140b57cec5SDimitry Andric }
16150b57cec5SDimitry Andric 
16160b57cec5SDimitry Andric // Visit all relocations from all section contributions of this object file and
16170b57cec5SDimitry Andric // mark the relocation target as address-taken.
16180b57cec5SDimitry Andric static void markSymbolsWithRelocations(ObjFile *file,
16190b57cec5SDimitry Andric                                        SymbolRVASet &usedSymbols) {
16200b57cec5SDimitry Andric   for (Chunk *c : file->getChunks()) {
16210b57cec5SDimitry Andric     // We only care about live section chunks. Common chunks and other chunks
16220b57cec5SDimitry Andric     // don't generally contain relocations.
16230b57cec5SDimitry Andric     SectionChunk *sc = dyn_cast<SectionChunk>(c);
16240b57cec5SDimitry Andric     if (!sc || !sc->live)
16250b57cec5SDimitry Andric       continue;
16260b57cec5SDimitry Andric 
16270b57cec5SDimitry Andric     for (const coff_relocation &reloc : sc->getRelocs()) {
16280b57cec5SDimitry Andric       if (config->machine == I386 && reloc.Type == COFF::IMAGE_REL_I386_REL32)
16290b57cec5SDimitry Andric         // Ignore relative relocations on x86. On x86_64 they can't be ignored
16300b57cec5SDimitry Andric         // since they're also used to compute absolute addresses.
16310b57cec5SDimitry Andric         continue;
16320b57cec5SDimitry Andric 
16330b57cec5SDimitry Andric       Symbol *ref = sc->file->getSymbol(reloc.SymbolTableIndex);
16340b57cec5SDimitry Andric       maybeAddAddressTakenFunction(usedSymbols, ref);
16350b57cec5SDimitry Andric     }
16360b57cec5SDimitry Andric   }
16370b57cec5SDimitry Andric }
16380b57cec5SDimitry Andric 
16390b57cec5SDimitry Andric // Create the guard function id table. This is a table of RVAs of all
16400b57cec5SDimitry Andric // address-taken functions. It is sorted and uniqued, just like the safe SEH
16410b57cec5SDimitry Andric // table.
16420b57cec5SDimitry Andric void Writer::createGuardCFTables() {
16430b57cec5SDimitry Andric   SymbolRVASet addressTakenSyms;
1644e8d8bef9SDimitry Andric   SymbolRVASet giatsRVASet;
1645e8d8bef9SDimitry Andric   std::vector<Symbol *> giatsSymbols;
16460b57cec5SDimitry Andric   SymbolRVASet longJmpTargets;
1647fe6060f1SDimitry Andric   SymbolRVASet ehContTargets;
1648349cc55cSDimitry Andric   for (ObjFile *file : ctx.objFileInstances) {
16490b57cec5SDimitry Andric     // If the object was compiled with /guard:cf, the address taken symbols
1650fe6060f1SDimitry Andric     // are in .gfids$y sections, the longjmp targets are in .gljmp$y sections,
1651fe6060f1SDimitry Andric     // and ehcont targets are in .gehcont$y sections. If the object was not
1652fe6060f1SDimitry Andric     // compiled with /guard:cf, we assume there were no setjmp and ehcont
1653fe6060f1SDimitry Andric     // targets, and that all code symbols with relocations are possibly
1654fe6060f1SDimitry Andric     // address-taken.
16550b57cec5SDimitry Andric     if (file->hasGuardCF()) {
16560b57cec5SDimitry Andric       markSymbolsForRVATable(file, file->getGuardFidChunks(), addressTakenSyms);
1657e8d8bef9SDimitry Andric       markSymbolsForRVATable(file, file->getGuardIATChunks(), giatsRVASet);
1658e8d8bef9SDimitry Andric       getSymbolsFromSections(file, file->getGuardIATChunks(), giatsSymbols);
16590b57cec5SDimitry Andric       markSymbolsForRVATable(file, file->getGuardLJmpChunks(), longJmpTargets);
1660fe6060f1SDimitry Andric       markSymbolsForRVATable(file, file->getGuardEHContChunks(), ehContTargets);
16610b57cec5SDimitry Andric     } else {
16620b57cec5SDimitry Andric       markSymbolsWithRelocations(file, addressTakenSyms);
16630b57cec5SDimitry Andric     }
16640b57cec5SDimitry Andric   }
16650b57cec5SDimitry Andric 
16660b57cec5SDimitry Andric   // Mark the image entry as address-taken.
16670b57cec5SDimitry Andric   if (config->entry)
16680b57cec5SDimitry Andric     maybeAddAddressTakenFunction(addressTakenSyms, config->entry);
16690b57cec5SDimitry Andric 
16700b57cec5SDimitry Andric   // Mark exported symbols in executable sections as address-taken.
16710b57cec5SDimitry Andric   for (Export &e : config->exports)
16720b57cec5SDimitry Andric     maybeAddAddressTakenFunction(addressTakenSyms, e.sym);
16730b57cec5SDimitry Andric 
1674e8d8bef9SDimitry Andric   // For each entry in the .giats table, check if it has a corresponding load
1675e8d8bef9SDimitry Andric   // thunk (e.g. because the DLL that defines it will be delay-loaded) and, if
1676e8d8bef9SDimitry Andric   // so, add the load thunk to the address taken (.gfids) table.
1677e8d8bef9SDimitry Andric   for (Symbol *s : giatsSymbols) {
1678e8d8bef9SDimitry Andric     if (auto *di = dyn_cast<DefinedImportData>(s)) {
1679e8d8bef9SDimitry Andric       if (di->loadThunkSym)
1680e8d8bef9SDimitry Andric         addSymbolToRVASet(addressTakenSyms, di->loadThunkSym);
1681e8d8bef9SDimitry Andric     }
1682e8d8bef9SDimitry Andric   }
1683e8d8bef9SDimitry Andric 
16840b57cec5SDimitry Andric   // Ensure sections referenced in the gfid table are 16-byte aligned.
16850b57cec5SDimitry Andric   for (const ChunkAndOffset &c : addressTakenSyms)
16860b57cec5SDimitry Andric     if (c.inputChunk->getAlignment() < 16)
16870b57cec5SDimitry Andric       c.inputChunk->setAlignment(16);
16880b57cec5SDimitry Andric 
16890b57cec5SDimitry Andric   maybeAddRVATable(std::move(addressTakenSyms), "__guard_fids_table",
16900b57cec5SDimitry Andric                    "__guard_fids_count");
16910b57cec5SDimitry Andric 
1692e8d8bef9SDimitry Andric   // Add the Guard Address Taken IAT Entry Table (.giats).
1693e8d8bef9SDimitry Andric   maybeAddRVATable(std::move(giatsRVASet), "__guard_iat_table",
1694e8d8bef9SDimitry Andric                    "__guard_iat_count");
1695e8d8bef9SDimitry Andric 
16960b57cec5SDimitry Andric   // Add the longjmp target table unless the user told us not to.
1697fe6060f1SDimitry Andric   if (config->guardCF & GuardCFLevel::LongJmp)
16980b57cec5SDimitry Andric     maybeAddRVATable(std::move(longJmpTargets), "__guard_longjmp_table",
16990b57cec5SDimitry Andric                      "__guard_longjmp_count");
17000b57cec5SDimitry Andric 
1701fe6060f1SDimitry Andric   // Add the ehcont target table unless the user told us not to.
1702fe6060f1SDimitry Andric   if (config->guardCF & GuardCFLevel::EHCont)
1703fe6060f1SDimitry Andric     maybeAddRVATable(std::move(ehContTargets), "__guard_eh_cont_table",
1704fe6060f1SDimitry Andric                      "__guard_eh_cont_count", true);
1705fe6060f1SDimitry Andric 
17060b57cec5SDimitry Andric   // Set __guard_flags, which will be used in the load config to indicate that
17070b57cec5SDimitry Andric   // /guard:cf was enabled.
17080b57cec5SDimitry Andric   uint32_t guardFlags = uint32_t(coff_guard_flags::CFInstrumented) |
17090b57cec5SDimitry Andric                         uint32_t(coff_guard_flags::HasFidTable);
1710fe6060f1SDimitry Andric   if (config->guardCF & GuardCFLevel::LongJmp)
17110b57cec5SDimitry Andric     guardFlags |= uint32_t(coff_guard_flags::HasLongJmpTable);
1712fe6060f1SDimitry Andric   if (config->guardCF & GuardCFLevel::EHCont)
1713fe6060f1SDimitry Andric     guardFlags |= uint32_t(coff_guard_flags::HasEHContTable);
1714349cc55cSDimitry Andric   Symbol *flagSym = ctx.symtab.findUnderscore("__guard_flags");
17150b57cec5SDimitry Andric   cast<DefinedAbsolute>(flagSym)->setVA(guardFlags);
17160b57cec5SDimitry Andric }
17170b57cec5SDimitry Andric 
17180b57cec5SDimitry Andric // Take a list of input sections containing symbol table indices and add those
1719e8d8bef9SDimitry Andric // symbols to a vector. The challenge is that symbol RVAs are not known and
17200b57cec5SDimitry Andric // depend on the table size, so we can't directly build a set of integers.
1721e8d8bef9SDimitry Andric void Writer::getSymbolsFromSections(ObjFile *file,
17220b57cec5SDimitry Andric                                     ArrayRef<SectionChunk *> symIdxChunks,
1723e8d8bef9SDimitry Andric                                     std::vector<Symbol *> &symbols) {
17240b57cec5SDimitry Andric   for (SectionChunk *c : symIdxChunks) {
17250b57cec5SDimitry Andric     // Skip sections discarded by linker GC. This comes up when a .gfids section
17260b57cec5SDimitry Andric     // is associated with something like a vtable and the vtable is discarded.
17270b57cec5SDimitry Andric     // In this case, the associated gfids section is discarded, and we don't
17280b57cec5SDimitry Andric     // mark the virtual member functions as address-taken by the vtable.
17290b57cec5SDimitry Andric     if (!c->live)
17300b57cec5SDimitry Andric       continue;
17310b57cec5SDimitry Andric 
17320b57cec5SDimitry Andric     // Validate that the contents look like symbol table indices.
17330b57cec5SDimitry Andric     ArrayRef<uint8_t> data = c->getContents();
17340b57cec5SDimitry Andric     if (data.size() % 4 != 0) {
17350b57cec5SDimitry Andric       warn("ignoring " + c->getSectionName() +
17360b57cec5SDimitry Andric            " symbol table index section in object " + toString(file));
17370b57cec5SDimitry Andric       continue;
17380b57cec5SDimitry Andric     }
17390b57cec5SDimitry Andric 
17400b57cec5SDimitry Andric     // Read each symbol table index and check if that symbol was included in the
1741e8d8bef9SDimitry Andric     // final link. If so, add it to the vector of symbols.
17420b57cec5SDimitry Andric     ArrayRef<ulittle32_t> symIndices(
17430b57cec5SDimitry Andric         reinterpret_cast<const ulittle32_t *>(data.data()), data.size() / 4);
17440b57cec5SDimitry Andric     ArrayRef<Symbol *> objSymbols = file->getSymbols();
17450b57cec5SDimitry Andric     for (uint32_t symIndex : symIndices) {
17460b57cec5SDimitry Andric       if (symIndex >= objSymbols.size()) {
17470b57cec5SDimitry Andric         warn("ignoring invalid symbol table index in section " +
17480b57cec5SDimitry Andric              c->getSectionName() + " in object " + toString(file));
17490b57cec5SDimitry Andric         continue;
17500b57cec5SDimitry Andric       }
17510b57cec5SDimitry Andric       if (Symbol *s = objSymbols[symIndex]) {
17520b57cec5SDimitry Andric         if (s->isLive())
1753e8d8bef9SDimitry Andric           symbols.push_back(cast<Symbol>(s));
1754e8d8bef9SDimitry Andric       }
1755e8d8bef9SDimitry Andric     }
1756e8d8bef9SDimitry Andric   }
1757e8d8bef9SDimitry Andric }
1758e8d8bef9SDimitry Andric 
1759e8d8bef9SDimitry Andric // Take a list of input sections containing symbol table indices and add those
1760e8d8bef9SDimitry Andric // symbols to an RVA table.
1761e8d8bef9SDimitry Andric void Writer::markSymbolsForRVATable(ObjFile *file,
1762e8d8bef9SDimitry Andric                                     ArrayRef<SectionChunk *> symIdxChunks,
1763e8d8bef9SDimitry Andric                                     SymbolRVASet &tableSymbols) {
1764e8d8bef9SDimitry Andric   std::vector<Symbol *> syms;
1765e8d8bef9SDimitry Andric   getSymbolsFromSections(file, symIdxChunks, syms);
1766e8d8bef9SDimitry Andric 
1767e8d8bef9SDimitry Andric   for (Symbol *s : syms)
17680b57cec5SDimitry Andric     addSymbolToRVASet(tableSymbols, cast<Defined>(s));
17690b57cec5SDimitry Andric }
17700b57cec5SDimitry Andric 
17710b57cec5SDimitry Andric // Replace the absolute table symbol with a synthetic symbol pointing to
17720b57cec5SDimitry Andric // tableChunk so that we can emit base relocations for it and resolve section
17730b57cec5SDimitry Andric // relative relocations.
17740b57cec5SDimitry Andric void Writer::maybeAddRVATable(SymbolRVASet tableSymbols, StringRef tableSym,
1775fe6060f1SDimitry Andric                               StringRef countSym, bool hasFlag) {
17760b57cec5SDimitry Andric   if (tableSymbols.empty())
17770b57cec5SDimitry Andric     return;
17780b57cec5SDimitry Andric 
1779fe6060f1SDimitry Andric   NonSectionChunk *tableChunk;
1780fe6060f1SDimitry Andric   if (hasFlag)
1781fe6060f1SDimitry Andric     tableChunk = make<RVAFlagTableChunk>(std::move(tableSymbols));
1782fe6060f1SDimitry Andric   else
1783fe6060f1SDimitry Andric     tableChunk = make<RVATableChunk>(std::move(tableSymbols));
17840b57cec5SDimitry Andric   rdataSec->addChunk(tableChunk);
17850b57cec5SDimitry Andric 
1786349cc55cSDimitry Andric   Symbol *t = ctx.symtab.findUnderscore(tableSym);
1787349cc55cSDimitry Andric   Symbol *c = ctx.symtab.findUnderscore(countSym);
17880b57cec5SDimitry Andric   replaceSymbol<DefinedSynthetic>(t, t->getName(), tableChunk);
1789fe6060f1SDimitry Andric   cast<DefinedAbsolute>(c)->setVA(tableChunk->getSize() / (hasFlag ? 5 : 4));
17900b57cec5SDimitry Andric }
17910b57cec5SDimitry Andric 
17920b57cec5SDimitry Andric // MinGW specific. Gather all relocations that are imported from a DLL even
17930b57cec5SDimitry Andric // though the code didn't expect it to, produce the table that the runtime
17940b57cec5SDimitry Andric // uses for fixing them up, and provide the synthetic symbols that the
17950b57cec5SDimitry Andric // runtime uses for finding the table.
17960b57cec5SDimitry Andric void Writer::createRuntimePseudoRelocs() {
17970b57cec5SDimitry Andric   std::vector<RuntimePseudoReloc> rels;
17980b57cec5SDimitry Andric 
1799349cc55cSDimitry Andric   for (Chunk *c : ctx.symtab.getChunks()) {
18000b57cec5SDimitry Andric     auto *sc = dyn_cast<SectionChunk>(c);
18010b57cec5SDimitry Andric     if (!sc || !sc->live)
18020b57cec5SDimitry Andric       continue;
18030b57cec5SDimitry Andric     sc->getRuntimePseudoRelocs(rels);
18040b57cec5SDimitry Andric   }
18050b57cec5SDimitry Andric 
18065ffd83dbSDimitry Andric   if (!config->pseudoRelocs) {
18075ffd83dbSDimitry Andric     // Not writing any pseudo relocs; if some were needed, error out and
18085ffd83dbSDimitry Andric     // indicate what required them.
18095ffd83dbSDimitry Andric     for (const RuntimePseudoReloc &rpr : rels)
18105ffd83dbSDimitry Andric       error("automatic dllimport of " + rpr.sym->getName() + " in " +
18115ffd83dbSDimitry Andric             toString(rpr.target->file) + " requires pseudo relocations");
18125ffd83dbSDimitry Andric     return;
18135ffd83dbSDimitry Andric   }
18145ffd83dbSDimitry Andric 
18150b57cec5SDimitry Andric   if (!rels.empty())
18160b57cec5SDimitry Andric     log("Writing " + Twine(rels.size()) + " runtime pseudo relocations");
18170b57cec5SDimitry Andric   PseudoRelocTableChunk *table = make<PseudoRelocTableChunk>(rels);
18180b57cec5SDimitry Andric   rdataSec->addChunk(table);
18190b57cec5SDimitry Andric   EmptyChunk *endOfList = make<EmptyChunk>();
18200b57cec5SDimitry Andric   rdataSec->addChunk(endOfList);
18210b57cec5SDimitry Andric 
1822349cc55cSDimitry Andric   Symbol *headSym = ctx.symtab.findUnderscore("__RUNTIME_PSEUDO_RELOC_LIST__");
1823349cc55cSDimitry Andric   Symbol *endSym =
1824349cc55cSDimitry Andric       ctx.symtab.findUnderscore("__RUNTIME_PSEUDO_RELOC_LIST_END__");
18250b57cec5SDimitry Andric   replaceSymbol<DefinedSynthetic>(headSym, headSym->getName(), table);
18260b57cec5SDimitry Andric   replaceSymbol<DefinedSynthetic>(endSym, endSym->getName(), endOfList);
18270b57cec5SDimitry Andric }
18280b57cec5SDimitry Andric 
18290b57cec5SDimitry Andric // MinGW specific.
18300b57cec5SDimitry Andric // The MinGW .ctors and .dtors lists have sentinels at each end;
18310b57cec5SDimitry Andric // a (uintptr_t)-1 at the start and a (uintptr_t)0 at the end.
18320b57cec5SDimitry Andric // There's a symbol pointing to the start sentinel pointer, __CTOR_LIST__
18330b57cec5SDimitry Andric // and __DTOR_LIST__ respectively.
18340b57cec5SDimitry Andric void Writer::insertCtorDtorSymbols() {
18350b57cec5SDimitry Andric   AbsolutePointerChunk *ctorListHead = make<AbsolutePointerChunk>(-1);
18360b57cec5SDimitry Andric   AbsolutePointerChunk *ctorListEnd = make<AbsolutePointerChunk>(0);
18370b57cec5SDimitry Andric   AbsolutePointerChunk *dtorListHead = make<AbsolutePointerChunk>(-1);
18380b57cec5SDimitry Andric   AbsolutePointerChunk *dtorListEnd = make<AbsolutePointerChunk>(0);
18390b57cec5SDimitry Andric   ctorsSec->insertChunkAtStart(ctorListHead);
18400b57cec5SDimitry Andric   ctorsSec->addChunk(ctorListEnd);
18410b57cec5SDimitry Andric   dtorsSec->insertChunkAtStart(dtorListHead);
18420b57cec5SDimitry Andric   dtorsSec->addChunk(dtorListEnd);
18430b57cec5SDimitry Andric 
1844349cc55cSDimitry Andric   Symbol *ctorListSym = ctx.symtab.findUnderscore("__CTOR_LIST__");
1845349cc55cSDimitry Andric   Symbol *dtorListSym = ctx.symtab.findUnderscore("__DTOR_LIST__");
18460b57cec5SDimitry Andric   replaceSymbol<DefinedSynthetic>(ctorListSym, ctorListSym->getName(),
18470b57cec5SDimitry Andric                                   ctorListHead);
18480b57cec5SDimitry Andric   replaceSymbol<DefinedSynthetic>(dtorListSym, dtorListSym->getName(),
18490b57cec5SDimitry Andric                                   dtorListHead);
18500b57cec5SDimitry Andric }
18510b57cec5SDimitry Andric 
18520b57cec5SDimitry Andric // Handles /section options to allow users to overwrite
18530b57cec5SDimitry Andric // section attributes.
18540b57cec5SDimitry Andric void Writer::setSectionPermissions() {
18550b57cec5SDimitry Andric   for (auto &p : config->section) {
18560b57cec5SDimitry Andric     StringRef name = p.first;
18570b57cec5SDimitry Andric     uint32_t perm = p.second;
1858349cc55cSDimitry Andric     for (OutputSection *sec : ctx.outputSections)
18590b57cec5SDimitry Andric       if (sec->name == name)
18600b57cec5SDimitry Andric         sec->setPermissions(perm);
18610b57cec5SDimitry Andric   }
18620b57cec5SDimitry Andric }
18630b57cec5SDimitry Andric 
18640b57cec5SDimitry Andric // Write section contents to a mmap'ed file.
18650b57cec5SDimitry Andric void Writer::writeSections() {
18660b57cec5SDimitry Andric   // Record the number of sections to apply section index relocations
18670b57cec5SDimitry Andric   // against absolute symbols. See applySecIdx in Chunks.cpp..
1868349cc55cSDimitry Andric   DefinedAbsolute::numOutputSections = ctx.outputSections.size();
18690b57cec5SDimitry Andric 
18700b57cec5SDimitry Andric   uint8_t *buf = buffer->getBufferStart();
1871349cc55cSDimitry Andric   for (OutputSection *sec : ctx.outputSections) {
18720b57cec5SDimitry Andric     uint8_t *secBuf = buf + sec->getFileOff();
18730b57cec5SDimitry Andric     // Fill gaps between functions in .text with INT3 instructions
18740b57cec5SDimitry Andric     // instead of leaving as NUL bytes (which can be interpreted as
18750b57cec5SDimitry Andric     // ADD instructions).
18760b57cec5SDimitry Andric     if (sec->header.Characteristics & IMAGE_SCN_CNT_CODE)
18770b57cec5SDimitry Andric       memset(secBuf, 0xCC, sec->getRawSize());
18780b57cec5SDimitry Andric     parallelForEach(sec->chunks, [&](Chunk *c) {
18790b57cec5SDimitry Andric       c->writeTo(secBuf + c->getRVA() - sec->getRVA());
18800b57cec5SDimitry Andric     });
18810b57cec5SDimitry Andric   }
18820b57cec5SDimitry Andric }
18830b57cec5SDimitry Andric 
18840b57cec5SDimitry Andric void Writer::writeBuildId() {
18850b57cec5SDimitry Andric   // There are two important parts to the build ID.
18860b57cec5SDimitry Andric   // 1) If building with debug info, the COFF debug directory contains a
18870b57cec5SDimitry Andric   //    timestamp as well as a Guid and Age of the PDB.
18880b57cec5SDimitry Andric   // 2) In all cases, the PE COFF file header also contains a timestamp.
18890b57cec5SDimitry Andric   // For reproducibility, instead of a timestamp we want to use a hash of the
18900b57cec5SDimitry Andric   // PE contents.
18910b57cec5SDimitry Andric   if (config->debug) {
18920b57cec5SDimitry Andric     assert(buildId && "BuildId is not set!");
18930b57cec5SDimitry Andric     // BuildId->BuildId was filled in when the PDB was written.
18940b57cec5SDimitry Andric   }
18950b57cec5SDimitry Andric 
18960b57cec5SDimitry Andric   // At this point the only fields in the COFF file which remain unset are the
18970b57cec5SDimitry Andric   // "timestamp" in the COFF file header, and the ones in the coff debug
18980b57cec5SDimitry Andric   // directory.  Now we can hash the file and write that hash to the various
18990b57cec5SDimitry Andric   // timestamp fields in the file.
19000b57cec5SDimitry Andric   StringRef outputFileData(
19010b57cec5SDimitry Andric       reinterpret_cast<const char *>(buffer->getBufferStart()),
19020b57cec5SDimitry Andric       buffer->getBufferSize());
19030b57cec5SDimitry Andric 
19040b57cec5SDimitry Andric   uint32_t timestamp = config->timestamp;
19050b57cec5SDimitry Andric   uint64_t hash = 0;
19060b57cec5SDimitry Andric   bool generateSyntheticBuildId =
19070b57cec5SDimitry Andric       config->mingw && config->debug && config->pdbPath.empty();
19080b57cec5SDimitry Andric 
19090b57cec5SDimitry Andric   if (config->repro || generateSyntheticBuildId)
19100b57cec5SDimitry Andric     hash = xxHash64(outputFileData);
19110b57cec5SDimitry Andric 
19120b57cec5SDimitry Andric   if (config->repro)
19130b57cec5SDimitry Andric     timestamp = static_cast<uint32_t>(hash);
19140b57cec5SDimitry Andric 
19150b57cec5SDimitry Andric   if (generateSyntheticBuildId) {
19160b57cec5SDimitry Andric     // For MinGW builds without a PDB file, we still generate a build id
19170b57cec5SDimitry Andric     // to allow associating a crash dump to the executable.
19180b57cec5SDimitry Andric     buildId->buildId->PDB70.CVSignature = OMF::Signature::PDB70;
19190b57cec5SDimitry Andric     buildId->buildId->PDB70.Age = 1;
19200b57cec5SDimitry Andric     memcpy(buildId->buildId->PDB70.Signature, &hash, 8);
19210b57cec5SDimitry Andric     // xxhash only gives us 8 bytes, so put some fixed data in the other half.
19220b57cec5SDimitry Andric     memcpy(&buildId->buildId->PDB70.Signature[8], "LLD PDB.", 8);
19230b57cec5SDimitry Andric   }
19240b57cec5SDimitry Andric 
19250b57cec5SDimitry Andric   if (debugDirectory)
19260b57cec5SDimitry Andric     debugDirectory->setTimeDateStamp(timestamp);
19270b57cec5SDimitry Andric 
19280b57cec5SDimitry Andric   uint8_t *buf = buffer->getBufferStart();
19290b57cec5SDimitry Andric   buf += dosStubSize + sizeof(PEMagic);
19300b57cec5SDimitry Andric   object::coff_file_header *coffHeader =
19310b57cec5SDimitry Andric       reinterpret_cast<coff_file_header *>(buf);
19320b57cec5SDimitry Andric   coffHeader->TimeDateStamp = timestamp;
19330b57cec5SDimitry Andric }
19340b57cec5SDimitry Andric 
19350b57cec5SDimitry Andric // Sort .pdata section contents according to PE/COFF spec 5.5.
19360b57cec5SDimitry Andric void Writer::sortExceptionTable() {
19370b57cec5SDimitry Andric   if (!firstPdata)
19380b57cec5SDimitry Andric     return;
19390b57cec5SDimitry Andric   // We assume .pdata contains function table entries only.
19400b57cec5SDimitry Andric   auto bufAddr = [&](Chunk *c) {
1941349cc55cSDimitry Andric     OutputSection *os = ctx.getOutputSection(c);
19420b57cec5SDimitry Andric     return buffer->getBufferStart() + os->getFileOff() + c->getRVA() -
19430b57cec5SDimitry Andric            os->getRVA();
19440b57cec5SDimitry Andric   };
19450b57cec5SDimitry Andric   uint8_t *begin = bufAddr(firstPdata);
19460b57cec5SDimitry Andric   uint8_t *end = bufAddr(lastPdata) + lastPdata->getSize();
19470b57cec5SDimitry Andric   if (config->machine == AMD64) {
19480b57cec5SDimitry Andric     struct Entry { ulittle32_t begin, end, unwind; };
19495ffd83dbSDimitry Andric     if ((end - begin) % sizeof(Entry) != 0) {
19505ffd83dbSDimitry Andric       fatal("unexpected .pdata size: " + Twine(end - begin) +
19515ffd83dbSDimitry Andric             " is not a multiple of " + Twine(sizeof(Entry)));
19525ffd83dbSDimitry Andric     }
19530b57cec5SDimitry Andric     parallelSort(
19540b57cec5SDimitry Andric         MutableArrayRef<Entry>((Entry *)begin, (Entry *)end),
19550b57cec5SDimitry Andric         [](const Entry &a, const Entry &b) { return a.begin < b.begin; });
19560b57cec5SDimitry Andric     return;
19570b57cec5SDimitry Andric   }
19580b57cec5SDimitry Andric   if (config->machine == ARMNT || config->machine == ARM64) {
19590b57cec5SDimitry Andric     struct Entry { ulittle32_t begin, unwind; };
19605ffd83dbSDimitry Andric     if ((end - begin) % sizeof(Entry) != 0) {
19615ffd83dbSDimitry Andric       fatal("unexpected .pdata size: " + Twine(end - begin) +
19625ffd83dbSDimitry Andric             " is not a multiple of " + Twine(sizeof(Entry)));
19635ffd83dbSDimitry Andric     }
19640b57cec5SDimitry Andric     parallelSort(
19650b57cec5SDimitry Andric         MutableArrayRef<Entry>((Entry *)begin, (Entry *)end),
19660b57cec5SDimitry Andric         [](const Entry &a, const Entry &b) { return a.begin < b.begin; });
19670b57cec5SDimitry Andric     return;
19680b57cec5SDimitry Andric   }
1969480093f4SDimitry Andric   lld::errs() << "warning: don't know how to handle .pdata.\n";
19700b57cec5SDimitry Andric }
19710b57cec5SDimitry Andric 
19720b57cec5SDimitry Andric // The CRT section contains, among other things, the array of function
19730b57cec5SDimitry Andric // pointers that initialize every global variable that is not trivially
19740b57cec5SDimitry Andric // constructed. The CRT calls them one after the other prior to invoking
19750b57cec5SDimitry Andric // main().
19760b57cec5SDimitry Andric //
19770b57cec5SDimitry Andric // As per C++ spec, 3.6.2/2.3,
19780b57cec5SDimitry Andric // "Variables with ordered initialization defined within a single
19790b57cec5SDimitry Andric // translation unit shall be initialized in the order of their definitions
19800b57cec5SDimitry Andric // in the translation unit"
19810b57cec5SDimitry Andric //
19820b57cec5SDimitry Andric // It is therefore critical to sort the chunks containing the function
19830b57cec5SDimitry Andric // pointers in the order that they are listed in the object file (top to
19840b57cec5SDimitry Andric // bottom), otherwise global objects might not be initialized in the
19850b57cec5SDimitry Andric // correct order.
19860b57cec5SDimitry Andric void Writer::sortCRTSectionChunks(std::vector<Chunk *> &chunks) {
19870b57cec5SDimitry Andric   auto sectionChunkOrder = [](const Chunk *a, const Chunk *b) {
19880b57cec5SDimitry Andric     auto sa = dyn_cast<SectionChunk>(a);
19890b57cec5SDimitry Andric     auto sb = dyn_cast<SectionChunk>(b);
19900b57cec5SDimitry Andric     assert(sa && sb && "Non-section chunks in CRT section!");
19910b57cec5SDimitry Andric 
19920b57cec5SDimitry Andric     StringRef sAObj = sa->file->mb.getBufferIdentifier();
19930b57cec5SDimitry Andric     StringRef sBObj = sb->file->mb.getBufferIdentifier();
19940b57cec5SDimitry Andric 
19950b57cec5SDimitry Andric     return sAObj == sBObj && sa->getSectionNumber() < sb->getSectionNumber();
19960b57cec5SDimitry Andric   };
19970b57cec5SDimitry Andric   llvm::stable_sort(chunks, sectionChunkOrder);
19980b57cec5SDimitry Andric 
19990b57cec5SDimitry Andric   if (config->verbose) {
20000b57cec5SDimitry Andric     for (auto &c : chunks) {
20010b57cec5SDimitry Andric       auto sc = dyn_cast<SectionChunk>(c);
20020b57cec5SDimitry Andric       log("  " + sc->file->mb.getBufferIdentifier().str() +
20030b57cec5SDimitry Andric           ", SectionID: " + Twine(sc->getSectionNumber()));
20040b57cec5SDimitry Andric     }
20050b57cec5SDimitry Andric   }
20060b57cec5SDimitry Andric }
20070b57cec5SDimitry Andric 
20080b57cec5SDimitry Andric OutputSection *Writer::findSection(StringRef name) {
2009349cc55cSDimitry Andric   for (OutputSection *sec : ctx.outputSections)
20100b57cec5SDimitry Andric     if (sec->name == name)
20110b57cec5SDimitry Andric       return sec;
20120b57cec5SDimitry Andric   return nullptr;
20130b57cec5SDimitry Andric }
20140b57cec5SDimitry Andric 
20150b57cec5SDimitry Andric uint32_t Writer::getSizeOfInitializedData() {
20160b57cec5SDimitry Andric   uint32_t res = 0;
2017349cc55cSDimitry Andric   for (OutputSection *s : ctx.outputSections)
20180b57cec5SDimitry Andric     if (s->header.Characteristics & IMAGE_SCN_CNT_INITIALIZED_DATA)
20190b57cec5SDimitry Andric       res += s->getRawSize();
20200b57cec5SDimitry Andric   return res;
20210b57cec5SDimitry Andric }
20220b57cec5SDimitry Andric 
20230b57cec5SDimitry Andric // Add base relocations to .reloc section.
20240b57cec5SDimitry Andric void Writer::addBaserels() {
20250b57cec5SDimitry Andric   if (!config->relocatable)
20260b57cec5SDimitry Andric     return;
20270b57cec5SDimitry Andric   relocSec->chunks.clear();
20280b57cec5SDimitry Andric   std::vector<Baserel> v;
2029349cc55cSDimitry Andric   for (OutputSection *sec : ctx.outputSections) {
20300b57cec5SDimitry Andric     if (sec->header.Characteristics & IMAGE_SCN_MEM_DISCARDABLE)
20310b57cec5SDimitry Andric       continue;
20320b57cec5SDimitry Andric     // Collect all locations for base relocations.
20330b57cec5SDimitry Andric     for (Chunk *c : sec->chunks)
20340b57cec5SDimitry Andric       c->getBaserels(&v);
20350b57cec5SDimitry Andric     // Add the addresses to .reloc section.
20360b57cec5SDimitry Andric     if (!v.empty())
20370b57cec5SDimitry Andric       addBaserelBlocks(v);
20380b57cec5SDimitry Andric     v.clear();
20390b57cec5SDimitry Andric   }
20400b57cec5SDimitry Andric }
20410b57cec5SDimitry Andric 
20420b57cec5SDimitry Andric // Add addresses to .reloc section. Note that addresses are grouped by page.
20430b57cec5SDimitry Andric void Writer::addBaserelBlocks(std::vector<Baserel> &v) {
20440b57cec5SDimitry Andric   const uint32_t mask = ~uint32_t(pageSize - 1);
20450b57cec5SDimitry Andric   uint32_t page = v[0].rva & mask;
20460b57cec5SDimitry Andric   size_t i = 0, j = 1;
20470b57cec5SDimitry Andric   for (size_t e = v.size(); j < e; ++j) {
20480b57cec5SDimitry Andric     uint32_t p = v[j].rva & mask;
20490b57cec5SDimitry Andric     if (p == page)
20500b57cec5SDimitry Andric       continue;
20510b57cec5SDimitry Andric     relocSec->addChunk(make<BaserelChunk>(page, &v[i], &v[0] + j));
20520b57cec5SDimitry Andric     i = j;
20530b57cec5SDimitry Andric     page = p;
20540b57cec5SDimitry Andric   }
20550b57cec5SDimitry Andric   if (i == j)
20560b57cec5SDimitry Andric     return;
20570b57cec5SDimitry Andric   relocSec->addChunk(make<BaserelChunk>(page, &v[i], &v[0] + j));
20580b57cec5SDimitry Andric }
20590b57cec5SDimitry Andric 
20600b57cec5SDimitry Andric PartialSection *Writer::createPartialSection(StringRef name,
20610b57cec5SDimitry Andric                                              uint32_t outChars) {
20620b57cec5SDimitry Andric   PartialSection *&pSec = partialSections[{name, outChars}];
20630b57cec5SDimitry Andric   if (pSec)
20640b57cec5SDimitry Andric     return pSec;
20650b57cec5SDimitry Andric   pSec = make<PartialSection>(name, outChars);
20660b57cec5SDimitry Andric   return pSec;
20670b57cec5SDimitry Andric }
20680b57cec5SDimitry Andric 
20690b57cec5SDimitry Andric PartialSection *Writer::findPartialSection(StringRef name, uint32_t outChars) {
20700b57cec5SDimitry Andric   auto it = partialSections.find({name, outChars});
20710b57cec5SDimitry Andric   if (it != partialSections.end())
20720b57cec5SDimitry Andric     return it->second;
20730b57cec5SDimitry Andric   return nullptr;
20740b57cec5SDimitry Andric }
2075e8d8bef9SDimitry Andric 
2076e8d8bef9SDimitry Andric void Writer::fixTlsAlignment() {
2077e8d8bef9SDimitry Andric   Defined *tlsSym =
2078349cc55cSDimitry Andric       dyn_cast_or_null<Defined>(ctx.symtab.findUnderscore("_tls_used"));
2079e8d8bef9SDimitry Andric   if (!tlsSym)
2080e8d8bef9SDimitry Andric     return;
2081e8d8bef9SDimitry Andric 
2082349cc55cSDimitry Andric   OutputSection *sec = ctx.getOutputSection(tlsSym->getChunk());
2083e8d8bef9SDimitry Andric   assert(sec && tlsSym->getRVA() >= sec->getRVA() &&
2084e8d8bef9SDimitry Andric          "no output section for _tls_used");
2085e8d8bef9SDimitry Andric 
2086e8d8bef9SDimitry Andric   uint8_t *secBuf = buffer->getBufferStart() + sec->getFileOff();
2087e8d8bef9SDimitry Andric   uint64_t tlsOffset = tlsSym->getRVA() - sec->getRVA();
2088e8d8bef9SDimitry Andric   uint64_t directorySize = config->is64()
2089e8d8bef9SDimitry Andric                                ? sizeof(object::coff_tls_directory64)
2090e8d8bef9SDimitry Andric                                : sizeof(object::coff_tls_directory32);
2091e8d8bef9SDimitry Andric 
2092e8d8bef9SDimitry Andric   if (tlsOffset + directorySize > sec->getRawSize())
2093e8d8bef9SDimitry Andric     fatal("_tls_used sym is malformed");
2094e8d8bef9SDimitry Andric 
2095e8d8bef9SDimitry Andric   if (config->is64()) {
2096e8d8bef9SDimitry Andric     object::coff_tls_directory64 *tlsDir =
2097e8d8bef9SDimitry Andric         reinterpret_cast<object::coff_tls_directory64 *>(&secBuf[tlsOffset]);
2098e8d8bef9SDimitry Andric     tlsDir->setAlignment(tlsAlignment);
2099e8d8bef9SDimitry Andric   } else {
2100e8d8bef9SDimitry Andric     object::coff_tls_directory32 *tlsDir =
2101e8d8bef9SDimitry Andric         reinterpret_cast<object::coff_tls_directory32 *>(&secBuf[tlsOffset]);
2102e8d8bef9SDimitry Andric     tlsDir->setAlignment(tlsAlignment);
2103e8d8bef9SDimitry Andric   }
2104e8d8bef9SDimitry Andric }
2105