10b57cec5SDimitry Andric //===- Writer.cpp ---------------------------------------------------------===// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric 90b57cec5SDimitry Andric #include "Writer.h" 10349cc55cSDimitry Andric #include "COFFLinkerContext.h" 11e8d8bef9SDimitry Andric #include "CallGraphSort.h" 120b57cec5SDimitry Andric #include "Config.h" 130b57cec5SDimitry Andric #include "DLL.h" 140b57cec5SDimitry Andric #include "InputFiles.h" 155ffd83dbSDimitry Andric #include "LLDMapFile.h" 160b57cec5SDimitry Andric #include "MapFile.h" 170b57cec5SDimitry Andric #include "PDB.h" 180b57cec5SDimitry Andric #include "SymbolTable.h" 190b57cec5SDimitry Andric #include "Symbols.h" 200b57cec5SDimitry Andric #include "lld/Common/ErrorHandler.h" 210b57cec5SDimitry Andric #include "lld/Common/Memory.h" 220b57cec5SDimitry Andric #include "lld/Common/Timer.h" 230b57cec5SDimitry Andric #include "llvm/ADT/DenseMap.h" 240b57cec5SDimitry Andric #include "llvm/ADT/STLExtras.h" 25480093f4SDimitry Andric #include "llvm/ADT/StringSet.h" 26*bdd1243dSDimitry Andric #include "llvm/BinaryFormat/COFF.h" 270b57cec5SDimitry Andric #include "llvm/Support/BinaryStreamReader.h" 280b57cec5SDimitry Andric #include "llvm/Support/Debug.h" 290b57cec5SDimitry Andric #include "llvm/Support/Endian.h" 300b57cec5SDimitry Andric #include "llvm/Support/FileOutputBuffer.h" 310b57cec5SDimitry Andric #include "llvm/Support/Parallel.h" 320b57cec5SDimitry Andric #include "llvm/Support/Path.h" 330b57cec5SDimitry Andric #include "llvm/Support/RandomNumberGenerator.h" 340b57cec5SDimitry Andric #include 
"llvm/Support/xxhash.h" 350b57cec5SDimitry Andric #include <algorithm> 360b57cec5SDimitry Andric #include <cstdio> 370b57cec5SDimitry Andric #include <map> 380b57cec5SDimitry Andric #include <memory> 390b57cec5SDimitry Andric #include <utility> 400b57cec5SDimitry Andric 410b57cec5SDimitry Andric using namespace llvm; 420b57cec5SDimitry Andric using namespace llvm::COFF; 430b57cec5SDimitry Andric using namespace llvm::object; 440b57cec5SDimitry Andric using namespace llvm::support; 450b57cec5SDimitry Andric using namespace llvm::support::endian; 465ffd83dbSDimitry Andric using namespace lld; 475ffd83dbSDimitry Andric using namespace lld::coff; 480b57cec5SDimitry Andric 490b57cec5SDimitry Andric /* To re-generate DOSProgram: 500b57cec5SDimitry Andric $ cat > /tmp/DOSProgram.asm 510b57cec5SDimitry Andric org 0 520b57cec5SDimitry Andric ; Copy cs to ds. 530b57cec5SDimitry Andric push cs 540b57cec5SDimitry Andric pop ds 550b57cec5SDimitry Andric ; Point ds:dx at the $-terminated string. 560b57cec5SDimitry Andric mov dx, str 570b57cec5SDimitry Andric ; Int 21/AH=09h: Write string to standard output. 580b57cec5SDimitry Andric mov ah, 0x9 590b57cec5SDimitry Andric int 0x21 600b57cec5SDimitry Andric ; Int 21/AH=4Ch: Exit with return code (in AL). 
610b57cec5SDimitry Andric mov ax, 0x4C01 620b57cec5SDimitry Andric int 0x21 630b57cec5SDimitry Andric str: 640b57cec5SDimitry Andric db 'This program cannot be run in DOS mode.$' 650b57cec5SDimitry Andric align 8, db 0 660b57cec5SDimitry Andric $ nasm -fbin /tmp/DOSProgram.asm -o /tmp/DOSProgram.bin 670b57cec5SDimitry Andric $ xxd -i /tmp/DOSProgram.bin 680b57cec5SDimitry Andric */ 690b57cec5SDimitry Andric static unsigned char dosProgram[] = { 700b57cec5SDimitry Andric 0x0e, 0x1f, 0xba, 0x0e, 0x00, 0xb4, 0x09, 0xcd, 0x21, 0xb8, 0x01, 0x4c, 710b57cec5SDimitry Andric 0xcd, 0x21, 0x54, 0x68, 0x69, 0x73, 0x20, 0x70, 0x72, 0x6f, 0x67, 0x72, 720b57cec5SDimitry Andric 0x61, 0x6d, 0x20, 0x63, 0x61, 0x6e, 0x6e, 0x6f, 0x74, 0x20, 0x62, 0x65, 730b57cec5SDimitry Andric 0x20, 0x72, 0x75, 0x6e, 0x20, 0x69, 0x6e, 0x20, 0x44, 0x4f, 0x53, 0x20, 740b57cec5SDimitry Andric 0x6d, 0x6f, 0x64, 0x65, 0x2e, 0x24, 0x00, 0x00 750b57cec5SDimitry Andric }; 760b57cec5SDimitry Andric static_assert(sizeof(dosProgram) % 8 == 0, 770b57cec5SDimitry Andric "DOSProgram size must be multiple of 8"); 780b57cec5SDimitry Andric 790b57cec5SDimitry Andric static const int dosStubSize = sizeof(dos_header) + sizeof(dosProgram); 800b57cec5SDimitry Andric static_assert(dosStubSize % 8 == 0, "DOSStub size must be multiple of 8"); 810b57cec5SDimitry Andric 820b57cec5SDimitry Andric static const int numberOfDataDirectory = 16; 830b57cec5SDimitry Andric 840b57cec5SDimitry Andric namespace { 850b57cec5SDimitry Andric 860b57cec5SDimitry Andric class DebugDirectoryChunk : public NonSectionChunk { 870b57cec5SDimitry Andric public: 88*bdd1243dSDimitry Andric DebugDirectoryChunk(const COFFLinkerContext &c, 89349cc55cSDimitry Andric const std::vector<std::pair<COFF::DebugType, Chunk *>> &r, 905ffd83dbSDimitry Andric bool writeRepro) 91349cc55cSDimitry Andric : records(r), writeRepro(writeRepro), ctx(c) {} 920b57cec5SDimitry Andric 930b57cec5SDimitry Andric size_t getSize() const override { 940b57cec5SDimitry Andric 
return (records.size() + int(writeRepro)) * sizeof(debug_directory); 950b57cec5SDimitry Andric } 960b57cec5SDimitry Andric 970b57cec5SDimitry Andric void writeTo(uint8_t *b) const override { 980b57cec5SDimitry Andric auto *d = reinterpret_cast<debug_directory *>(b); 990b57cec5SDimitry Andric 1005ffd83dbSDimitry Andric for (const std::pair<COFF::DebugType, Chunk *>& record : records) { 1015ffd83dbSDimitry Andric Chunk *c = record.second; 102*bdd1243dSDimitry Andric const OutputSection *os = ctx.getOutputSection(c); 1035ffd83dbSDimitry Andric uint64_t offs = os->getFileOff() + (c->getRVA() - os->getRVA()); 1045ffd83dbSDimitry Andric fillEntry(d, record.first, c->getSize(), c->getRVA(), offs); 1050b57cec5SDimitry Andric ++d; 1060b57cec5SDimitry Andric } 1070b57cec5SDimitry Andric 1080b57cec5SDimitry Andric if (writeRepro) { 1090b57cec5SDimitry Andric // FIXME: The COFF spec allows either a 0-sized entry to just say 1100b57cec5SDimitry Andric // "the timestamp field is really a hash", or a 4-byte size field 1110b57cec5SDimitry Andric // followed by that many bytes containing a longer hash (with the 1120b57cec5SDimitry Andric // lowest 4 bytes usually being the timestamp in little-endian order). 1130b57cec5SDimitry Andric // Consider storing the full 8 bytes computed by xxHash64 here. 
1140b57cec5SDimitry Andric fillEntry(d, COFF::IMAGE_DEBUG_TYPE_REPRO, 0, 0, 0); 1150b57cec5SDimitry Andric } 1160b57cec5SDimitry Andric } 1170b57cec5SDimitry Andric 1180b57cec5SDimitry Andric void setTimeDateStamp(uint32_t timeDateStamp) { 1190b57cec5SDimitry Andric for (support::ulittle32_t *tds : timeDateStamps) 1200b57cec5SDimitry Andric *tds = timeDateStamp; 1210b57cec5SDimitry Andric } 1220b57cec5SDimitry Andric 1230b57cec5SDimitry Andric private: 1240b57cec5SDimitry Andric void fillEntry(debug_directory *d, COFF::DebugType debugType, size_t size, 1250b57cec5SDimitry Andric uint64_t rva, uint64_t offs) const { 1260b57cec5SDimitry Andric d->Characteristics = 0; 1270b57cec5SDimitry Andric d->TimeDateStamp = 0; 1280b57cec5SDimitry Andric d->MajorVersion = 0; 1290b57cec5SDimitry Andric d->MinorVersion = 0; 1300b57cec5SDimitry Andric d->Type = debugType; 1310b57cec5SDimitry Andric d->SizeOfData = size; 1320b57cec5SDimitry Andric d->AddressOfRawData = rva; 1330b57cec5SDimitry Andric d->PointerToRawData = offs; 1340b57cec5SDimitry Andric 1350b57cec5SDimitry Andric timeDateStamps.push_back(&d->TimeDateStamp); 1360b57cec5SDimitry Andric } 1370b57cec5SDimitry Andric 1380b57cec5SDimitry Andric mutable std::vector<support::ulittle32_t *> timeDateStamps; 1395ffd83dbSDimitry Andric const std::vector<std::pair<COFF::DebugType, Chunk *>> &records; 1400b57cec5SDimitry Andric bool writeRepro; 141*bdd1243dSDimitry Andric const COFFLinkerContext &ctx; 1420b57cec5SDimitry Andric }; 1430b57cec5SDimitry Andric 1440b57cec5SDimitry Andric class CVDebugRecordChunk : public NonSectionChunk { 1450b57cec5SDimitry Andric public: 146*bdd1243dSDimitry Andric CVDebugRecordChunk(const COFFLinkerContext &c) : ctx(c) {} 147*bdd1243dSDimitry Andric 1480b57cec5SDimitry Andric size_t getSize() const override { 149*bdd1243dSDimitry Andric return sizeof(codeview::DebugInfo) + ctx.config.pdbAltPath.size() + 1; 1500b57cec5SDimitry Andric } 1510b57cec5SDimitry Andric 1520b57cec5SDimitry Andric void 
writeTo(uint8_t *b) const override { 1530b57cec5SDimitry Andric // Save off the DebugInfo entry to backfill the file signature (build id) 1540b57cec5SDimitry Andric // in Writer::writeBuildId 1550b57cec5SDimitry Andric buildId = reinterpret_cast<codeview::DebugInfo *>(b); 1560b57cec5SDimitry Andric 1570b57cec5SDimitry Andric // variable sized field (PDB Path) 1580b57cec5SDimitry Andric char *p = reinterpret_cast<char *>(b + sizeof(*buildId)); 159*bdd1243dSDimitry Andric if (!ctx.config.pdbAltPath.empty()) 160*bdd1243dSDimitry Andric memcpy(p, ctx.config.pdbAltPath.data(), ctx.config.pdbAltPath.size()); 161*bdd1243dSDimitry Andric p[ctx.config.pdbAltPath.size()] = '\0'; 1620b57cec5SDimitry Andric } 1630b57cec5SDimitry Andric 1640b57cec5SDimitry Andric mutable codeview::DebugInfo *buildId = nullptr; 165*bdd1243dSDimitry Andric 166*bdd1243dSDimitry Andric private: 167*bdd1243dSDimitry Andric const COFFLinkerContext &ctx; 1680b57cec5SDimitry Andric }; 1690b57cec5SDimitry Andric 1705ffd83dbSDimitry Andric class ExtendedDllCharacteristicsChunk : public NonSectionChunk { 1715ffd83dbSDimitry Andric public: 1725ffd83dbSDimitry Andric ExtendedDllCharacteristicsChunk(uint32_t c) : characteristics(c) {} 1735ffd83dbSDimitry Andric 1745ffd83dbSDimitry Andric size_t getSize() const override { return 4; } 1755ffd83dbSDimitry Andric 1765ffd83dbSDimitry Andric void writeTo(uint8_t *buf) const override { write32le(buf, characteristics); } 1775ffd83dbSDimitry Andric 1785ffd83dbSDimitry Andric uint32_t characteristics = 0; 1795ffd83dbSDimitry Andric }; 1805ffd83dbSDimitry Andric 1810b57cec5SDimitry Andric // PartialSection represents a group of chunks that contribute to an 1820b57cec5SDimitry Andric // OutputSection. Collating a collection of PartialSections of same name and 1830b57cec5SDimitry Andric // characteristics constitutes the OutputSection. 
1840b57cec5SDimitry Andric class PartialSectionKey { 1850b57cec5SDimitry Andric public: 1860b57cec5SDimitry Andric StringRef name; 1870b57cec5SDimitry Andric unsigned characteristics; 1880b57cec5SDimitry Andric 1890b57cec5SDimitry Andric bool operator<(const PartialSectionKey &other) const { 1900b57cec5SDimitry Andric int c = name.compare(other.name); 191*bdd1243dSDimitry Andric if (c > 0) 1920b57cec5SDimitry Andric return false; 1930b57cec5SDimitry Andric if (c == 0) 1940b57cec5SDimitry Andric return characteristics < other.characteristics; 1950b57cec5SDimitry Andric return true; 1960b57cec5SDimitry Andric } 1970b57cec5SDimitry Andric }; 1980b57cec5SDimitry Andric 1990b57cec5SDimitry Andric // The writer writes a SymbolTable result to a file. 2000b57cec5SDimitry Andric class Writer { 2010b57cec5SDimitry Andric public: 202*bdd1243dSDimitry Andric Writer(COFFLinkerContext &c) 203*bdd1243dSDimitry Andric : buffer(errorHandler().outputBuffer), delayIdata(c), edata(c), ctx(c) {} 2040b57cec5SDimitry Andric void run(); 2050b57cec5SDimitry Andric 2060b57cec5SDimitry Andric private: 2070b57cec5SDimitry Andric void createSections(); 2080b57cec5SDimitry Andric void createMiscChunks(); 2090b57cec5SDimitry Andric void createImportTables(); 2100b57cec5SDimitry Andric void appendImportThunks(); 2110b57cec5SDimitry Andric void locateImportTables(); 2120b57cec5SDimitry Andric void createExportTable(); 2130b57cec5SDimitry Andric void mergeSections(); 2140b57cec5SDimitry Andric void removeUnusedSections(); 2150b57cec5SDimitry Andric void assignAddresses(); 216*bdd1243dSDimitry Andric bool isInRange(uint16_t relType, uint64_t s, uint64_t p, int margin); 217*bdd1243dSDimitry Andric std::pair<Defined *, bool> getThunk(DenseMap<uint64_t, Defined *> &lastThunks, 218*bdd1243dSDimitry Andric Defined *target, uint64_t p, 219*bdd1243dSDimitry Andric uint16_t type, int margin); 220*bdd1243dSDimitry Andric bool createThunks(OutputSection *os, int margin); 221*bdd1243dSDimitry Andric bool 
verifyRanges(const std::vector<Chunk *> chunks); 2220b57cec5SDimitry Andric void finalizeAddresses(); 2230b57cec5SDimitry Andric void removeEmptySections(); 2240b57cec5SDimitry Andric void assignOutputSectionIndices(); 2250b57cec5SDimitry Andric void createSymbolAndStringTable(); 2260b57cec5SDimitry Andric void openFile(StringRef outputPath); 2270b57cec5SDimitry Andric template <typename PEHeaderTy> void writeHeader(); 2280b57cec5SDimitry Andric void createSEHTable(); 2290b57cec5SDimitry Andric void createRuntimePseudoRelocs(); 2300b57cec5SDimitry Andric void insertCtorDtorSymbols(); 231*bdd1243dSDimitry Andric void markSymbolsWithRelocations(ObjFile *file, SymbolRVASet &usedSymbols); 2320b57cec5SDimitry Andric void createGuardCFTables(); 2330b57cec5SDimitry Andric void markSymbolsForRVATable(ObjFile *file, 2340b57cec5SDimitry Andric ArrayRef<SectionChunk *> symIdxChunks, 2350b57cec5SDimitry Andric SymbolRVASet &tableSymbols); 236e8d8bef9SDimitry Andric void getSymbolsFromSections(ObjFile *file, 237e8d8bef9SDimitry Andric ArrayRef<SectionChunk *> symIdxChunks, 238e8d8bef9SDimitry Andric std::vector<Symbol *> &symbols); 2390b57cec5SDimitry Andric void maybeAddRVATable(SymbolRVASet tableSymbols, StringRef tableSym, 240fe6060f1SDimitry Andric StringRef countSym, bool hasFlag=false); 2410b57cec5SDimitry Andric void setSectionPermissions(); 2420b57cec5SDimitry Andric void writeSections(); 2430b57cec5SDimitry Andric void writeBuildId(); 244*bdd1243dSDimitry Andric void writePEChecksum(); 245e8d8bef9SDimitry Andric void sortSections(); 2460b57cec5SDimitry Andric void sortExceptionTable(); 2470b57cec5SDimitry Andric void sortCRTSectionChunks(std::vector<Chunk *> &chunks); 2480b57cec5SDimitry Andric void addSyntheticIdata(); 249*bdd1243dSDimitry Andric void sortBySectionOrder(std::vector<Chunk *> &chunks); 2500b57cec5SDimitry Andric void fixPartialSectionChars(StringRef name, uint32_t chars); 2510b57cec5SDimitry Andric bool fixGnuImportChunks(); 252e8d8bef9SDimitry Andric 
void fixTlsAlignment(); 2530b57cec5SDimitry Andric PartialSection *createPartialSection(StringRef name, uint32_t outChars); 2540b57cec5SDimitry Andric PartialSection *findPartialSection(StringRef name, uint32_t outChars); 2550b57cec5SDimitry Andric 256*bdd1243dSDimitry Andric std::optional<coff_symbol16> createSymbol(Defined *d); 2570b57cec5SDimitry Andric size_t addEntryToStringTable(StringRef str); 2580b57cec5SDimitry Andric 2590b57cec5SDimitry Andric OutputSection *findSection(StringRef name); 2600b57cec5SDimitry Andric void addBaserels(); 2610b57cec5SDimitry Andric void addBaserelBlocks(std::vector<Baserel> &v); 2620b57cec5SDimitry Andric 2630b57cec5SDimitry Andric uint32_t getSizeOfInitializedData(); 2640b57cec5SDimitry Andric 265*bdd1243dSDimitry Andric void checkLoadConfig(); 266*bdd1243dSDimitry Andric template <typename T> void checkLoadConfigGuardData(const T *loadConfig); 267*bdd1243dSDimitry Andric 2680b57cec5SDimitry Andric std::unique_ptr<FileOutputBuffer> &buffer; 2690b57cec5SDimitry Andric std::map<PartialSectionKey, PartialSection *> partialSections; 2700b57cec5SDimitry Andric std::vector<char> strtab; 2710b57cec5SDimitry Andric std::vector<llvm::object::coff_symbol16> outputSymtab; 2720b57cec5SDimitry Andric IdataContents idata; 2730b57cec5SDimitry Andric Chunk *importTableStart = nullptr; 2740b57cec5SDimitry Andric uint64_t importTableSize = 0; 27585868e8aSDimitry Andric Chunk *edataStart = nullptr; 27685868e8aSDimitry Andric Chunk *edataEnd = nullptr; 2770b57cec5SDimitry Andric Chunk *iatStart = nullptr; 2780b57cec5SDimitry Andric uint64_t iatSize = 0; 2790b57cec5SDimitry Andric DelayLoadContents delayIdata; 2800b57cec5SDimitry Andric EdataContents edata; 2810b57cec5SDimitry Andric bool setNoSEHCharacteristic = false; 282e8d8bef9SDimitry Andric uint32_t tlsAlignment = 0; 2830b57cec5SDimitry Andric 2840b57cec5SDimitry Andric DebugDirectoryChunk *debugDirectory = nullptr; 2855ffd83dbSDimitry Andric std::vector<std::pair<COFF::DebugType, Chunk *>> 
debugRecords; 2860b57cec5SDimitry Andric CVDebugRecordChunk *buildId = nullptr; 2870b57cec5SDimitry Andric ArrayRef<uint8_t> sectionTable; 2880b57cec5SDimitry Andric 2890b57cec5SDimitry Andric uint64_t fileSize; 2900b57cec5SDimitry Andric uint32_t pointerToSymbolTable = 0; 2910b57cec5SDimitry Andric uint64_t sizeOfImage; 2920b57cec5SDimitry Andric uint64_t sizeOfHeaders; 2930b57cec5SDimitry Andric 2940b57cec5SDimitry Andric OutputSection *textSec; 2950b57cec5SDimitry Andric OutputSection *rdataSec; 2960b57cec5SDimitry Andric OutputSection *buildidSec; 2970b57cec5SDimitry Andric OutputSection *dataSec; 2980b57cec5SDimitry Andric OutputSection *pdataSec; 2990b57cec5SDimitry Andric OutputSection *idataSec; 3000b57cec5SDimitry Andric OutputSection *edataSec; 3010b57cec5SDimitry Andric OutputSection *didatSec; 3020b57cec5SDimitry Andric OutputSection *rsrcSec; 3030b57cec5SDimitry Andric OutputSection *relocSec; 3040b57cec5SDimitry Andric OutputSection *ctorsSec; 3050b57cec5SDimitry Andric OutputSection *dtorsSec; 3060b57cec5SDimitry Andric 3070b57cec5SDimitry Andric // The first and last .pdata sections in the output file. 3080b57cec5SDimitry Andric // 3090b57cec5SDimitry Andric // We need to keep track of the location of .pdata in whichever section it 3100b57cec5SDimitry Andric // gets merged into so that we can sort its contents and emit a correct data 3110b57cec5SDimitry Andric // directory entry for the exception table. This is also the case for some 3120b57cec5SDimitry Andric // other sections (such as .edata) but because the contents of those sections 3130b57cec5SDimitry Andric // are entirely linker-generated we can keep track of their locations using 3140b57cec5SDimitry Andric // the chunks that the linker creates. All .pdata chunks come from input 3150b57cec5SDimitry Andric // files, so we need to keep track of them separately. 
3160b57cec5SDimitry Andric Chunk *firstPdata = nullptr; 3170b57cec5SDimitry Andric Chunk *lastPdata; 318349cc55cSDimitry Andric 319349cc55cSDimitry Andric COFFLinkerContext &ctx; 3200b57cec5SDimitry Andric }; 3210b57cec5SDimitry Andric } // anonymous namespace 3220b57cec5SDimitry Andric 323349cc55cSDimitry Andric void lld::coff::writeResult(COFFLinkerContext &ctx) { Writer(ctx).run(); } 3240b57cec5SDimitry Andric 3250b57cec5SDimitry Andric void OutputSection::addChunk(Chunk *c) { 3260b57cec5SDimitry Andric chunks.push_back(c); 3270b57cec5SDimitry Andric } 3280b57cec5SDimitry Andric 3290b57cec5SDimitry Andric void OutputSection::insertChunkAtStart(Chunk *c) { 3300b57cec5SDimitry Andric chunks.insert(chunks.begin(), c); 3310b57cec5SDimitry Andric } 3320b57cec5SDimitry Andric 3330b57cec5SDimitry Andric void OutputSection::setPermissions(uint32_t c) { 3340b57cec5SDimitry Andric header.Characteristics &= ~permMask; 3350b57cec5SDimitry Andric header.Characteristics |= c; 3360b57cec5SDimitry Andric } 3370b57cec5SDimitry Andric 3380b57cec5SDimitry Andric void OutputSection::merge(OutputSection *other) { 3390b57cec5SDimitry Andric chunks.insert(chunks.end(), other->chunks.begin(), other->chunks.end()); 3400b57cec5SDimitry Andric other->chunks.clear(); 3410b57cec5SDimitry Andric contribSections.insert(contribSections.end(), other->contribSections.begin(), 3420b57cec5SDimitry Andric other->contribSections.end()); 3430b57cec5SDimitry Andric other->contribSections.clear(); 3440b57cec5SDimitry Andric } 3450b57cec5SDimitry Andric 3460b57cec5SDimitry Andric // Write the section header to a given buffer. 347*bdd1243dSDimitry Andric void OutputSection::writeHeaderTo(uint8_t *buf, bool isDebug) { 3480b57cec5SDimitry Andric auto *hdr = reinterpret_cast<coff_section *>(buf); 3490b57cec5SDimitry Andric *hdr = header; 3500b57cec5SDimitry Andric if (stringTableOff) { 3510b57cec5SDimitry Andric // If name is too long, write offset into the string table as a name. 
35281ad6265SDimitry Andric encodeSectionName(hdr->Name, stringTableOff); 3530b57cec5SDimitry Andric } else { 354*bdd1243dSDimitry Andric assert(!isDebug || name.size() <= COFF::NameSize || 3550b57cec5SDimitry Andric (hdr->Characteristics & IMAGE_SCN_MEM_DISCARDABLE) == 0); 3560b57cec5SDimitry Andric strncpy(hdr->Name, name.data(), 3570b57cec5SDimitry Andric std::min(name.size(), (size_t)COFF::NameSize)); 3580b57cec5SDimitry Andric } 3590b57cec5SDimitry Andric } 3600b57cec5SDimitry Andric 3610b57cec5SDimitry Andric void OutputSection::addContributingPartialSection(PartialSection *sec) { 3620b57cec5SDimitry Andric contribSections.push_back(sec); 3630b57cec5SDimitry Andric } 3640b57cec5SDimitry Andric 3650b57cec5SDimitry Andric // Check whether the target address S is in range from a relocation 3660b57cec5SDimitry Andric // of type relType at address P. 367*bdd1243dSDimitry Andric bool Writer::isInRange(uint16_t relType, uint64_t s, uint64_t p, int margin) { 368*bdd1243dSDimitry Andric if (ctx.config.machine == ARMNT) { 3690b57cec5SDimitry Andric int64_t diff = AbsoluteDifference(s, p + 4) + margin; 3700b57cec5SDimitry Andric switch (relType) { 3710b57cec5SDimitry Andric case IMAGE_REL_ARM_BRANCH20T: 3720b57cec5SDimitry Andric return isInt<21>(diff); 3730b57cec5SDimitry Andric case IMAGE_REL_ARM_BRANCH24T: 3740b57cec5SDimitry Andric case IMAGE_REL_ARM_BLX23T: 3750b57cec5SDimitry Andric return isInt<25>(diff); 3760b57cec5SDimitry Andric default: 3770b57cec5SDimitry Andric return true; 3780b57cec5SDimitry Andric } 379*bdd1243dSDimitry Andric } else if (ctx.config.machine == ARM64) { 3800b57cec5SDimitry Andric int64_t diff = AbsoluteDifference(s, p) + margin; 3810b57cec5SDimitry Andric switch (relType) { 3820b57cec5SDimitry Andric case IMAGE_REL_ARM64_BRANCH26: 3830b57cec5SDimitry Andric return isInt<28>(diff); 3840b57cec5SDimitry Andric case IMAGE_REL_ARM64_BRANCH19: 3850b57cec5SDimitry Andric return isInt<21>(diff); 3860b57cec5SDimitry Andric case 
IMAGE_REL_ARM64_BRANCH14: 3870b57cec5SDimitry Andric return isInt<16>(diff); 3880b57cec5SDimitry Andric default: 3890b57cec5SDimitry Andric return true; 3900b57cec5SDimitry Andric } 3910b57cec5SDimitry Andric } else { 3920b57cec5SDimitry Andric llvm_unreachable("Unexpected architecture"); 3930b57cec5SDimitry Andric } 3940b57cec5SDimitry Andric } 3950b57cec5SDimitry Andric 3960b57cec5SDimitry Andric // Return the last thunk for the given target if it is in range, 3970b57cec5SDimitry Andric // or create a new one. 398*bdd1243dSDimitry Andric std::pair<Defined *, bool> 399*bdd1243dSDimitry Andric Writer::getThunk(DenseMap<uint64_t, Defined *> &lastThunks, Defined *target, 400*bdd1243dSDimitry Andric uint64_t p, uint16_t type, int margin) { 4010b57cec5SDimitry Andric Defined *&lastThunk = lastThunks[target->getRVA()]; 4020b57cec5SDimitry Andric if (lastThunk && isInRange(type, lastThunk->getRVA(), p, margin)) 4030b57cec5SDimitry Andric return {lastThunk, false}; 4040b57cec5SDimitry Andric Chunk *c; 405*bdd1243dSDimitry Andric switch (ctx.config.machine) { 4060b57cec5SDimitry Andric case ARMNT: 407*bdd1243dSDimitry Andric c = make<RangeExtensionThunkARM>(ctx, target); 4080b57cec5SDimitry Andric break; 4090b57cec5SDimitry Andric case ARM64: 410*bdd1243dSDimitry Andric c = make<RangeExtensionThunkARM64>(ctx, target); 4110b57cec5SDimitry Andric break; 4120b57cec5SDimitry Andric default: 4130b57cec5SDimitry Andric llvm_unreachable("Unexpected architecture"); 4140b57cec5SDimitry Andric } 4156246ae0bSDimitry Andric Defined *d = make<DefinedSynthetic>("range_extension_thunk", c); 4160b57cec5SDimitry Andric lastThunk = d; 4170b57cec5SDimitry Andric return {d, true}; 4180b57cec5SDimitry Andric } 4190b57cec5SDimitry Andric 4200b57cec5SDimitry Andric // This checks all relocations, and for any relocation which isn't in range 4210b57cec5SDimitry Andric // it adds a thunk after the section chunk that contains the relocation. 
4220b57cec5SDimitry Andric // If the latest thunk for the specific target is in range, that is used 4230b57cec5SDimitry Andric // instead of creating a new thunk. All range checks are done with the 4240b57cec5SDimitry Andric // specified margin, to make sure that relocations that originally are in 4250b57cec5SDimitry Andric // range, but only barely, also get thunks - in case other added thunks makes 4260b57cec5SDimitry Andric // the target go out of range. 4270b57cec5SDimitry Andric // 4280b57cec5SDimitry Andric // After adding thunks, we verify that all relocations are in range (with 4290b57cec5SDimitry Andric // no extra margin requirements). If this failed, we restart (throwing away 4300b57cec5SDimitry Andric // the previously created thunks) and retry with a wider margin. 431*bdd1243dSDimitry Andric bool Writer::createThunks(OutputSection *os, int margin) { 4320b57cec5SDimitry Andric bool addressesChanged = false; 4330b57cec5SDimitry Andric DenseMap<uint64_t, Defined *> lastThunks; 4340b57cec5SDimitry Andric DenseMap<std::pair<ObjFile *, Defined *>, uint32_t> thunkSymtabIndices; 4350b57cec5SDimitry Andric size_t thunksSize = 0; 4360b57cec5SDimitry Andric // Recheck Chunks.size() each iteration, since we can insert more 4370b57cec5SDimitry Andric // elements into it. 4380b57cec5SDimitry Andric for (size_t i = 0; i != os->chunks.size(); ++i) { 4390b57cec5SDimitry Andric SectionChunk *sc = dyn_cast_or_null<SectionChunk>(os->chunks[i]); 4400b57cec5SDimitry Andric if (!sc) 4410b57cec5SDimitry Andric continue; 4420b57cec5SDimitry Andric size_t thunkInsertionSpot = i + 1; 4430b57cec5SDimitry Andric 4440b57cec5SDimitry Andric // Try to get a good enough estimate of where new thunks will be placed. 4450b57cec5SDimitry Andric // Offset this by the size of the new thunks added so far, to make the 4460b57cec5SDimitry Andric // estimate slightly better. 
4470b57cec5SDimitry Andric size_t thunkInsertionRVA = sc->getRVA() + sc->getSize() + thunksSize; 4480b57cec5SDimitry Andric ObjFile *file = sc->file; 4490b57cec5SDimitry Andric std::vector<std::pair<uint32_t, uint32_t>> relocReplacements; 4500b57cec5SDimitry Andric ArrayRef<coff_relocation> originalRelocs = 4510b57cec5SDimitry Andric file->getCOFFObj()->getRelocations(sc->header); 4520b57cec5SDimitry Andric for (size_t j = 0, e = originalRelocs.size(); j < e; ++j) { 4530b57cec5SDimitry Andric const coff_relocation &rel = originalRelocs[j]; 4540b57cec5SDimitry Andric Symbol *relocTarget = file->getSymbol(rel.SymbolTableIndex); 4550b57cec5SDimitry Andric 4560b57cec5SDimitry Andric // The estimate of the source address P should be pretty accurate, 4570b57cec5SDimitry Andric // but we don't know whether the target Symbol address should be 4580b57cec5SDimitry Andric // offset by thunksSize or not (or by some of thunksSize but not all of 4590b57cec5SDimitry Andric // it), giving us some uncertainty once we have added one thunk. 4600b57cec5SDimitry Andric uint64_t p = sc->getRVA() + rel.VirtualAddress + thunksSize; 4610b57cec5SDimitry Andric 4620b57cec5SDimitry Andric Defined *sym = dyn_cast_or_null<Defined>(relocTarget); 4630b57cec5SDimitry Andric if (!sym) 4640b57cec5SDimitry Andric continue; 4650b57cec5SDimitry Andric 4660b57cec5SDimitry Andric uint64_t s = sym->getRVA(); 4670b57cec5SDimitry Andric 4680b57cec5SDimitry Andric if (isInRange(rel.Type, s, p, margin)) 4690b57cec5SDimitry Andric continue; 4700b57cec5SDimitry Andric 471*bdd1243dSDimitry Andric // If the target isn't in range, hook it up to an existing or new thunk. 472*bdd1243dSDimitry Andric auto [thunk, wasNew] = getThunk(lastThunks, sym, p, rel.Type, margin); 4730b57cec5SDimitry Andric if (wasNew) { 4740b57cec5SDimitry Andric Chunk *thunkChunk = thunk->getChunk(); 4750b57cec5SDimitry Andric thunkChunk->setRVA( 4760b57cec5SDimitry Andric thunkInsertionRVA); // Estimate of where it will be located. 
4770b57cec5SDimitry Andric os->chunks.insert(os->chunks.begin() + thunkInsertionSpot, thunkChunk); 4780b57cec5SDimitry Andric thunkInsertionSpot++; 4790b57cec5SDimitry Andric thunksSize += thunkChunk->getSize(); 4800b57cec5SDimitry Andric thunkInsertionRVA += thunkChunk->getSize(); 4810b57cec5SDimitry Andric addressesChanged = true; 4820b57cec5SDimitry Andric } 4830b57cec5SDimitry Andric 4840b57cec5SDimitry Andric // To redirect the relocation, add a symbol to the parent object file's 4850b57cec5SDimitry Andric // symbol table, and replace the relocation symbol table index with the 4860b57cec5SDimitry Andric // new index. 4870b57cec5SDimitry Andric auto insertion = thunkSymtabIndices.insert({{file, thunk}, ~0U}); 4880b57cec5SDimitry Andric uint32_t &thunkSymbolIndex = insertion.first->second; 4890b57cec5SDimitry Andric if (insertion.second) 4900b57cec5SDimitry Andric thunkSymbolIndex = file->addRangeThunkSymbol(thunk); 4910b57cec5SDimitry Andric relocReplacements.push_back({j, thunkSymbolIndex}); 4920b57cec5SDimitry Andric } 4930b57cec5SDimitry Andric 4940b57cec5SDimitry Andric // Get a writable copy of this section's relocations so they can be 4950b57cec5SDimitry Andric // modified. If the relocations point into the object file, allocate new 4960b57cec5SDimitry Andric // memory. Otherwise, this must be previously allocated memory that can be 4970b57cec5SDimitry Andric // modified in place. 
4980b57cec5SDimitry Andric ArrayRef<coff_relocation> curRelocs = sc->getRelocs(); 4990b57cec5SDimitry Andric MutableArrayRef<coff_relocation> newRelocs; 5000b57cec5SDimitry Andric if (originalRelocs.data() == curRelocs.data()) { 501*bdd1243dSDimitry Andric newRelocs = MutableArrayRef( 50204eeddc0SDimitry Andric bAlloc().Allocate<coff_relocation>(originalRelocs.size()), 5030b57cec5SDimitry Andric originalRelocs.size()); 5040b57cec5SDimitry Andric } else { 505*bdd1243dSDimitry Andric newRelocs = MutableArrayRef( 5060b57cec5SDimitry Andric const_cast<coff_relocation *>(curRelocs.data()), curRelocs.size()); 5070b57cec5SDimitry Andric } 5080b57cec5SDimitry Andric 5090b57cec5SDimitry Andric // Copy each relocation, but replace the symbol table indices which need 5100b57cec5SDimitry Andric // thunks. 5110b57cec5SDimitry Andric auto nextReplacement = relocReplacements.begin(); 5120b57cec5SDimitry Andric auto endReplacement = relocReplacements.end(); 5130b57cec5SDimitry Andric for (size_t i = 0, e = originalRelocs.size(); i != e; ++i) { 5140b57cec5SDimitry Andric newRelocs[i] = originalRelocs[i]; 5150b57cec5SDimitry Andric if (nextReplacement != endReplacement && nextReplacement->first == i) { 5160b57cec5SDimitry Andric newRelocs[i].SymbolTableIndex = nextReplacement->second; 5170b57cec5SDimitry Andric ++nextReplacement; 5180b57cec5SDimitry Andric } 5190b57cec5SDimitry Andric } 5200b57cec5SDimitry Andric 5210b57cec5SDimitry Andric sc->setRelocs(newRelocs); 5220b57cec5SDimitry Andric } 5230b57cec5SDimitry Andric return addressesChanged; 5240b57cec5SDimitry Andric } 5250b57cec5SDimitry Andric 5260b57cec5SDimitry Andric // Verify that all relocations are in range, with no extra margin requirements. 
527*bdd1243dSDimitry Andric bool Writer::verifyRanges(const std::vector<Chunk *> chunks) { 5280b57cec5SDimitry Andric for (Chunk *c : chunks) { 5290b57cec5SDimitry Andric SectionChunk *sc = dyn_cast_or_null<SectionChunk>(c); 5300b57cec5SDimitry Andric if (!sc) 5310b57cec5SDimitry Andric continue; 5320b57cec5SDimitry Andric 5330b57cec5SDimitry Andric ArrayRef<coff_relocation> relocs = sc->getRelocs(); 5340b57cec5SDimitry Andric for (size_t j = 0, e = relocs.size(); j < e; ++j) { 5350b57cec5SDimitry Andric const coff_relocation &rel = relocs[j]; 5360b57cec5SDimitry Andric Symbol *relocTarget = sc->file->getSymbol(rel.SymbolTableIndex); 5370b57cec5SDimitry Andric 5380b57cec5SDimitry Andric Defined *sym = dyn_cast_or_null<Defined>(relocTarget); 5390b57cec5SDimitry Andric if (!sym) 5400b57cec5SDimitry Andric continue; 5410b57cec5SDimitry Andric 5420b57cec5SDimitry Andric uint64_t p = sc->getRVA() + rel.VirtualAddress; 5430b57cec5SDimitry Andric uint64_t s = sym->getRVA(); 5440b57cec5SDimitry Andric 5450b57cec5SDimitry Andric if (!isInRange(rel.Type, s, p, 0)) 5460b57cec5SDimitry Andric return false; 5470b57cec5SDimitry Andric } 5480b57cec5SDimitry Andric } 5490b57cec5SDimitry Andric return true; 5500b57cec5SDimitry Andric } 5510b57cec5SDimitry Andric 5520b57cec5SDimitry Andric // Assign addresses and add thunks if necessary. 
// Addresses are always assigned once. Range-extension thunks are only
// considered when ctx.config.machine is ARMNT or ARM64; for every other
// machine the function returns right after the first layout.
//
// The thunk loop alternates between verifying all relocations with zero
// margin and (re)creating thunks with a safety margin. The margin starts at
// 1024 * 100 and is doubled on every retry; the link is aborted with fatal()
// once ten passes have been made without all ranges verifying.
void Writer::finalizeAddresses() {
  assignAddresses();
  if (ctx.config.machine != ARMNT && ctx.config.machine != ARM64)
    return;

  // Snapshot the thunk-free chunk lists so that a failed pass can be undone,
  // and remember the chunk count for the log message below.
  size_t origNumChunks = 0;
  for (OutputSection *sec : ctx.outputSections) {
    sec->origChunks = sec->chunks;
    origNumChunks += sec->chunks.size();
  }

  int pass = 0;
  int margin = 1024 * 100;
  while (true) {
    // First check whether we need thunks at all, or if the previous pass of
    // adding them turned out ok.
    bool rangesOk = true;
    size_t numChunks = 0;
    for (OutputSection *sec : ctx.outputSections) {
      if (!verifyRanges(sec->chunks)) {
        rangesOk = false;
        break;
      }
      numChunks += sec->chunks.size();
    }
    if (rangesOk) {
      // numChunks is only complete (and only used) when every section
      // verified, since the loop above breaks on the first failure.
      if (pass > 0)
        log("Added " + Twine(numChunks - origNumChunks) + " thunks with " +
            "margin " + Twine(margin) + " in " + Twine(pass) + " passes");
      return;
    }

    if (pass >= 10)
      fatal("adding thunks hasn't converged after " + Twine(pass) + " passes");

    if (pass > 0) {
      // If the previous pass didn't work out, reset everything back to the
      // original conditions before retrying with a wider margin. This should
      // ideally never happen under real circumstances.
      for (OutputSection *sec : ctx.outputSections)
        sec->chunks = sec->origChunks;
      margin *= 2;
    }

    // Try adding thunks everywhere where it is needed, with a margin
    // to avoid things going out of range due to the added thunks.
    bool addressesChanged = false;
    for (OutputSection *sec : ctx.outputSections)
      addressesChanged |= createThunks(sec, margin);
    // If the verification above thought we needed thunks, we should have
    // added some.
    assert(addressesChanged);
    // Keeps the variable "used" when assert() compiles to nothing.
    (void)addressesChanged;

    // Recalculate the layout for the whole image (and verify the ranges at
    // the start of the next round).
    assignAddresses();

    pass++;
  }
}

// Computes a checksum over the whole output buffer and stores it in the
// CheckSum field of the PE header. Does nothing unless
// ctx.config.writeCheckSum is set.
//
// The checksum is the sum of all little-endian 16-bit words of the buffer
// (plus a trailing odd byte, if any), folded down to 16 bits, with the buffer
// size added afterwards.
void Writer::writePEChecksum() {
  if (!ctx.config.writeCheckSum) {
    return;
  }

  // https://docs.microsoft.com/en-us/windows/win32/debug/pe-format#checksum
  uint32_t *buf = (uint32_t *)buffer->getBufferStart();
  uint32_t size = (uint32_t)(buffer->getBufferSize());

  // The COFF file header is located after the DOS stub and the PE magic; the
  // PE header follows immediately after the COFF file header.
  // NOTE(review): pe32_header is used here even when run() wrote a
  // pe32plus_header - presumably CheckSum sits at the same offset in both
  // layouts; confirm.
  coff_file_header *coffHeader =
      (coff_file_header *)((uint8_t *)buf + dosStubSize + sizeof(PEMagic));
  pe32_header *peHeader =
      (pe32_header *)((uint8_t *)coffHeader + sizeof(coff_file_header));

  uint64_t sum = 0;
  uint32_t count = size;
  ulittle16_t *addr = (ulittle16_t *)buf;

  // The PE checksum algorithm, implemented as suggested in RFC1071
  // NOTE(review): the words summed include the current contents of the
  // CheckSum field itself - presumably still zero at this point; confirm.
  while (count > 1) {
    sum += *addr++;
    count -= 2;
  }

  // Add left-over byte, if any
  if (count > 0)
    sum += *(unsigned char *)addr;

  // Fold 32-bit sum to 16 bits
  while (sum >> 16) {
    sum = (sum & 0xffff) + (sum >> 16);
  }

  sum += size;
  peHeader->CheckSum = sum;
}

// The main function of the writer.
//
// Runs the layout steps in order, rejects images whose fileSize exceeds
// UINT32_MAX, opens the output buffer, writes headers and sections, applies
// the post-write fixups, optionally creates the PDB, writes the build id, map
// files and PE checksum, and finally commits the buffer. The commit is
// skipped if any error has been reported by then.
void Writer::run() {
  // t1 covers everything up to (and excluding) PDB creation.
  ScopedTimer t1(ctx.codeLayoutTimer);

  createImportTables();
  createSections();
  appendImportThunks();
  // Import thunks must be added before the Control Flow Guard tables are added.
  createMiscChunks();
  createExportTable();
  mergeSections();
  removeUnusedSections();
  finalizeAddresses();
  removeEmptySections();
  assignOutputSectionIndices();
  setSectionPermissions();
  createSymbolAndStringTable();

  if (fileSize > UINT32_MAX)
    fatal("image size (" + Twine(fileSize) + ") " +
          "exceeds maximum allowable size (" + Twine(UINT32_MAX) + ")");

  openFile(ctx.config.outputFile);
  // Pick the header layout matching the target's bitness.
  if (ctx.config.is64()) {
    writeHeader<pe32plus_header>();
  } else {
    writeHeader<pe32_header>();
  }
  writeSections();
  checkLoadConfig();
  sortExceptionTable();

  // Fix up the alignment in the TLS Directory's characteristic field,
  // if a specific alignment value is needed
  if (tlsAlignment)
    fixTlsAlignment();

  t1.stop();

  // A PDB is only produced when both a PDB path and debug output were
  // requested.
  if (!ctx.config.pdbPath.empty() && ctx.config.debug) {
    assert(buildId);
    createPDB(ctx, sectionTable, buildId->buildId);
  }
  writeBuildId();

  writeLLDMapFile(ctx);
  writeMapFile(ctx);

  // Runs after all other writes to the buffer made by this function.
  writePEChecksum();

  if (errorCount())
    return;

  ScopedTimer t2(ctx.outputCommitTimer);
  if (auto e = buffer->commit())
    fatal("failed to write output '" + buffer->getPath() +
          "': " + toString(std::move(e)));
}

// Maps an input section name to the name of the output section it belongs to:
// everything from the first '$' onwards is dropped, and the remainder is cut
// at the first '.' found at index 1 or later (so a leading '.' is kept).
static StringRef getOutputSectionName(StringRef name) {
  StringRef s = name.split('$').first;

  // Treat a later period as a separator for MinGW, for sections like
  // ".ctors.01234".
  return s.substr(0, s.find('.', 1));
}

// For /order.
720*bdd1243dSDimitry Andric void Writer::sortBySectionOrder(std::vector<Chunk *> &chunks) { 721*bdd1243dSDimitry Andric auto getPriority = [&ctx = ctx](const Chunk *c) { 7220b57cec5SDimitry Andric if (auto *sec = dyn_cast<SectionChunk>(c)) 7230b57cec5SDimitry Andric if (sec->sym) 724*bdd1243dSDimitry Andric return ctx.config.order.lookup(sec->sym->getName()); 7250b57cec5SDimitry Andric return 0; 7260b57cec5SDimitry Andric }; 7270b57cec5SDimitry Andric 7280b57cec5SDimitry Andric llvm::stable_sort(chunks, [=](const Chunk *a, const Chunk *b) { 7290b57cec5SDimitry Andric return getPriority(a) < getPriority(b); 7300b57cec5SDimitry Andric }); 7310b57cec5SDimitry Andric } 7320b57cec5SDimitry Andric 7330b57cec5SDimitry Andric // Change the characteristics of existing PartialSections that belong to the 7340b57cec5SDimitry Andric // section Name to Chars. 7350b57cec5SDimitry Andric void Writer::fixPartialSectionChars(StringRef name, uint32_t chars) { 7360b57cec5SDimitry Andric for (auto it : partialSections) { 7370b57cec5SDimitry Andric PartialSection *pSec = it.second; 7380b57cec5SDimitry Andric StringRef curName = pSec->name; 7390b57cec5SDimitry Andric if (!curName.consume_front(name) || 7400b57cec5SDimitry Andric (!curName.empty() && !curName.startswith("$"))) 7410b57cec5SDimitry Andric continue; 7420b57cec5SDimitry Andric if (pSec->characteristics == chars) 7430b57cec5SDimitry Andric continue; 7440b57cec5SDimitry Andric PartialSection *destSec = createPartialSection(pSec->name, chars); 7450b57cec5SDimitry Andric destSec->chunks.insert(destSec->chunks.end(), pSec->chunks.begin(), 7460b57cec5SDimitry Andric pSec->chunks.end()); 7470b57cec5SDimitry Andric pSec->chunks.clear(); 7480b57cec5SDimitry Andric } 7490b57cec5SDimitry Andric } 7500b57cec5SDimitry Andric 7510b57cec5SDimitry Andric // Sort concrete section chunks from GNU import libraries. 
7520b57cec5SDimitry Andric // 7530b57cec5SDimitry Andric // GNU binutils doesn't use short import files, but instead produces import 7540b57cec5SDimitry Andric // libraries that consist of object files, with section chunks for the .idata$* 7550b57cec5SDimitry Andric // sections. These are linked just as regular static libraries. Each import 7560b57cec5SDimitry Andric // library consists of one header object, one object file for every imported 7570b57cec5SDimitry Andric // symbol, and one trailer object. In order for the .idata tables/lists to 7580b57cec5SDimitry Andric // be formed correctly, the section chunks within each .idata$* section need 7590b57cec5SDimitry Andric // to be grouped by library, and sorted alphabetically within each library 7600b57cec5SDimitry Andric // (which makes sure the header comes first and the trailer last). 7610b57cec5SDimitry Andric bool Writer::fixGnuImportChunks() { 7620b57cec5SDimitry Andric uint32_t rdata = IMAGE_SCN_CNT_INITIALIZED_DATA | IMAGE_SCN_MEM_READ; 7630b57cec5SDimitry Andric 7640b57cec5SDimitry Andric // Make sure all .idata$* section chunks are mapped as RDATA in order to 7650b57cec5SDimitry Andric // be sorted into the same sections as our own synthesized .idata chunks. 7660b57cec5SDimitry Andric fixPartialSectionChars(".idata", rdata); 7670b57cec5SDimitry Andric 7680b57cec5SDimitry Andric bool hasIdata = false; 7690b57cec5SDimitry Andric // Sort all .idata$* chunks, grouping chunks from the same library, 77081ad6265SDimitry Andric // with alphabetical ordering of the object files within a library. 
7710b57cec5SDimitry Andric for (auto it : partialSections) { 7720b57cec5SDimitry Andric PartialSection *pSec = it.second; 7730b57cec5SDimitry Andric if (!pSec->name.startswith(".idata")) 7740b57cec5SDimitry Andric continue; 7750b57cec5SDimitry Andric 7760b57cec5SDimitry Andric if (!pSec->chunks.empty()) 7770b57cec5SDimitry Andric hasIdata = true; 7780b57cec5SDimitry Andric llvm::stable_sort(pSec->chunks, [&](Chunk *s, Chunk *t) { 7790b57cec5SDimitry Andric SectionChunk *sc1 = dyn_cast_or_null<SectionChunk>(s); 7800b57cec5SDimitry Andric SectionChunk *sc2 = dyn_cast_or_null<SectionChunk>(t); 7810b57cec5SDimitry Andric if (!sc1 || !sc2) { 7820b57cec5SDimitry Andric // if SC1, order them ascending. If SC2 or both null, 7830b57cec5SDimitry Andric // S is not less than T. 7840b57cec5SDimitry Andric return sc1 != nullptr; 7850b57cec5SDimitry Andric } 7860b57cec5SDimitry Andric // Make a string with "libraryname/objectfile" for sorting, achieving 7870b57cec5SDimitry Andric // both grouping by library and sorting of objects within a library, 7880b57cec5SDimitry Andric // at once. 7890b57cec5SDimitry Andric std::string key1 = 7900b57cec5SDimitry Andric (sc1->file->parentName + "/" + sc1->file->getName()).str(); 7910b57cec5SDimitry Andric std::string key2 = 7920b57cec5SDimitry Andric (sc2->file->parentName + "/" + sc2->file->getName()).str(); 7930b57cec5SDimitry Andric return key1 < key2; 7940b57cec5SDimitry Andric }); 7950b57cec5SDimitry Andric } 7960b57cec5SDimitry Andric return hasIdata; 7970b57cec5SDimitry Andric } 7980b57cec5SDimitry Andric 7990b57cec5SDimitry Andric // Add generated idata chunks, for imported symbols and DLLs, and a 8000b57cec5SDimitry Andric // terminator in .idata$2. 
8010b57cec5SDimitry Andric void Writer::addSyntheticIdata() { 8020b57cec5SDimitry Andric uint32_t rdata = IMAGE_SCN_CNT_INITIALIZED_DATA | IMAGE_SCN_MEM_READ; 803*bdd1243dSDimitry Andric idata.create(ctx); 8040b57cec5SDimitry Andric 8050b57cec5SDimitry Andric // Add the .idata content in the right section groups, to allow 8060b57cec5SDimitry Andric // chunks from other linked in object files to be grouped together. 8070b57cec5SDimitry Andric // See Microsoft PE/COFF spec 5.4 for details. 8080b57cec5SDimitry Andric auto add = [&](StringRef n, std::vector<Chunk *> &v) { 8090b57cec5SDimitry Andric PartialSection *pSec = createPartialSection(n, rdata); 8100b57cec5SDimitry Andric pSec->chunks.insert(pSec->chunks.end(), v.begin(), v.end()); 8110b57cec5SDimitry Andric }; 8120b57cec5SDimitry Andric 8130b57cec5SDimitry Andric // The loader assumes a specific order of data. 8140b57cec5SDimitry Andric // Add each type in the correct order. 8150b57cec5SDimitry Andric add(".idata$2", idata.dirs); 8160b57cec5SDimitry Andric add(".idata$4", idata.lookups); 8170b57cec5SDimitry Andric add(".idata$5", idata.addresses); 81885868e8aSDimitry Andric if (!idata.hints.empty()) 8190b57cec5SDimitry Andric add(".idata$6", idata.hints); 8200b57cec5SDimitry Andric add(".idata$7", idata.dllNames); 8210b57cec5SDimitry Andric } 8220b57cec5SDimitry Andric 8230b57cec5SDimitry Andric // Locate the first Chunk and size of the import directory list and the 8240b57cec5SDimitry Andric // IAT. 
8250b57cec5SDimitry Andric void Writer::locateImportTables() { 8260b57cec5SDimitry Andric uint32_t rdata = IMAGE_SCN_CNT_INITIALIZED_DATA | IMAGE_SCN_MEM_READ; 8270b57cec5SDimitry Andric 8280b57cec5SDimitry Andric if (PartialSection *importDirs = findPartialSection(".idata$2", rdata)) { 8290b57cec5SDimitry Andric if (!importDirs->chunks.empty()) 8300b57cec5SDimitry Andric importTableStart = importDirs->chunks.front(); 8310b57cec5SDimitry Andric for (Chunk *c : importDirs->chunks) 8320b57cec5SDimitry Andric importTableSize += c->getSize(); 8330b57cec5SDimitry Andric } 8340b57cec5SDimitry Andric 8350b57cec5SDimitry Andric if (PartialSection *importAddresses = findPartialSection(".idata$5", rdata)) { 8360b57cec5SDimitry Andric if (!importAddresses->chunks.empty()) 8370b57cec5SDimitry Andric iatStart = importAddresses->chunks.front(); 8380b57cec5SDimitry Andric for (Chunk *c : importAddresses->chunks) 8390b57cec5SDimitry Andric iatSize += c->getSize(); 8400b57cec5SDimitry Andric } 8410b57cec5SDimitry Andric } 8420b57cec5SDimitry Andric 8430b57cec5SDimitry Andric // Return whether a SectionChunk's suffix (the dollar and any trailing 8440b57cec5SDimitry Andric // suffix) should be removed and sorted into the main suffixless 8450b57cec5SDimitry Andric // PartialSection. 846*bdd1243dSDimitry Andric static bool shouldStripSectionSuffix(SectionChunk *sc, StringRef name, 847*bdd1243dSDimitry Andric bool isMinGW) { 8480b57cec5SDimitry Andric // On MinGW, comdat groups are formed by putting the comdat group name 8490b57cec5SDimitry Andric // after the '$' in the section name. For .eh_frame$<symbol>, that must 8500b57cec5SDimitry Andric // still be sorted before the .eh_frame trailer from crtend.o, thus just 8510b57cec5SDimitry Andric // strip the section name trailer. For other sections, such as 8520b57cec5SDimitry Andric // .tls$$<symbol> (where non-comdat .tls symbols are otherwise stored in 8530b57cec5SDimitry Andric // ".tls$"), they must be strictly sorted after .tls. 
And for the 8540b57cec5SDimitry Andric // hypothetical case of comdat .CRT$XCU, we definitely need to keep the 8550b57cec5SDimitry Andric // suffix for sorting. Thus, to play it safe, only strip the suffix for 8560b57cec5SDimitry Andric // the standard sections. 857*bdd1243dSDimitry Andric if (!isMinGW) 8580b57cec5SDimitry Andric return false; 8590b57cec5SDimitry Andric if (!sc || !sc->isCOMDAT()) 8600b57cec5SDimitry Andric return false; 8610b57cec5SDimitry Andric return name.startswith(".text$") || name.startswith(".data$") || 8620b57cec5SDimitry Andric name.startswith(".rdata$") || name.startswith(".pdata$") || 8630b57cec5SDimitry Andric name.startswith(".xdata$") || name.startswith(".eh_frame$"); 8640b57cec5SDimitry Andric } 8650b57cec5SDimitry Andric 866e8d8bef9SDimitry Andric void Writer::sortSections() { 867*bdd1243dSDimitry Andric if (!ctx.config.callGraphProfile.empty()) { 868349cc55cSDimitry Andric DenseMap<const SectionChunk *, int> order = 869349cc55cSDimitry Andric computeCallGraphProfileOrder(ctx); 870e8d8bef9SDimitry Andric for (auto it : order) { 871e8d8bef9SDimitry Andric if (DefinedRegular *sym = it.first->sym) 872*bdd1243dSDimitry Andric ctx.config.order[sym->getName()] = it.second; 873e8d8bef9SDimitry Andric } 874e8d8bef9SDimitry Andric } 875*bdd1243dSDimitry Andric if (!ctx.config.order.empty()) 876e8d8bef9SDimitry Andric for (auto it : partialSections) 877e8d8bef9SDimitry Andric sortBySectionOrder(it.second->chunks); 878e8d8bef9SDimitry Andric } 879e8d8bef9SDimitry Andric 8800b57cec5SDimitry Andric // Create output section objects and add them to OutputSections. 8810b57cec5SDimitry Andric void Writer::createSections() { 8820b57cec5SDimitry Andric // First, create the builtin sections. 
8830b57cec5SDimitry Andric const uint32_t data = IMAGE_SCN_CNT_INITIALIZED_DATA; 8840b57cec5SDimitry Andric const uint32_t bss = IMAGE_SCN_CNT_UNINITIALIZED_DATA; 8850b57cec5SDimitry Andric const uint32_t code = IMAGE_SCN_CNT_CODE; 8860b57cec5SDimitry Andric const uint32_t discardable = IMAGE_SCN_MEM_DISCARDABLE; 8870b57cec5SDimitry Andric const uint32_t r = IMAGE_SCN_MEM_READ; 8880b57cec5SDimitry Andric const uint32_t w = IMAGE_SCN_MEM_WRITE; 8890b57cec5SDimitry Andric const uint32_t x = IMAGE_SCN_MEM_EXECUTE; 8900b57cec5SDimitry Andric 8910b57cec5SDimitry Andric SmallDenseMap<std::pair<StringRef, uint32_t>, OutputSection *> sections; 8920b57cec5SDimitry Andric auto createSection = [&](StringRef name, uint32_t outChars) { 8930b57cec5SDimitry Andric OutputSection *&sec = sections[{name, outChars}]; 8940b57cec5SDimitry Andric if (!sec) { 8950b57cec5SDimitry Andric sec = make<OutputSection>(name, outChars); 896349cc55cSDimitry Andric ctx.outputSections.push_back(sec); 8970b57cec5SDimitry Andric } 8980b57cec5SDimitry Andric return sec; 8990b57cec5SDimitry Andric }; 9000b57cec5SDimitry Andric 9010b57cec5SDimitry Andric // Try to match the section order used by link.exe. 
9020b57cec5SDimitry Andric textSec = createSection(".text", code | r | x); 9030b57cec5SDimitry Andric createSection(".bss", bss | r | w); 9040b57cec5SDimitry Andric rdataSec = createSection(".rdata", data | r); 9050b57cec5SDimitry Andric buildidSec = createSection(".buildid", data | r); 9060b57cec5SDimitry Andric dataSec = createSection(".data", data | r | w); 9070b57cec5SDimitry Andric pdataSec = createSection(".pdata", data | r); 9080b57cec5SDimitry Andric idataSec = createSection(".idata", data | r); 9090b57cec5SDimitry Andric edataSec = createSection(".edata", data | r); 9100b57cec5SDimitry Andric didatSec = createSection(".didat", data | r); 9110b57cec5SDimitry Andric rsrcSec = createSection(".rsrc", data | r); 9120b57cec5SDimitry Andric relocSec = createSection(".reloc", data | discardable | r); 9130b57cec5SDimitry Andric ctorsSec = createSection(".ctors", data | r | w); 9140b57cec5SDimitry Andric dtorsSec = createSection(".dtors", data | r | w); 9150b57cec5SDimitry Andric 9160b57cec5SDimitry Andric // Then bin chunks by name and output characteristics. 
917349cc55cSDimitry Andric for (Chunk *c : ctx.symtab.getChunks()) { 9180b57cec5SDimitry Andric auto *sc = dyn_cast<SectionChunk>(c); 9190b57cec5SDimitry Andric if (sc && !sc->live) { 920*bdd1243dSDimitry Andric if (ctx.config.verbose) 9210b57cec5SDimitry Andric sc->printDiscardedMessage(); 9220b57cec5SDimitry Andric continue; 9230b57cec5SDimitry Andric } 9240b57cec5SDimitry Andric StringRef name = c->getSectionName(); 925*bdd1243dSDimitry Andric if (shouldStripSectionSuffix(sc, name, ctx.config.mingw)) 9260b57cec5SDimitry Andric name = name.split('$').first; 927e8d8bef9SDimitry Andric 928e8d8bef9SDimitry Andric if (name.startswith(".tls")) 929e8d8bef9SDimitry Andric tlsAlignment = std::max(tlsAlignment, c->getAlignment()); 930e8d8bef9SDimitry Andric 9310b57cec5SDimitry Andric PartialSection *pSec = createPartialSection(name, 9320b57cec5SDimitry Andric c->getOutputCharacteristics()); 9330b57cec5SDimitry Andric pSec->chunks.push_back(c); 9340b57cec5SDimitry Andric } 9350b57cec5SDimitry Andric 9360b57cec5SDimitry Andric fixPartialSectionChars(".rsrc", data | r); 93785868e8aSDimitry Andric fixPartialSectionChars(".edata", data | r); 9380b57cec5SDimitry Andric // Even in non MinGW cases, we might need to link against GNU import 9390b57cec5SDimitry Andric // libraries. 9400b57cec5SDimitry Andric bool hasIdata = fixGnuImportChunks(); 9410b57cec5SDimitry Andric if (!idata.empty()) 9420b57cec5SDimitry Andric hasIdata = true; 9430b57cec5SDimitry Andric 9440b57cec5SDimitry Andric if (hasIdata) 9450b57cec5SDimitry Andric addSyntheticIdata(); 9460b57cec5SDimitry Andric 947e8d8bef9SDimitry Andric sortSections(); 9480b57cec5SDimitry Andric 9490b57cec5SDimitry Andric if (hasIdata) 9500b57cec5SDimitry Andric locateImportTables(); 9510b57cec5SDimitry Andric 9520b57cec5SDimitry Andric // Then create an OutputSection for each section. 
9530b57cec5SDimitry Andric // '$' and all following characters in input section names are 9540b57cec5SDimitry Andric // discarded when determining output section. So, .text$foo 9550b57cec5SDimitry Andric // contributes to .text, for example. See PE/COFF spec 3.2. 9560b57cec5SDimitry Andric for (auto it : partialSections) { 9570b57cec5SDimitry Andric PartialSection *pSec = it.second; 9580b57cec5SDimitry Andric StringRef name = getOutputSectionName(pSec->name); 9590b57cec5SDimitry Andric uint32_t outChars = pSec->characteristics; 9600b57cec5SDimitry Andric 9610b57cec5SDimitry Andric if (name == ".CRT") { 9620b57cec5SDimitry Andric // In link.exe, there is a special case for the I386 target where .CRT 9630b57cec5SDimitry Andric // sections are treated as if they have output characteristics DATA | R if 9640b57cec5SDimitry Andric // their characteristics are DATA | R | W. This implements the same 9650b57cec5SDimitry Andric // special case for all architectures. 9660b57cec5SDimitry Andric outChars = data | r; 9670b57cec5SDimitry Andric 9680b57cec5SDimitry Andric log("Processing section " + pSec->name + " -> " + name); 9690b57cec5SDimitry Andric 9700b57cec5SDimitry Andric sortCRTSectionChunks(pSec->chunks); 9710b57cec5SDimitry Andric } 9720b57cec5SDimitry Andric 9730b57cec5SDimitry Andric OutputSection *sec = createSection(name, outChars); 9740b57cec5SDimitry Andric for (Chunk *c : pSec->chunks) 9750b57cec5SDimitry Andric sec->addChunk(c); 9760b57cec5SDimitry Andric 9770b57cec5SDimitry Andric sec->addContributingPartialSection(pSec); 9780b57cec5SDimitry Andric } 9790b57cec5SDimitry Andric 9800b57cec5SDimitry Andric // Finally, move some output sections to the end. 9810b57cec5SDimitry Andric auto sectionOrder = [&](const OutputSection *s) { 9820b57cec5SDimitry Andric // Move DISCARDABLE (or non-memory-mapped) sections to the end of file 9830b57cec5SDimitry Andric // because the loader cannot handle holes. 
Stripping can remove other 9840b57cec5SDimitry Andric // discardable ones than .reloc, which is first of them (created early). 985fb03ea46SDimitry Andric if (s->header.Characteristics & IMAGE_SCN_MEM_DISCARDABLE) { 986fb03ea46SDimitry Andric // Move discardable sections named .debug_ to the end, after other 987fb03ea46SDimitry Andric // discardable sections. Stripping only removes the sections named 988fb03ea46SDimitry Andric // .debug_* - thus try to avoid leaving holes after stripping. 989fb03ea46SDimitry Andric if (s->name.startswith(".debug_")) 990fb03ea46SDimitry Andric return 3; 9910b57cec5SDimitry Andric return 2; 992fb03ea46SDimitry Andric } 9930b57cec5SDimitry Andric // .rsrc should come at the end of the non-discardable sections because its 9940b57cec5SDimitry Andric // size may change by the Win32 UpdateResources() function, causing 9950b57cec5SDimitry Andric // subsequent sections to move (see https://crbug.com/827082). 9960b57cec5SDimitry Andric if (s == rsrcSec) 9970b57cec5SDimitry Andric return 1; 9980b57cec5SDimitry Andric return 0; 9990b57cec5SDimitry Andric }; 1000349cc55cSDimitry Andric llvm::stable_sort(ctx.outputSections, 10010b57cec5SDimitry Andric [&](const OutputSection *s, const OutputSection *t) { 10020b57cec5SDimitry Andric return sectionOrder(s) < sectionOrder(t); 10030b57cec5SDimitry Andric }); 10040b57cec5SDimitry Andric } 10050b57cec5SDimitry Andric 10060b57cec5SDimitry Andric void Writer::createMiscChunks() { 1007*bdd1243dSDimitry Andric Configuration *config = &ctx.config; 1008*bdd1243dSDimitry Andric 1009349cc55cSDimitry Andric for (MergeChunk *p : ctx.mergeChunkInstances) { 10100b57cec5SDimitry Andric if (p) { 10110b57cec5SDimitry Andric p->finalizeContents(); 10120b57cec5SDimitry Andric rdataSec->addChunk(p); 10130b57cec5SDimitry Andric } 10140b57cec5SDimitry Andric } 10150b57cec5SDimitry Andric 10160b57cec5SDimitry Andric // Create thunks for locally-dllimported symbols. 
1017349cc55cSDimitry Andric if (!ctx.symtab.localImportChunks.empty()) { 1018349cc55cSDimitry Andric for (Chunk *c : ctx.symtab.localImportChunks) 10190b57cec5SDimitry Andric rdataSec->addChunk(c); 10200b57cec5SDimitry Andric } 10210b57cec5SDimitry Andric 10220b57cec5SDimitry Andric // Create Debug Information Chunks 10230b57cec5SDimitry Andric OutputSection *debugInfoSec = config->mingw ? buildidSec : rdataSec; 10245ffd83dbSDimitry Andric if (config->debug || config->repro || config->cetCompat) { 1025349cc55cSDimitry Andric debugDirectory = 1026349cc55cSDimitry Andric make<DebugDirectoryChunk>(ctx, debugRecords, config->repro); 10275ffd83dbSDimitry Andric debugDirectory->setAlignment(4); 10280b57cec5SDimitry Andric debugInfoSec->addChunk(debugDirectory); 10290b57cec5SDimitry Andric } 10300b57cec5SDimitry Andric 10310b57cec5SDimitry Andric if (config->debug) { 10320b57cec5SDimitry Andric // Make a CVDebugRecordChunk even when /DEBUG:CV is not specified. We 10330b57cec5SDimitry Andric // output a PDB no matter what, and this chunk provides the only means of 10340b57cec5SDimitry Andric // allowing a debugger to match a PDB and an executable. So we need it even 10350b57cec5SDimitry Andric // if we're ultimately not going to write CodeView data to the PDB. 1036*bdd1243dSDimitry Andric buildId = make<CVDebugRecordChunk>(ctx); 10375ffd83dbSDimitry Andric debugRecords.push_back({COFF::IMAGE_DEBUG_TYPE_CODEVIEW, buildId}); 10385ffd83dbSDimitry Andric } 10390b57cec5SDimitry Andric 10405ffd83dbSDimitry Andric if (config->cetCompat) { 1041e8d8bef9SDimitry Andric debugRecords.push_back({COFF::IMAGE_DEBUG_TYPE_EX_DLLCHARACTERISTICS, 10425ffd83dbSDimitry Andric make<ExtendedDllCharacteristicsChunk>( 1043e8d8bef9SDimitry Andric IMAGE_DLL_CHARACTERISTICS_EX_CET_COMPAT)}); 10445ffd83dbSDimitry Andric } 10455ffd83dbSDimitry Andric 1046e8d8bef9SDimitry Andric // Align and add each chunk referenced by the debug data directory. 
1047e8d8bef9SDimitry Andric for (std::pair<COFF::DebugType, Chunk *> r : debugRecords) { 1048e8d8bef9SDimitry Andric r.second->setAlignment(4); 10495ffd83dbSDimitry Andric debugInfoSec->addChunk(r.second); 10500b57cec5SDimitry Andric } 10510b57cec5SDimitry Andric 10520b57cec5SDimitry Andric // Create SEH table. x86-only. 10530b57cec5SDimitry Andric if (config->safeSEH) 10540b57cec5SDimitry Andric createSEHTable(); 10550b57cec5SDimitry Andric 10560b57cec5SDimitry Andric // Create /guard:cf tables if requested. 10570b57cec5SDimitry Andric if (config->guardCF != GuardCFLevel::Off) 10580b57cec5SDimitry Andric createGuardCFTables(); 10590b57cec5SDimitry Andric 10605ffd83dbSDimitry Andric if (config->autoImport) 10610b57cec5SDimitry Andric createRuntimePseudoRelocs(); 10620b57cec5SDimitry Andric 10635ffd83dbSDimitry Andric if (config->mingw) 10640b57cec5SDimitry Andric insertCtorDtorSymbols(); 10650b57cec5SDimitry Andric } 10660b57cec5SDimitry Andric 10670b57cec5SDimitry Andric // Create .idata section for the DLL-imported symbol table. 10680b57cec5SDimitry Andric // The format of this section is inherently Windows-specific. 10690b57cec5SDimitry Andric // IdataContents class abstracted away the details for us, 10700b57cec5SDimitry Andric // so we just let it create chunks and add them to the section. 10710b57cec5SDimitry Andric void Writer::createImportTables() { 10720b57cec5SDimitry Andric // Initialize DLLOrder so that import entries are ordered in 10730b57cec5SDimitry Andric // the same order as in the command line. (That affects DLL 10740b57cec5SDimitry Andric // initialization order, and this ordering is MSVC-compatible.) 
1075349cc55cSDimitry Andric for (ImportFile *file : ctx.importFileInstances) { 10760b57cec5SDimitry Andric if (!file->live) 10770b57cec5SDimitry Andric continue; 10780b57cec5SDimitry Andric 10790b57cec5SDimitry Andric std::string dll = StringRef(file->dllName).lower(); 1080*bdd1243dSDimitry Andric if (ctx.config.dllOrder.count(dll) == 0) 1081*bdd1243dSDimitry Andric ctx.config.dllOrder[dll] = ctx.config.dllOrder.size(); 10820b57cec5SDimitry Andric 10830b57cec5SDimitry Andric if (file->impSym && !isa<DefinedImportData>(file->impSym)) 1084*bdd1243dSDimitry Andric fatal(toString(ctx, *file->impSym) + " was replaced"); 10850b57cec5SDimitry Andric DefinedImportData *impSym = cast_or_null<DefinedImportData>(file->impSym); 1086*bdd1243dSDimitry Andric if (ctx.config.delayLoads.count(StringRef(file->dllName).lower())) { 10870b57cec5SDimitry Andric if (!file->thunkSym) 10880b57cec5SDimitry Andric fatal("cannot delay-load " + toString(file) + 1089*bdd1243dSDimitry Andric " due to import of data: " + toString(ctx, *impSym)); 10900b57cec5SDimitry Andric delayIdata.add(impSym); 10910b57cec5SDimitry Andric } else { 10920b57cec5SDimitry Andric idata.add(impSym); 10930b57cec5SDimitry Andric } 10940b57cec5SDimitry Andric } 10950b57cec5SDimitry Andric } 10960b57cec5SDimitry Andric 10970b57cec5SDimitry Andric void Writer::appendImportThunks() { 1098349cc55cSDimitry Andric if (ctx.importFileInstances.empty()) 10990b57cec5SDimitry Andric return; 11000b57cec5SDimitry Andric 1101349cc55cSDimitry Andric for (ImportFile *file : ctx.importFileInstances) { 11020b57cec5SDimitry Andric if (!file->live) 11030b57cec5SDimitry Andric continue; 11040b57cec5SDimitry Andric 11050b57cec5SDimitry Andric if (!file->thunkSym) 11060b57cec5SDimitry Andric continue; 11070b57cec5SDimitry Andric 11080b57cec5SDimitry Andric if (!isa<DefinedImportThunk>(file->thunkSym)) 1109*bdd1243dSDimitry Andric fatal(toString(ctx, *file->thunkSym) + " was replaced"); 11100b57cec5SDimitry Andric DefinedImportThunk *thunk = 
cast<DefinedImportThunk>(file->thunkSym); 11110b57cec5SDimitry Andric if (file->thunkLive) 11120b57cec5SDimitry Andric textSec->addChunk(thunk->getChunk()); 11130b57cec5SDimitry Andric } 11140b57cec5SDimitry Andric 11150b57cec5SDimitry Andric if (!delayIdata.empty()) { 1116*bdd1243dSDimitry Andric Defined *helper = cast<Defined>(ctx.config.delayLoadHelper); 1117*bdd1243dSDimitry Andric delayIdata.create(helper); 11180b57cec5SDimitry Andric for (Chunk *c : delayIdata.getChunks()) 11190b57cec5SDimitry Andric didatSec->addChunk(c); 11200b57cec5SDimitry Andric for (Chunk *c : delayIdata.getDataChunks()) 11210b57cec5SDimitry Andric dataSec->addChunk(c); 11220b57cec5SDimitry Andric for (Chunk *c : delayIdata.getCodeChunks()) 11230b57cec5SDimitry Andric textSec->addChunk(c); 1124*bdd1243dSDimitry Andric for (Chunk *c : delayIdata.getCodePData()) 1125*bdd1243dSDimitry Andric pdataSec->addChunk(c); 1126*bdd1243dSDimitry Andric for (Chunk *c : delayIdata.getCodeUnwindInfo()) 1127*bdd1243dSDimitry Andric rdataSec->addChunk(c); 11280b57cec5SDimitry Andric } 11290b57cec5SDimitry Andric } 11300b57cec5SDimitry Andric 11310b57cec5SDimitry Andric void Writer::createExportTable() { 113285868e8aSDimitry Andric if (!edataSec->chunks.empty()) { 113385868e8aSDimitry Andric // Allow using a custom built export table from input object files, instead 113485868e8aSDimitry Andric // of having the linker synthesize the tables. 
1135*bdd1243dSDimitry Andric if (ctx.config.hadExplicitExports) 113685868e8aSDimitry Andric warn("literal .edata sections override exports"); 1137*bdd1243dSDimitry Andric } else if (!ctx.config.exports.empty()) { 11380b57cec5SDimitry Andric for (Chunk *c : edata.chunks) 11390b57cec5SDimitry Andric edataSec->addChunk(c); 11400b57cec5SDimitry Andric } 114185868e8aSDimitry Andric if (!edataSec->chunks.empty()) { 114285868e8aSDimitry Andric edataStart = edataSec->chunks.front(); 114385868e8aSDimitry Andric edataEnd = edataSec->chunks.back(); 114485868e8aSDimitry Andric } 1145fe6060f1SDimitry Andric // Warn on exported deleting destructor. 1146*bdd1243dSDimitry Andric for (auto e : ctx.config.exports) 1147fe6060f1SDimitry Andric if (e.sym && e.sym->getName().startswith("??_G")) 1148*bdd1243dSDimitry Andric warn("export of deleting dtor: " + toString(ctx, *e.sym)); 114985868e8aSDimitry Andric } 11500b57cec5SDimitry Andric 11510b57cec5SDimitry Andric void Writer::removeUnusedSections() { 11520b57cec5SDimitry Andric // Remove sections that we can be sure won't get content, to avoid 11530b57cec5SDimitry Andric // allocating space for their section headers. 11540b57cec5SDimitry Andric auto isUnused = [this](OutputSection *s) { 11550b57cec5SDimitry Andric if (s == relocSec) 11560b57cec5SDimitry Andric return false; // This section is populated later. 11570b57cec5SDimitry Andric // MergeChunks have zero size at this point, as their size is finalized 11580b57cec5SDimitry Andric // later. Only remove sections that have no Chunks at all. 11590b57cec5SDimitry Andric return s->chunks.empty(); 11600b57cec5SDimitry Andric }; 1161349cc55cSDimitry Andric llvm::erase_if(ctx.outputSections, isUnused); 11620b57cec5SDimitry Andric } 11630b57cec5SDimitry Andric 11640b57cec5SDimitry Andric // The Windows loader doesn't seem to like empty sections, 11650b57cec5SDimitry Andric // so we remove them if any. 
11660b57cec5SDimitry Andric void Writer::removeEmptySections() { 11670b57cec5SDimitry Andric auto isEmpty = [](OutputSection *s) { return s->getVirtualSize() == 0; }; 1168349cc55cSDimitry Andric llvm::erase_if(ctx.outputSections, isEmpty); 11690b57cec5SDimitry Andric } 11700b57cec5SDimitry Andric 11710b57cec5SDimitry Andric void Writer::assignOutputSectionIndices() { 11720b57cec5SDimitry Andric // Assign final output section indices, and assign each chunk to its output 11730b57cec5SDimitry Andric // section. 11740b57cec5SDimitry Andric uint32_t idx = 1; 1175349cc55cSDimitry Andric for (OutputSection *os : ctx.outputSections) { 11760b57cec5SDimitry Andric os->sectionIndex = idx; 11770b57cec5SDimitry Andric for (Chunk *c : os->chunks) 11780b57cec5SDimitry Andric c->setOutputSectionIdx(idx); 11790b57cec5SDimitry Andric ++idx; 11800b57cec5SDimitry Andric } 11810b57cec5SDimitry Andric 11820b57cec5SDimitry Andric // Merge chunks are containers of chunks, so assign those an output section 11830b57cec5SDimitry Andric // too. 
1184349cc55cSDimitry Andric for (MergeChunk *mc : ctx.mergeChunkInstances) 11850b57cec5SDimitry Andric if (mc) 11860b57cec5SDimitry Andric for (SectionChunk *sc : mc->sections) 11870b57cec5SDimitry Andric if (sc && sc->live) 11880b57cec5SDimitry Andric sc->setOutputSectionIdx(mc->getOutputSectionIdx()); 11890b57cec5SDimitry Andric } 11900b57cec5SDimitry Andric 11910b57cec5SDimitry Andric size_t Writer::addEntryToStringTable(StringRef str) { 11920b57cec5SDimitry Andric assert(str.size() > COFF::NameSize); 11930b57cec5SDimitry Andric size_t offsetOfEntry = strtab.size() + 4; // +4 for the size field 11940b57cec5SDimitry Andric strtab.insert(strtab.end(), str.begin(), str.end()); 11950b57cec5SDimitry Andric strtab.push_back('\0'); 11960b57cec5SDimitry Andric return offsetOfEntry; 11970b57cec5SDimitry Andric } 11980b57cec5SDimitry Andric 1199*bdd1243dSDimitry Andric std::optional<coff_symbol16> Writer::createSymbol(Defined *def) { 12000b57cec5SDimitry Andric coff_symbol16 sym; 12010b57cec5SDimitry Andric switch (def->kind()) { 1202*bdd1243dSDimitry Andric case Symbol::DefinedAbsoluteKind: { 1203*bdd1243dSDimitry Andric auto *da = dyn_cast<DefinedAbsolute>(def); 1204*bdd1243dSDimitry Andric // Note: COFF symbol can only store 32-bit values, so 64-bit absolute 1205*bdd1243dSDimitry Andric // values will be truncated. 1206*bdd1243dSDimitry Andric sym.Value = da->getVA(); 12070b57cec5SDimitry Andric sym.SectionNumber = IMAGE_SYM_ABSOLUTE; 12080b57cec5SDimitry Andric break; 1209*bdd1243dSDimitry Andric } 12100b57cec5SDimitry Andric default: { 12110b57cec5SDimitry Andric // Don't write symbols that won't be written to the output to the symbol 12120b57cec5SDimitry Andric // table. 1213*bdd1243dSDimitry Andric // We also try to write DefinedSynthetic as a normal symbol. Some of these 1214*bdd1243dSDimitry Andric // symbols do point to an actual chunk, like __safe_se_handler_table. 
Others 1215*bdd1243dSDimitry Andric // like __ImageBase are outside of sections and thus cannot be represented. 12160b57cec5SDimitry Andric Chunk *c = def->getChunk(); 12170b57cec5SDimitry Andric if (!c) 1218*bdd1243dSDimitry Andric return std::nullopt; 1219349cc55cSDimitry Andric OutputSection *os = ctx.getOutputSection(c); 12200b57cec5SDimitry Andric if (!os) 1221*bdd1243dSDimitry Andric return std::nullopt; 12220b57cec5SDimitry Andric 12230b57cec5SDimitry Andric sym.Value = def->getRVA() - os->getRVA(); 12240b57cec5SDimitry Andric sym.SectionNumber = os->sectionIndex; 12250b57cec5SDimitry Andric break; 12260b57cec5SDimitry Andric } 12270b57cec5SDimitry Andric } 12280b57cec5SDimitry Andric 12290b57cec5SDimitry Andric // Symbols that are runtime pseudo relocations don't point to the actual 12300b57cec5SDimitry Andric // symbol data itself (as they are imported), but points to the IAT entry 12310b57cec5SDimitry Andric // instead. Avoid emitting them to the symbol table, as they can confuse 12320b57cec5SDimitry Andric // debuggers. 
12330b57cec5SDimitry Andric if (def->isRuntimePseudoReloc) 1234*bdd1243dSDimitry Andric return std::nullopt; 12350b57cec5SDimitry Andric 12360b57cec5SDimitry Andric StringRef name = def->getName(); 12370b57cec5SDimitry Andric if (name.size() > COFF::NameSize) { 12380b57cec5SDimitry Andric sym.Name.Offset.Zeroes = 0; 12390b57cec5SDimitry Andric sym.Name.Offset.Offset = addEntryToStringTable(name); 12400b57cec5SDimitry Andric } else { 12410b57cec5SDimitry Andric memset(sym.Name.ShortName, 0, COFF::NameSize); 12420b57cec5SDimitry Andric memcpy(sym.Name.ShortName, name.data(), name.size()); 12430b57cec5SDimitry Andric } 12440b57cec5SDimitry Andric 12450b57cec5SDimitry Andric if (auto *d = dyn_cast<DefinedCOFF>(def)) { 12460b57cec5SDimitry Andric COFFSymbolRef ref = d->getCOFFSymbol(); 12470b57cec5SDimitry Andric sym.Type = ref.getType(); 12480b57cec5SDimitry Andric sym.StorageClass = ref.getStorageClass(); 1249*bdd1243dSDimitry Andric } else if (def->kind() == Symbol::DefinedImportThunkKind) { 1250*bdd1243dSDimitry Andric sym.Type = (IMAGE_SYM_DTYPE_FUNCTION << SCT_COMPLEX_TYPE_SHIFT) | 1251*bdd1243dSDimitry Andric IMAGE_SYM_TYPE_NULL; 1252*bdd1243dSDimitry Andric sym.StorageClass = IMAGE_SYM_CLASS_EXTERNAL; 12530b57cec5SDimitry Andric } else { 12540b57cec5SDimitry Andric sym.Type = IMAGE_SYM_TYPE_NULL; 12550b57cec5SDimitry Andric sym.StorageClass = IMAGE_SYM_CLASS_EXTERNAL; 12560b57cec5SDimitry Andric } 12570b57cec5SDimitry Andric sym.NumberOfAuxSymbols = 0; 12580b57cec5SDimitry Andric return sym; 12590b57cec5SDimitry Andric } 12600b57cec5SDimitry Andric 12610b57cec5SDimitry Andric void Writer::createSymbolAndStringTable() { 12620b57cec5SDimitry Andric // PE/COFF images are limited to 8 byte section names. Longer names can be 12630b57cec5SDimitry Andric // supported by writing a non-standard string table, but this string table is 12640b57cec5SDimitry Andric // not mapped at runtime and the long names will therefore be inaccessible. 
12650b57cec5SDimitry Andric // link.exe always truncates section names to 8 bytes, whereas binutils always 12660b57cec5SDimitry Andric // preserves long section names via the string table. LLD adopts a hybrid 12670b57cec5SDimitry Andric // solution where discardable sections have long names preserved and 12680b57cec5SDimitry Andric // non-discardable sections have their names truncated, to ensure that any 12690b57cec5SDimitry Andric // section which is mapped at runtime also has its name mapped at runtime. 1270349cc55cSDimitry Andric for (OutputSection *sec : ctx.outputSections) { 12710b57cec5SDimitry Andric if (sec->name.size() <= COFF::NameSize) 12720b57cec5SDimitry Andric continue; 12730b57cec5SDimitry Andric if ((sec->header.Characteristics & IMAGE_SCN_MEM_DISCARDABLE) == 0) 12740b57cec5SDimitry Andric continue; 1275*bdd1243dSDimitry Andric if (ctx.config.warnLongSectionNames) { 1276480093f4SDimitry Andric warn("section name " + sec->name + 1277480093f4SDimitry Andric " is longer than 8 characters and will use a non-standard string " 1278480093f4SDimitry Andric "table"); 1279480093f4SDimitry Andric } 12800b57cec5SDimitry Andric sec->setStringTableOff(addEntryToStringTable(sec->name)); 12810b57cec5SDimitry Andric } 12820b57cec5SDimitry Andric 1283*bdd1243dSDimitry Andric if (ctx.config.debugDwarf || ctx.config.debugSymtab) { 1284349cc55cSDimitry Andric for (ObjFile *file : ctx.objFileInstances) { 12850b57cec5SDimitry Andric for (Symbol *b : file->getSymbols()) { 12860b57cec5SDimitry Andric auto *d = dyn_cast_or_null<Defined>(b); 12870b57cec5SDimitry Andric if (!d || d->writtenToSymtab) 12880b57cec5SDimitry Andric continue; 12890b57cec5SDimitry Andric d->writtenToSymtab = true; 12904824e7fdSDimitry Andric if (auto *dc = dyn_cast_or_null<DefinedCOFF>(d)) { 12914824e7fdSDimitry Andric COFFSymbolRef symRef = dc->getCOFFSymbol(); 12924824e7fdSDimitry Andric if (symRef.isSectionDefinition() || 12934824e7fdSDimitry Andric symRef.getStorageClass() == 
COFF::IMAGE_SYM_CLASS_LABEL) 12944824e7fdSDimitry Andric continue; 12954824e7fdSDimitry Andric } 12960b57cec5SDimitry Andric 1297*bdd1243dSDimitry Andric if (std::optional<coff_symbol16> sym = createSymbol(d)) 12980b57cec5SDimitry Andric outputSymtab.push_back(*sym); 1299*bdd1243dSDimitry Andric 1300*bdd1243dSDimitry Andric if (auto *dthunk = dyn_cast<DefinedImportThunk>(d)) { 1301*bdd1243dSDimitry Andric if (!dthunk->wrappedSym->writtenToSymtab) { 1302*bdd1243dSDimitry Andric dthunk->wrappedSym->writtenToSymtab = true; 1303*bdd1243dSDimitry Andric if (std::optional<coff_symbol16> sym = 1304*bdd1243dSDimitry Andric createSymbol(dthunk->wrappedSym)) 1305*bdd1243dSDimitry Andric outputSymtab.push_back(*sym); 1306*bdd1243dSDimitry Andric } 1307*bdd1243dSDimitry Andric } 13080b57cec5SDimitry Andric } 13090b57cec5SDimitry Andric } 13100b57cec5SDimitry Andric } 13110b57cec5SDimitry Andric 13120b57cec5SDimitry Andric if (outputSymtab.empty() && strtab.empty()) 13130b57cec5SDimitry Andric return; 13140b57cec5SDimitry Andric 13150b57cec5SDimitry Andric // We position the symbol table to be adjacent to the end of the last section. 
13160b57cec5SDimitry Andric uint64_t fileOff = fileSize; 13170b57cec5SDimitry Andric pointerToSymbolTable = fileOff; 13180b57cec5SDimitry Andric fileOff += outputSymtab.size() * sizeof(coff_symbol16); 13190b57cec5SDimitry Andric fileOff += 4 + strtab.size(); 1320*bdd1243dSDimitry Andric fileSize = alignTo(fileOff, ctx.config.fileAlign); 13210b57cec5SDimitry Andric } 13220b57cec5SDimitry Andric 13230b57cec5SDimitry Andric void Writer::mergeSections() { 13240b57cec5SDimitry Andric if (!pdataSec->chunks.empty()) { 13250b57cec5SDimitry Andric firstPdata = pdataSec->chunks.front(); 13260b57cec5SDimitry Andric lastPdata = pdataSec->chunks.back(); 13270b57cec5SDimitry Andric } 13280b57cec5SDimitry Andric 1329*bdd1243dSDimitry Andric for (auto &p : ctx.config.merge) { 13300b57cec5SDimitry Andric StringRef toName = p.second; 13310b57cec5SDimitry Andric if (p.first == toName) 13320b57cec5SDimitry Andric continue; 13330b57cec5SDimitry Andric StringSet<> names; 133404eeddc0SDimitry Andric while (true) { 13350b57cec5SDimitry Andric if (!names.insert(toName).second) 13360b57cec5SDimitry Andric fatal("/merge: cycle found for section '" + p.first + "'"); 1337*bdd1243dSDimitry Andric auto i = ctx.config.merge.find(toName); 1338*bdd1243dSDimitry Andric if (i == ctx.config.merge.end()) 13390b57cec5SDimitry Andric break; 13400b57cec5SDimitry Andric toName = i->second; 13410b57cec5SDimitry Andric } 13420b57cec5SDimitry Andric OutputSection *from = findSection(p.first); 13430b57cec5SDimitry Andric OutputSection *to = findSection(toName); 13440b57cec5SDimitry Andric if (!from) 13450b57cec5SDimitry Andric continue; 13460b57cec5SDimitry Andric if (!to) { 13470b57cec5SDimitry Andric from->name = toName; 13480b57cec5SDimitry Andric continue; 13490b57cec5SDimitry Andric } 13500b57cec5SDimitry Andric to->merge(from); 13510b57cec5SDimitry Andric } 13520b57cec5SDimitry Andric } 13530b57cec5SDimitry Andric 13540b57cec5SDimitry Andric // Visits all sections to assign incremental, non-overlapping 
RVAs and 13550b57cec5SDimitry Andric // file offsets. 13560b57cec5SDimitry Andric void Writer::assignAddresses() { 1357*bdd1243dSDimitry Andric Configuration *config = &ctx.config; 1358*bdd1243dSDimitry Andric 13590b57cec5SDimitry Andric sizeOfHeaders = dosStubSize + sizeof(PEMagic) + sizeof(coff_file_header) + 13600b57cec5SDimitry Andric sizeof(data_directory) * numberOfDataDirectory + 1361349cc55cSDimitry Andric sizeof(coff_section) * ctx.outputSections.size(); 13620b57cec5SDimitry Andric sizeOfHeaders += 13630b57cec5SDimitry Andric config->is64() ? sizeof(pe32plus_header) : sizeof(pe32_header); 13640b57cec5SDimitry Andric sizeOfHeaders = alignTo(sizeOfHeaders, config->fileAlign); 13650b57cec5SDimitry Andric fileSize = sizeOfHeaders; 13660b57cec5SDimitry Andric 13670b57cec5SDimitry Andric // The first page is kept unmapped. 13680b57cec5SDimitry Andric uint64_t rva = alignTo(sizeOfHeaders, config->align); 13690b57cec5SDimitry Andric 1370349cc55cSDimitry Andric for (OutputSection *sec : ctx.outputSections) { 13710b57cec5SDimitry Andric if (sec == relocSec) 13720b57cec5SDimitry Andric addBaserels(); 13730b57cec5SDimitry Andric uint64_t rawSize = 0, virtualSize = 0; 13740b57cec5SDimitry Andric sec->header.VirtualAddress = rva; 13750b57cec5SDimitry Andric 13760b57cec5SDimitry Andric // If /FUNCTIONPADMIN is used, functions are padded in order to create a 13770b57cec5SDimitry Andric // hotpatchable image. 13780b57cec5SDimitry Andric const bool isCodeSection = 13790b57cec5SDimitry Andric (sec->header.Characteristics & IMAGE_SCN_CNT_CODE) && 13800b57cec5SDimitry Andric (sec->header.Characteristics & IMAGE_SCN_MEM_READ) && 13810b57cec5SDimitry Andric (sec->header.Characteristics & IMAGE_SCN_MEM_EXECUTE); 13820b57cec5SDimitry Andric uint32_t padding = isCodeSection ? 
config->functionPadMin : 0; 13830b57cec5SDimitry Andric 13840b57cec5SDimitry Andric for (Chunk *c : sec->chunks) { 13850b57cec5SDimitry Andric if (padding && c->isHotPatchable()) 13860b57cec5SDimitry Andric virtualSize += padding; 13870b57cec5SDimitry Andric virtualSize = alignTo(virtualSize, c->getAlignment()); 13880b57cec5SDimitry Andric c->setRVA(rva + virtualSize); 13890b57cec5SDimitry Andric virtualSize += c->getSize(); 13900b57cec5SDimitry Andric if (c->hasData) 13910b57cec5SDimitry Andric rawSize = alignTo(virtualSize, config->fileAlign); 13920b57cec5SDimitry Andric } 13930b57cec5SDimitry Andric if (virtualSize > UINT32_MAX) 13940b57cec5SDimitry Andric error("section larger than 4 GiB: " + sec->name); 13950b57cec5SDimitry Andric sec->header.VirtualSize = virtualSize; 13960b57cec5SDimitry Andric sec->header.SizeOfRawData = rawSize; 13970b57cec5SDimitry Andric if (rawSize != 0) 13980b57cec5SDimitry Andric sec->header.PointerToRawData = fileSize; 13990b57cec5SDimitry Andric rva += alignTo(virtualSize, config->align); 14000b57cec5SDimitry Andric fileSize += alignTo(rawSize, config->fileAlign); 14010b57cec5SDimitry Andric } 14020b57cec5SDimitry Andric sizeOfImage = alignTo(rva, config->align); 14030b57cec5SDimitry Andric 14040b57cec5SDimitry Andric // Assign addresses to sections in MergeChunks. 1405349cc55cSDimitry Andric for (MergeChunk *mc : ctx.mergeChunkInstances) 14060b57cec5SDimitry Andric if (mc) 14070b57cec5SDimitry Andric mc->assignSubsectionRVAs(); 14080b57cec5SDimitry Andric } 14090b57cec5SDimitry Andric 14100b57cec5SDimitry Andric template <typename PEHeaderTy> void Writer::writeHeader() { 14110b57cec5SDimitry Andric // Write DOS header. For backwards compatibility, the first part of a PE/COFF 14120b57cec5SDimitry Andric // executable consists of an MS-DOS MZ executable. If the executable is run 14130b57cec5SDimitry Andric // under DOS, that program gets run (usually to just print an error message). 
14140b57cec5SDimitry Andric // When run under Windows, the loader looks at AddressOfNewExeHeader and uses 14150b57cec5SDimitry Andric // the PE header instead. 1416*bdd1243dSDimitry Andric Configuration *config = &ctx.config; 14170b57cec5SDimitry Andric uint8_t *buf = buffer->getBufferStart(); 14180b57cec5SDimitry Andric auto *dos = reinterpret_cast<dos_header *>(buf); 14190b57cec5SDimitry Andric buf += sizeof(dos_header); 14200b57cec5SDimitry Andric dos->Magic[0] = 'M'; 14210b57cec5SDimitry Andric dos->Magic[1] = 'Z'; 14220b57cec5SDimitry Andric dos->UsedBytesInTheLastPage = dosStubSize % 512; 14230b57cec5SDimitry Andric dos->FileSizeInPages = divideCeil(dosStubSize, 512); 14240b57cec5SDimitry Andric dos->HeaderSizeInParagraphs = sizeof(dos_header) / 16; 14250b57cec5SDimitry Andric 14260b57cec5SDimitry Andric dos->AddressOfRelocationTable = sizeof(dos_header); 14270b57cec5SDimitry Andric dos->AddressOfNewExeHeader = dosStubSize; 14280b57cec5SDimitry Andric 14290b57cec5SDimitry Andric // Write DOS program. 
14300b57cec5SDimitry Andric memcpy(buf, dosProgram, sizeof(dosProgram)); 14310b57cec5SDimitry Andric buf += sizeof(dosProgram); 14320b57cec5SDimitry Andric 14330b57cec5SDimitry Andric // Write PE magic 14340b57cec5SDimitry Andric memcpy(buf, PEMagic, sizeof(PEMagic)); 14350b57cec5SDimitry Andric buf += sizeof(PEMagic); 14360b57cec5SDimitry Andric 14370b57cec5SDimitry Andric // Write COFF header 14380b57cec5SDimitry Andric auto *coff = reinterpret_cast<coff_file_header *>(buf); 14390b57cec5SDimitry Andric buf += sizeof(*coff); 14400b57cec5SDimitry Andric coff->Machine = config->machine; 1441349cc55cSDimitry Andric coff->NumberOfSections = ctx.outputSections.size(); 14420b57cec5SDimitry Andric coff->Characteristics = IMAGE_FILE_EXECUTABLE_IMAGE; 14430b57cec5SDimitry Andric if (config->largeAddressAware) 14440b57cec5SDimitry Andric coff->Characteristics |= IMAGE_FILE_LARGE_ADDRESS_AWARE; 14450b57cec5SDimitry Andric if (!config->is64()) 14460b57cec5SDimitry Andric coff->Characteristics |= IMAGE_FILE_32BIT_MACHINE; 14470b57cec5SDimitry Andric if (config->dll) 14480b57cec5SDimitry Andric coff->Characteristics |= IMAGE_FILE_DLL; 1449480093f4SDimitry Andric if (config->driverUponly) 1450480093f4SDimitry Andric coff->Characteristics |= IMAGE_FILE_UP_SYSTEM_ONLY; 14510b57cec5SDimitry Andric if (!config->relocatable) 14520b57cec5SDimitry Andric coff->Characteristics |= IMAGE_FILE_RELOCS_STRIPPED; 14530b57cec5SDimitry Andric if (config->swaprunCD) 14540b57cec5SDimitry Andric coff->Characteristics |= IMAGE_FILE_REMOVABLE_RUN_FROM_SWAP; 14550b57cec5SDimitry Andric if (config->swaprunNet) 14560b57cec5SDimitry Andric coff->Characteristics |= IMAGE_FILE_NET_RUN_FROM_SWAP; 14570b57cec5SDimitry Andric coff->SizeOfOptionalHeader = 14580b57cec5SDimitry Andric sizeof(PEHeaderTy) + sizeof(data_directory) * numberOfDataDirectory; 14590b57cec5SDimitry Andric 14600b57cec5SDimitry Andric // Write PE header 14610b57cec5SDimitry Andric auto *pe = reinterpret_cast<PEHeaderTy *>(buf); 
14620b57cec5SDimitry Andric buf += sizeof(*pe); 14630b57cec5SDimitry Andric pe->Magic = config->is64() ? PE32Header::PE32_PLUS : PE32Header::PE32; 14640b57cec5SDimitry Andric 14650b57cec5SDimitry Andric // If {Major,Minor}LinkerVersion is left at 0.0, then for some 14660b57cec5SDimitry Andric // reason signing the resulting PE file with Authenticode produces a 14670b57cec5SDimitry Andric // signature that fails to validate on Windows 7 (but is OK on 10). 14680b57cec5SDimitry Andric // Set it to 14.0, which is what VS2015 outputs, and which avoids 14690b57cec5SDimitry Andric // that problem. 14700b57cec5SDimitry Andric pe->MajorLinkerVersion = 14; 14710b57cec5SDimitry Andric pe->MinorLinkerVersion = 0; 14720b57cec5SDimitry Andric 14730b57cec5SDimitry Andric pe->ImageBase = config->imageBase; 14740b57cec5SDimitry Andric pe->SectionAlignment = config->align; 14750b57cec5SDimitry Andric pe->FileAlignment = config->fileAlign; 14760b57cec5SDimitry Andric pe->MajorImageVersion = config->majorImageVersion; 14770b57cec5SDimitry Andric pe->MinorImageVersion = config->minorImageVersion; 14780b57cec5SDimitry Andric pe->MajorOperatingSystemVersion = config->majorOSVersion; 14790b57cec5SDimitry Andric pe->MinorOperatingSystemVersion = config->minorOSVersion; 1480e8d8bef9SDimitry Andric pe->MajorSubsystemVersion = config->majorSubsystemVersion; 1481e8d8bef9SDimitry Andric pe->MinorSubsystemVersion = config->minorSubsystemVersion; 14820b57cec5SDimitry Andric pe->Subsystem = config->subsystem; 14830b57cec5SDimitry Andric pe->SizeOfImage = sizeOfImage; 14840b57cec5SDimitry Andric pe->SizeOfHeaders = sizeOfHeaders; 14850b57cec5SDimitry Andric if (!config->noEntry) { 14860b57cec5SDimitry Andric Defined *entry = cast<Defined>(config->entry); 14870b57cec5SDimitry Andric pe->AddressOfEntryPoint = entry->getRVA(); 14880b57cec5SDimitry Andric // Pointer to thumb code must have the LSB set, so adjust it. 
14890b57cec5SDimitry Andric if (config->machine == ARMNT) 14900b57cec5SDimitry Andric pe->AddressOfEntryPoint |= 1; 14910b57cec5SDimitry Andric } 14920b57cec5SDimitry Andric pe->SizeOfStackReserve = config->stackReserve; 14930b57cec5SDimitry Andric pe->SizeOfStackCommit = config->stackCommit; 14940b57cec5SDimitry Andric pe->SizeOfHeapReserve = config->heapReserve; 14950b57cec5SDimitry Andric pe->SizeOfHeapCommit = config->heapCommit; 14960b57cec5SDimitry Andric if (config->appContainer) 14970b57cec5SDimitry Andric pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_APPCONTAINER; 1498480093f4SDimitry Andric if (config->driverWdm) 1499480093f4SDimitry Andric pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_WDM_DRIVER; 15000b57cec5SDimitry Andric if (config->dynamicBase) 15010b57cec5SDimitry Andric pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_DYNAMIC_BASE; 15020b57cec5SDimitry Andric if (config->highEntropyVA) 15030b57cec5SDimitry Andric pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_HIGH_ENTROPY_VA; 15040b57cec5SDimitry Andric if (!config->allowBind) 15050b57cec5SDimitry Andric pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_NO_BIND; 15060b57cec5SDimitry Andric if (config->nxCompat) 15070b57cec5SDimitry Andric pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_NX_COMPAT; 15080b57cec5SDimitry Andric if (!config->allowIsolation) 15090b57cec5SDimitry Andric pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_NO_ISOLATION; 15100b57cec5SDimitry Andric if (config->guardCF != GuardCFLevel::Off) 15110b57cec5SDimitry Andric pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_GUARD_CF; 15120b57cec5SDimitry Andric if (config->integrityCheck) 15130b57cec5SDimitry Andric pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_FORCE_INTEGRITY; 1514979e22ffSDimitry Andric if (setNoSEHCharacteristic || config->noSEH) 15150b57cec5SDimitry Andric pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_NO_SEH; 15160b57cec5SDimitry Andric if (config->terminalServerAware) 
15170b57cec5SDimitry Andric pe->DLLCharacteristics |= IMAGE_DLL_CHARACTERISTICS_TERMINAL_SERVER_AWARE; 15180b57cec5SDimitry Andric pe->NumberOfRvaAndSize = numberOfDataDirectory; 15190b57cec5SDimitry Andric if (textSec->getVirtualSize()) { 15200b57cec5SDimitry Andric pe->BaseOfCode = textSec->getRVA(); 15210b57cec5SDimitry Andric pe->SizeOfCode = textSec->getRawSize(); 15220b57cec5SDimitry Andric } 15230b57cec5SDimitry Andric pe->SizeOfInitializedData = getSizeOfInitializedData(); 15240b57cec5SDimitry Andric 15250b57cec5SDimitry Andric // Write data directory 15260b57cec5SDimitry Andric auto *dir = reinterpret_cast<data_directory *>(buf); 15270b57cec5SDimitry Andric buf += sizeof(*dir) * numberOfDataDirectory; 152885868e8aSDimitry Andric if (edataStart) { 152985868e8aSDimitry Andric dir[EXPORT_TABLE].RelativeVirtualAddress = edataStart->getRVA(); 153085868e8aSDimitry Andric dir[EXPORT_TABLE].Size = 153185868e8aSDimitry Andric edataEnd->getRVA() + edataEnd->getSize() - edataStart->getRVA(); 15320b57cec5SDimitry Andric } 15330b57cec5SDimitry Andric if (importTableStart) { 15340b57cec5SDimitry Andric dir[IMPORT_TABLE].RelativeVirtualAddress = importTableStart->getRVA(); 15350b57cec5SDimitry Andric dir[IMPORT_TABLE].Size = importTableSize; 15360b57cec5SDimitry Andric } 15370b57cec5SDimitry Andric if (iatStart) { 15380b57cec5SDimitry Andric dir[IAT].RelativeVirtualAddress = iatStart->getRVA(); 15390b57cec5SDimitry Andric dir[IAT].Size = iatSize; 15400b57cec5SDimitry Andric } 15410b57cec5SDimitry Andric if (rsrcSec->getVirtualSize()) { 15420b57cec5SDimitry Andric dir[RESOURCE_TABLE].RelativeVirtualAddress = rsrcSec->getRVA(); 15430b57cec5SDimitry Andric dir[RESOURCE_TABLE].Size = rsrcSec->getVirtualSize(); 15440b57cec5SDimitry Andric } 15450b57cec5SDimitry Andric if (firstPdata) { 15460b57cec5SDimitry Andric dir[EXCEPTION_TABLE].RelativeVirtualAddress = firstPdata->getRVA(); 15470b57cec5SDimitry Andric dir[EXCEPTION_TABLE].Size = 15480b57cec5SDimitry Andric 
lastPdata->getRVA() + lastPdata->getSize() - firstPdata->getRVA(); 15490b57cec5SDimitry Andric } 15500b57cec5SDimitry Andric if (relocSec->getVirtualSize()) { 15510b57cec5SDimitry Andric dir[BASE_RELOCATION_TABLE].RelativeVirtualAddress = relocSec->getRVA(); 15520b57cec5SDimitry Andric dir[BASE_RELOCATION_TABLE].Size = relocSec->getVirtualSize(); 15530b57cec5SDimitry Andric } 1554349cc55cSDimitry Andric if (Symbol *sym = ctx.symtab.findUnderscore("_tls_used")) { 15550b57cec5SDimitry Andric if (Defined *b = dyn_cast<Defined>(sym)) { 15560b57cec5SDimitry Andric dir[TLS_TABLE].RelativeVirtualAddress = b->getRVA(); 15570b57cec5SDimitry Andric dir[TLS_TABLE].Size = config->is64() 15580b57cec5SDimitry Andric ? sizeof(object::coff_tls_directory64) 15590b57cec5SDimitry Andric : sizeof(object::coff_tls_directory32); 15600b57cec5SDimitry Andric } 15610b57cec5SDimitry Andric } 15620b57cec5SDimitry Andric if (debugDirectory) { 15630b57cec5SDimitry Andric dir[DEBUG_DIRECTORY].RelativeVirtualAddress = debugDirectory->getRVA(); 15640b57cec5SDimitry Andric dir[DEBUG_DIRECTORY].Size = debugDirectory->getSize(); 15650b57cec5SDimitry Andric } 1566349cc55cSDimitry Andric if (Symbol *sym = ctx.symtab.findUnderscore("_load_config_used")) { 15670b57cec5SDimitry Andric if (auto *b = dyn_cast<DefinedRegular>(sym)) { 15680b57cec5SDimitry Andric SectionChunk *sc = b->getChunk(); 15690b57cec5SDimitry Andric assert(b->getRVA() >= sc->getRVA()); 15700b57cec5SDimitry Andric uint64_t offsetInChunk = b->getRVA() - sc->getRVA(); 15710b57cec5SDimitry Andric if (!sc->hasData || offsetInChunk + 4 > sc->getSize()) 15720b57cec5SDimitry Andric fatal("_load_config_used is malformed"); 15730b57cec5SDimitry Andric 15740b57cec5SDimitry Andric ArrayRef<uint8_t> secContents = sc->getContents(); 15750b57cec5SDimitry Andric uint32_t loadConfigSize = 15760b57cec5SDimitry Andric *reinterpret_cast<const ulittle32_t *>(&secContents[offsetInChunk]); 15770b57cec5SDimitry Andric if (offsetInChunk + loadConfigSize > 
sc->getSize()) 15780b57cec5SDimitry Andric fatal("_load_config_used is too large"); 15790b57cec5SDimitry Andric dir[LOAD_CONFIG_TABLE].RelativeVirtualAddress = b->getRVA(); 15800b57cec5SDimitry Andric dir[LOAD_CONFIG_TABLE].Size = loadConfigSize; 15810b57cec5SDimitry Andric } 15820b57cec5SDimitry Andric } 15830b57cec5SDimitry Andric if (!delayIdata.empty()) { 15840b57cec5SDimitry Andric dir[DELAY_IMPORT_DESCRIPTOR].RelativeVirtualAddress = 15850b57cec5SDimitry Andric delayIdata.getDirRVA(); 15860b57cec5SDimitry Andric dir[DELAY_IMPORT_DESCRIPTOR].Size = delayIdata.getDirSize(); 15870b57cec5SDimitry Andric } 15880b57cec5SDimitry Andric 15890b57cec5SDimitry Andric // Write section table 1590349cc55cSDimitry Andric for (OutputSection *sec : ctx.outputSections) { 1591*bdd1243dSDimitry Andric sec->writeHeaderTo(buf, config->debug); 15920b57cec5SDimitry Andric buf += sizeof(coff_section); 15930b57cec5SDimitry Andric } 15940b57cec5SDimitry Andric sectionTable = ArrayRef<uint8_t>( 1595349cc55cSDimitry Andric buf - ctx.outputSections.size() * sizeof(coff_section), buf); 15960b57cec5SDimitry Andric 15970b57cec5SDimitry Andric if (outputSymtab.empty() && strtab.empty()) 15980b57cec5SDimitry Andric return; 15990b57cec5SDimitry Andric 16000b57cec5SDimitry Andric coff->PointerToSymbolTable = pointerToSymbolTable; 16010b57cec5SDimitry Andric uint32_t numberOfSymbols = outputSymtab.size(); 16020b57cec5SDimitry Andric coff->NumberOfSymbols = numberOfSymbols; 16030b57cec5SDimitry Andric auto *symbolTable = reinterpret_cast<coff_symbol16 *>( 16040b57cec5SDimitry Andric buffer->getBufferStart() + coff->PointerToSymbolTable); 16050b57cec5SDimitry Andric for (size_t i = 0; i != numberOfSymbols; ++i) 16060b57cec5SDimitry Andric symbolTable[i] = outputSymtab[i]; 16070b57cec5SDimitry Andric // Create the string table, it follows immediately after the symbol table. 16080b57cec5SDimitry Andric // The first 4 bytes is length including itself. 
16090b57cec5SDimitry Andric buf = reinterpret_cast<uint8_t *>(&symbolTable[numberOfSymbols]); 16100b57cec5SDimitry Andric write32le(buf, strtab.size() + 4); 16110b57cec5SDimitry Andric if (!strtab.empty()) 16120b57cec5SDimitry Andric memcpy(buf + 4, strtab.data(), strtab.size()); 16130b57cec5SDimitry Andric } 16140b57cec5SDimitry Andric 16150b57cec5SDimitry Andric void Writer::openFile(StringRef path) { 16160b57cec5SDimitry Andric buffer = CHECK( 16170b57cec5SDimitry Andric FileOutputBuffer::create(path, fileSize, FileOutputBuffer::F_executable), 16180b57cec5SDimitry Andric "failed to open " + path); 16190b57cec5SDimitry Andric } 16200b57cec5SDimitry Andric 16210b57cec5SDimitry Andric void Writer::createSEHTable() { 16220b57cec5SDimitry Andric SymbolRVASet handlers; 1623349cc55cSDimitry Andric for (ObjFile *file : ctx.objFileInstances) { 16240b57cec5SDimitry Andric if (!file->hasSafeSEH()) 16250b57cec5SDimitry Andric error("/safeseh: " + file->getName() + " is not compatible with SEH"); 16260b57cec5SDimitry Andric markSymbolsForRVATable(file, file->getSXDataChunks(), handlers); 16270b57cec5SDimitry Andric } 16280b57cec5SDimitry Andric 16290b57cec5SDimitry Andric // Set the "no SEH" characteristic if there really were no handlers, or if 16300b57cec5SDimitry Andric // there is no load config object to point to the table of handlers. 16310b57cec5SDimitry Andric setNoSEHCharacteristic = 1632349cc55cSDimitry Andric handlers.empty() || !ctx.symtab.findUnderscore("_load_config_used"); 16330b57cec5SDimitry Andric 16340b57cec5SDimitry Andric maybeAddRVATable(std::move(handlers), "__safe_se_handler_table", 16350b57cec5SDimitry Andric "__safe_se_handler_count"); 16360b57cec5SDimitry Andric } 16370b57cec5SDimitry Andric 16380b57cec5SDimitry Andric // Add a symbol to an RVA set. Two symbols may have the same RVA, but an RVA set 16390b57cec5SDimitry Andric // cannot contain duplicates. 
Therefore, the set is uniqued by Chunk and the 16400b57cec5SDimitry Andric // symbol's offset into that Chunk. 16410b57cec5SDimitry Andric static void addSymbolToRVASet(SymbolRVASet &rvaSet, Defined *s) { 16420b57cec5SDimitry Andric Chunk *c = s->getChunk(); 16430b57cec5SDimitry Andric if (auto *sc = dyn_cast<SectionChunk>(c)) 16440b57cec5SDimitry Andric c = sc->repl; // Look through ICF replacement. 16450b57cec5SDimitry Andric uint32_t off = s->getRVA() - (c ? c->getRVA() : 0); 16460b57cec5SDimitry Andric rvaSet.insert({c, off}); 16470b57cec5SDimitry Andric } 16480b57cec5SDimitry Andric 16490b57cec5SDimitry Andric // Given a symbol, add it to the GFIDs table if it is a live, defined, function 16500b57cec5SDimitry Andric // symbol in an executable section. 16510b57cec5SDimitry Andric static void maybeAddAddressTakenFunction(SymbolRVASet &addressTakenSyms, 16520b57cec5SDimitry Andric Symbol *s) { 16530b57cec5SDimitry Andric if (!s) 16540b57cec5SDimitry Andric return; 16550b57cec5SDimitry Andric 16560b57cec5SDimitry Andric switch (s->kind()) { 16570b57cec5SDimitry Andric case Symbol::DefinedLocalImportKind: 16580b57cec5SDimitry Andric case Symbol::DefinedImportDataKind: 16590b57cec5SDimitry Andric // Defines an __imp_ pointer, so it is data, so it is ignored. 16600b57cec5SDimitry Andric break; 16610b57cec5SDimitry Andric case Symbol::DefinedCommonKind: 16620b57cec5SDimitry Andric // Common is always data, so it is ignored. 16630b57cec5SDimitry Andric break; 16640b57cec5SDimitry Andric case Symbol::DefinedAbsoluteKind: 16650b57cec5SDimitry Andric case Symbol::DefinedSyntheticKind: 16660b57cec5SDimitry Andric // Absolute is never code, synthetic generally isn't and usually isn't 16670b57cec5SDimitry Andric // determinable. 
16680b57cec5SDimitry Andric break; 166985868e8aSDimitry Andric case Symbol::LazyArchiveKind: 167085868e8aSDimitry Andric case Symbol::LazyObjectKind: 1671fe6060f1SDimitry Andric case Symbol::LazyDLLSymbolKind: 16720b57cec5SDimitry Andric case Symbol::UndefinedKind: 16730b57cec5SDimitry Andric // Undefined symbols resolve to zero, so they don't have an RVA. Lazy 16740b57cec5SDimitry Andric // symbols shouldn't have relocations. 16750b57cec5SDimitry Andric break; 16760b57cec5SDimitry Andric 16770b57cec5SDimitry Andric case Symbol::DefinedImportThunkKind: 16780b57cec5SDimitry Andric // Thunks are always code, include them. 16790b57cec5SDimitry Andric addSymbolToRVASet(addressTakenSyms, cast<Defined>(s)); 16800b57cec5SDimitry Andric break; 16810b57cec5SDimitry Andric 16820b57cec5SDimitry Andric case Symbol::DefinedRegularKind: { 16830b57cec5SDimitry Andric // This is a regular, defined, symbol from a COFF file. Mark the symbol as 16840b57cec5SDimitry Andric // address taken if the symbol type is function and it's in an executable 16850b57cec5SDimitry Andric // section. 16860b57cec5SDimitry Andric auto *d = cast<DefinedRegular>(s); 16870b57cec5SDimitry Andric if (d->getCOFFSymbol().getComplexType() == COFF::IMAGE_SYM_DTYPE_FUNCTION) { 16880b57cec5SDimitry Andric SectionChunk *sc = dyn_cast<SectionChunk>(d->getChunk()); 16890b57cec5SDimitry Andric if (sc && sc->live && 16900b57cec5SDimitry Andric sc->getOutputCharacteristics() & IMAGE_SCN_MEM_EXECUTE) 16910b57cec5SDimitry Andric addSymbolToRVASet(addressTakenSyms, d); 16920b57cec5SDimitry Andric } 16930b57cec5SDimitry Andric break; 16940b57cec5SDimitry Andric } 16950b57cec5SDimitry Andric } 16960b57cec5SDimitry Andric } 16970b57cec5SDimitry Andric 16980b57cec5SDimitry Andric // Visit all relocations from all section contributions of this object file and 16990b57cec5SDimitry Andric // mark the relocation target as address-taken. 
1700*bdd1243dSDimitry Andric void Writer::markSymbolsWithRelocations(ObjFile *file, 17010b57cec5SDimitry Andric SymbolRVASet &usedSymbols) { 17020b57cec5SDimitry Andric for (Chunk *c : file->getChunks()) { 17030b57cec5SDimitry Andric // We only care about live section chunks. Common chunks and other chunks 17040b57cec5SDimitry Andric // don't generally contain relocations. 17050b57cec5SDimitry Andric SectionChunk *sc = dyn_cast<SectionChunk>(c); 17060b57cec5SDimitry Andric if (!sc || !sc->live) 17070b57cec5SDimitry Andric continue; 17080b57cec5SDimitry Andric 17090b57cec5SDimitry Andric for (const coff_relocation &reloc : sc->getRelocs()) { 1710*bdd1243dSDimitry Andric if (ctx.config.machine == I386 && 1711*bdd1243dSDimitry Andric reloc.Type == COFF::IMAGE_REL_I386_REL32) 17120b57cec5SDimitry Andric // Ignore relative relocations on x86. On x86_64 they can't be ignored 17130b57cec5SDimitry Andric // since they're also used to compute absolute addresses. 17140b57cec5SDimitry Andric continue; 17150b57cec5SDimitry Andric 17160b57cec5SDimitry Andric Symbol *ref = sc->file->getSymbol(reloc.SymbolTableIndex); 17170b57cec5SDimitry Andric maybeAddAddressTakenFunction(usedSymbols, ref); 17180b57cec5SDimitry Andric } 17190b57cec5SDimitry Andric } 17200b57cec5SDimitry Andric } 17210b57cec5SDimitry Andric 17220b57cec5SDimitry Andric // Create the guard function id table. This is a table of RVAs of all 17230b57cec5SDimitry Andric // address-taken functions. It is sorted and uniqued, just like the safe SEH 17240b57cec5SDimitry Andric // table. 
17250b57cec5SDimitry Andric void Writer::createGuardCFTables() { 1726*bdd1243dSDimitry Andric Configuration *config = &ctx.config; 1727*bdd1243dSDimitry Andric 17280b57cec5SDimitry Andric SymbolRVASet addressTakenSyms; 1729e8d8bef9SDimitry Andric SymbolRVASet giatsRVASet; 1730e8d8bef9SDimitry Andric std::vector<Symbol *> giatsSymbols; 17310b57cec5SDimitry Andric SymbolRVASet longJmpTargets; 1732fe6060f1SDimitry Andric SymbolRVASet ehContTargets; 1733349cc55cSDimitry Andric for (ObjFile *file : ctx.objFileInstances) { 17340b57cec5SDimitry Andric // If the object was compiled with /guard:cf, the address taken symbols 1735fe6060f1SDimitry Andric // are in .gfids$y sections, the longjmp targets are in .gljmp$y sections, 1736fe6060f1SDimitry Andric // and ehcont targets are in .gehcont$y sections. If the object was not 1737fe6060f1SDimitry Andric // compiled with /guard:cf, we assume there were no setjmp and ehcont 1738fe6060f1SDimitry Andric // targets, and that all code symbols with relocations are possibly 1739fe6060f1SDimitry Andric // address-taken. 17400b57cec5SDimitry Andric if (file->hasGuardCF()) { 17410b57cec5SDimitry Andric markSymbolsForRVATable(file, file->getGuardFidChunks(), addressTakenSyms); 1742e8d8bef9SDimitry Andric markSymbolsForRVATable(file, file->getGuardIATChunks(), giatsRVASet); 1743e8d8bef9SDimitry Andric getSymbolsFromSections(file, file->getGuardIATChunks(), giatsSymbols); 17440b57cec5SDimitry Andric markSymbolsForRVATable(file, file->getGuardLJmpChunks(), longJmpTargets); 1745fe6060f1SDimitry Andric markSymbolsForRVATable(file, file->getGuardEHContChunks(), ehContTargets); 17460b57cec5SDimitry Andric } else { 17470b57cec5SDimitry Andric markSymbolsWithRelocations(file, addressTakenSyms); 17480b57cec5SDimitry Andric } 17490b57cec5SDimitry Andric } 17500b57cec5SDimitry Andric 17510b57cec5SDimitry Andric // Mark the image entry as address-taken. 
17520b57cec5SDimitry Andric if (config->entry) 17530b57cec5SDimitry Andric maybeAddAddressTakenFunction(addressTakenSyms, config->entry); 17540b57cec5SDimitry Andric 17550b57cec5SDimitry Andric // Mark exported symbols in executable sections as address-taken. 17560b57cec5SDimitry Andric for (Export &e : config->exports) 17570b57cec5SDimitry Andric maybeAddAddressTakenFunction(addressTakenSyms, e.sym); 17580b57cec5SDimitry Andric 1759e8d8bef9SDimitry Andric // For each entry in the .giats table, check if it has a corresponding load 1760e8d8bef9SDimitry Andric // thunk (e.g. because the DLL that defines it will be delay-loaded) and, if 1761e8d8bef9SDimitry Andric // so, add the load thunk to the address taken (.gfids) table. 1762e8d8bef9SDimitry Andric for (Symbol *s : giatsSymbols) { 1763e8d8bef9SDimitry Andric if (auto *di = dyn_cast<DefinedImportData>(s)) { 1764e8d8bef9SDimitry Andric if (di->loadThunkSym) 1765e8d8bef9SDimitry Andric addSymbolToRVASet(addressTakenSyms, di->loadThunkSym); 1766e8d8bef9SDimitry Andric } 1767e8d8bef9SDimitry Andric } 1768e8d8bef9SDimitry Andric 17690b57cec5SDimitry Andric // Ensure sections referenced in the gfid table are 16-byte aligned. 17700b57cec5SDimitry Andric for (const ChunkAndOffset &c : addressTakenSyms) 17710b57cec5SDimitry Andric if (c.inputChunk->getAlignment() < 16) 17720b57cec5SDimitry Andric c.inputChunk->setAlignment(16); 17730b57cec5SDimitry Andric 17740b57cec5SDimitry Andric maybeAddRVATable(std::move(addressTakenSyms), "__guard_fids_table", 17750b57cec5SDimitry Andric "__guard_fids_count"); 17760b57cec5SDimitry Andric 1777e8d8bef9SDimitry Andric // Add the Guard Address Taken IAT Entry Table (.giats). 1778e8d8bef9SDimitry Andric maybeAddRVATable(std::move(giatsRVASet), "__guard_iat_table", 1779e8d8bef9SDimitry Andric "__guard_iat_count"); 1780e8d8bef9SDimitry Andric 17810b57cec5SDimitry Andric // Add the longjmp target table unless the user told us not to. 
1782fe6060f1SDimitry Andric if (config->guardCF & GuardCFLevel::LongJmp) 17830b57cec5SDimitry Andric maybeAddRVATable(std::move(longJmpTargets), "__guard_longjmp_table", 17840b57cec5SDimitry Andric "__guard_longjmp_count"); 17850b57cec5SDimitry Andric 1786fe6060f1SDimitry Andric // Add the ehcont target table unless the user told us not to. 1787fe6060f1SDimitry Andric if (config->guardCF & GuardCFLevel::EHCont) 1788fe6060f1SDimitry Andric maybeAddRVATable(std::move(ehContTargets), "__guard_eh_cont_table", 1789fe6060f1SDimitry Andric "__guard_eh_cont_count", true); 1790fe6060f1SDimitry Andric 17910b57cec5SDimitry Andric // Set __guard_flags, which will be used in the load config to indicate that 17920b57cec5SDimitry Andric // /guard:cf was enabled. 1793*bdd1243dSDimitry Andric uint32_t guardFlags = uint32_t(GuardFlags::CF_INSTRUMENTED) | 1794*bdd1243dSDimitry Andric uint32_t(GuardFlags::CF_FUNCTION_TABLE_PRESENT); 1795fe6060f1SDimitry Andric if (config->guardCF & GuardCFLevel::LongJmp) 1796*bdd1243dSDimitry Andric guardFlags |= uint32_t(GuardFlags::CF_LONGJUMP_TABLE_PRESENT); 1797fe6060f1SDimitry Andric if (config->guardCF & GuardCFLevel::EHCont) 1798*bdd1243dSDimitry Andric guardFlags |= uint32_t(GuardFlags::EH_CONTINUATION_TABLE_PRESENT); 1799349cc55cSDimitry Andric Symbol *flagSym = ctx.symtab.findUnderscore("__guard_flags"); 18000b57cec5SDimitry Andric cast<DefinedAbsolute>(flagSym)->setVA(guardFlags); 18010b57cec5SDimitry Andric } 18020b57cec5SDimitry Andric 18030b57cec5SDimitry Andric // Take a list of input sections containing symbol table indices and add those 1804e8d8bef9SDimitry Andric // symbols to a vector. The challenge is that symbol RVAs are not known and 18050b57cec5SDimitry Andric // depend on the table size, so we can't directly build a set of integers. 
1806e8d8bef9SDimitry Andric void Writer::getSymbolsFromSections(ObjFile *file, 18070b57cec5SDimitry Andric ArrayRef<SectionChunk *> symIdxChunks, 1808e8d8bef9SDimitry Andric std::vector<Symbol *> &symbols) { 18090b57cec5SDimitry Andric for (SectionChunk *c : symIdxChunks) { 18100b57cec5SDimitry Andric // Skip sections discarded by linker GC. This comes up when a .gfids section 18110b57cec5SDimitry Andric // is associated with something like a vtable and the vtable is discarded. 18120b57cec5SDimitry Andric // In this case, the associated gfids section is discarded, and we don't 18130b57cec5SDimitry Andric // mark the virtual member functions as address-taken by the vtable. 18140b57cec5SDimitry Andric if (!c->live) 18150b57cec5SDimitry Andric continue; 18160b57cec5SDimitry Andric 18170b57cec5SDimitry Andric // Validate that the contents look like symbol table indices. 18180b57cec5SDimitry Andric ArrayRef<uint8_t> data = c->getContents(); 18190b57cec5SDimitry Andric if (data.size() % 4 != 0) { 18200b57cec5SDimitry Andric warn("ignoring " + c->getSectionName() + 18210b57cec5SDimitry Andric " symbol table index section in object " + toString(file)); 18220b57cec5SDimitry Andric continue; 18230b57cec5SDimitry Andric } 18240b57cec5SDimitry Andric 18250b57cec5SDimitry Andric // Read each symbol table index and check if that symbol was included in the 1826e8d8bef9SDimitry Andric // final link. If so, add it to the vector of symbols. 
18270b57cec5SDimitry Andric ArrayRef<ulittle32_t> symIndices( 18280b57cec5SDimitry Andric reinterpret_cast<const ulittle32_t *>(data.data()), data.size() / 4); 18290b57cec5SDimitry Andric ArrayRef<Symbol *> objSymbols = file->getSymbols(); 18300b57cec5SDimitry Andric for (uint32_t symIndex : symIndices) { 18310b57cec5SDimitry Andric if (symIndex >= objSymbols.size()) { 18320b57cec5SDimitry Andric warn("ignoring invalid symbol table index in section " + 18330b57cec5SDimitry Andric c->getSectionName() + " in object " + toString(file)); 18340b57cec5SDimitry Andric continue; 18350b57cec5SDimitry Andric } 18360b57cec5SDimitry Andric if (Symbol *s = objSymbols[symIndex]) { 18370b57cec5SDimitry Andric if (s->isLive()) 1838e8d8bef9SDimitry Andric symbols.push_back(cast<Symbol>(s)); 1839e8d8bef9SDimitry Andric } 1840e8d8bef9SDimitry Andric } 1841e8d8bef9SDimitry Andric } 1842e8d8bef9SDimitry Andric } 1843e8d8bef9SDimitry Andric 1844e8d8bef9SDimitry Andric // Take a list of input sections containing symbol table indices and add those 1845e8d8bef9SDimitry Andric // symbols to an RVA table. 1846e8d8bef9SDimitry Andric void Writer::markSymbolsForRVATable(ObjFile *file, 1847e8d8bef9SDimitry Andric ArrayRef<SectionChunk *> symIdxChunks, 1848e8d8bef9SDimitry Andric SymbolRVASet &tableSymbols) { 1849e8d8bef9SDimitry Andric std::vector<Symbol *> syms; 1850e8d8bef9SDimitry Andric getSymbolsFromSections(file, symIdxChunks, syms); 1851e8d8bef9SDimitry Andric 1852e8d8bef9SDimitry Andric for (Symbol *s : syms) 18530b57cec5SDimitry Andric addSymbolToRVASet(tableSymbols, cast<Defined>(s)); 18540b57cec5SDimitry Andric } 18550b57cec5SDimitry Andric 18560b57cec5SDimitry Andric // Replace the absolute table symbol with a synthetic symbol pointing to 18570b57cec5SDimitry Andric // tableChunk so that we can emit base relocations for it and resolve section 18580b57cec5SDimitry Andric // relative relocations. 
18590b57cec5SDimitry Andric void Writer::maybeAddRVATable(SymbolRVASet tableSymbols, StringRef tableSym, 1860fe6060f1SDimitry Andric StringRef countSym, bool hasFlag) { 18610b57cec5SDimitry Andric if (tableSymbols.empty()) 18620b57cec5SDimitry Andric return; 18630b57cec5SDimitry Andric 1864fe6060f1SDimitry Andric NonSectionChunk *tableChunk; 1865fe6060f1SDimitry Andric if (hasFlag) 1866fe6060f1SDimitry Andric tableChunk = make<RVAFlagTableChunk>(std::move(tableSymbols)); 1867fe6060f1SDimitry Andric else 1868fe6060f1SDimitry Andric tableChunk = make<RVATableChunk>(std::move(tableSymbols)); 18690b57cec5SDimitry Andric rdataSec->addChunk(tableChunk); 18700b57cec5SDimitry Andric 1871349cc55cSDimitry Andric Symbol *t = ctx.symtab.findUnderscore(tableSym); 1872349cc55cSDimitry Andric Symbol *c = ctx.symtab.findUnderscore(countSym); 18730b57cec5SDimitry Andric replaceSymbol<DefinedSynthetic>(t, t->getName(), tableChunk); 1874fe6060f1SDimitry Andric cast<DefinedAbsolute>(c)->setVA(tableChunk->getSize() / (hasFlag ? 5 : 4)); 18750b57cec5SDimitry Andric } 18760b57cec5SDimitry Andric 18770b57cec5SDimitry Andric // MinGW specific. Gather all relocations that are imported from a DLL even 18780b57cec5SDimitry Andric // though the code didn't expect it to, produce the table that the runtime 18790b57cec5SDimitry Andric // uses for fixing them up, and provide the synthetic symbols that the 18800b57cec5SDimitry Andric // runtime uses for finding the table. 
18810b57cec5SDimitry Andric void Writer::createRuntimePseudoRelocs() { 18820b57cec5SDimitry Andric std::vector<RuntimePseudoReloc> rels; 18830b57cec5SDimitry Andric 1884349cc55cSDimitry Andric for (Chunk *c : ctx.symtab.getChunks()) { 18850b57cec5SDimitry Andric auto *sc = dyn_cast<SectionChunk>(c); 18860b57cec5SDimitry Andric if (!sc || !sc->live) 18870b57cec5SDimitry Andric continue; 18880b57cec5SDimitry Andric sc->getRuntimePseudoRelocs(rels); 18890b57cec5SDimitry Andric } 18900b57cec5SDimitry Andric 1891*bdd1243dSDimitry Andric if (!ctx.config.pseudoRelocs) { 18925ffd83dbSDimitry Andric // Not writing any pseudo relocs; if some were needed, error out and 18935ffd83dbSDimitry Andric // indicate what required them. 18945ffd83dbSDimitry Andric for (const RuntimePseudoReloc &rpr : rels) 18955ffd83dbSDimitry Andric error("automatic dllimport of " + rpr.sym->getName() + " in " + 18965ffd83dbSDimitry Andric toString(rpr.target->file) + " requires pseudo relocations"); 18975ffd83dbSDimitry Andric return; 18985ffd83dbSDimitry Andric } 18995ffd83dbSDimitry Andric 19000b57cec5SDimitry Andric if (!rels.empty()) 19010b57cec5SDimitry Andric log("Writing " + Twine(rels.size()) + " runtime pseudo relocations"); 19020b57cec5SDimitry Andric PseudoRelocTableChunk *table = make<PseudoRelocTableChunk>(rels); 19030b57cec5SDimitry Andric rdataSec->addChunk(table); 19040b57cec5SDimitry Andric EmptyChunk *endOfList = make<EmptyChunk>(); 19050b57cec5SDimitry Andric rdataSec->addChunk(endOfList); 19060b57cec5SDimitry Andric 1907349cc55cSDimitry Andric Symbol *headSym = ctx.symtab.findUnderscore("__RUNTIME_PSEUDO_RELOC_LIST__"); 1908349cc55cSDimitry Andric Symbol *endSym = 1909349cc55cSDimitry Andric ctx.symtab.findUnderscore("__RUNTIME_PSEUDO_RELOC_LIST_END__"); 19100b57cec5SDimitry Andric replaceSymbol<DefinedSynthetic>(headSym, headSym->getName(), table); 19110b57cec5SDimitry Andric replaceSymbol<DefinedSynthetic>(endSym, endSym->getName(), endOfList); 19120b57cec5SDimitry Andric } 
19130b57cec5SDimitry Andric 19140b57cec5SDimitry Andric // MinGW specific. 19150b57cec5SDimitry Andric // The MinGW .ctors and .dtors lists have sentinels at each end; 19160b57cec5SDimitry Andric // a (uintptr_t)-1 at the start and a (uintptr_t)0 at the end. 19170b57cec5SDimitry Andric // There's a symbol pointing to the start sentinel pointer, __CTOR_LIST__ 19180b57cec5SDimitry Andric // and __DTOR_LIST__ respectively. 19190b57cec5SDimitry Andric void Writer::insertCtorDtorSymbols() { 1920*bdd1243dSDimitry Andric AbsolutePointerChunk *ctorListHead = make<AbsolutePointerChunk>(ctx, -1); 1921*bdd1243dSDimitry Andric AbsolutePointerChunk *ctorListEnd = make<AbsolutePointerChunk>(ctx, 0); 1922*bdd1243dSDimitry Andric AbsolutePointerChunk *dtorListHead = make<AbsolutePointerChunk>(ctx, -1); 1923*bdd1243dSDimitry Andric AbsolutePointerChunk *dtorListEnd = make<AbsolutePointerChunk>(ctx, 0); 19240b57cec5SDimitry Andric ctorsSec->insertChunkAtStart(ctorListHead); 19250b57cec5SDimitry Andric ctorsSec->addChunk(ctorListEnd); 19260b57cec5SDimitry Andric dtorsSec->insertChunkAtStart(dtorListHead); 19270b57cec5SDimitry Andric dtorsSec->addChunk(dtorListEnd); 19280b57cec5SDimitry Andric 1929349cc55cSDimitry Andric Symbol *ctorListSym = ctx.symtab.findUnderscore("__CTOR_LIST__"); 1930349cc55cSDimitry Andric Symbol *dtorListSym = ctx.symtab.findUnderscore("__DTOR_LIST__"); 19310b57cec5SDimitry Andric replaceSymbol<DefinedSynthetic>(ctorListSym, ctorListSym->getName(), 19320b57cec5SDimitry Andric ctorListHead); 19330b57cec5SDimitry Andric replaceSymbol<DefinedSynthetic>(dtorListSym, dtorListSym->getName(), 19340b57cec5SDimitry Andric dtorListHead); 19350b57cec5SDimitry Andric } 19360b57cec5SDimitry Andric 19370b57cec5SDimitry Andric // Handles /section options to allow users to overwrite 19380b57cec5SDimitry Andric // section attributes. 
19390b57cec5SDimitry Andric void Writer::setSectionPermissions() { 1940*bdd1243dSDimitry Andric for (auto &p : ctx.config.section) { 19410b57cec5SDimitry Andric StringRef name = p.first; 19420b57cec5SDimitry Andric uint32_t perm = p.second; 1943349cc55cSDimitry Andric for (OutputSection *sec : ctx.outputSections) 19440b57cec5SDimitry Andric if (sec->name == name) 19450b57cec5SDimitry Andric sec->setPermissions(perm); 19460b57cec5SDimitry Andric } 19470b57cec5SDimitry Andric } 19480b57cec5SDimitry Andric 19490b57cec5SDimitry Andric // Write section contents to a mmap'ed file. 19500b57cec5SDimitry Andric void Writer::writeSections() { 19510b57cec5SDimitry Andric uint8_t *buf = buffer->getBufferStart(); 1952349cc55cSDimitry Andric for (OutputSection *sec : ctx.outputSections) { 19530b57cec5SDimitry Andric uint8_t *secBuf = buf + sec->getFileOff(); 19540b57cec5SDimitry Andric // Fill gaps between functions in .text with INT3 instructions 19550b57cec5SDimitry Andric // instead of leaving as NUL bytes (which can be interpreted as 19560b57cec5SDimitry Andric // ADD instructions). 19570b57cec5SDimitry Andric if (sec->header.Characteristics & IMAGE_SCN_CNT_CODE) 19580b57cec5SDimitry Andric memset(secBuf, 0xCC, sec->getRawSize()); 19590b57cec5SDimitry Andric parallelForEach(sec->chunks, [&](Chunk *c) { 19600b57cec5SDimitry Andric c->writeTo(secBuf + c->getRVA() - sec->getRVA()); 19610b57cec5SDimitry Andric }); 19620b57cec5SDimitry Andric } 19630b57cec5SDimitry Andric } 19640b57cec5SDimitry Andric 19650b57cec5SDimitry Andric void Writer::writeBuildId() { 19660b57cec5SDimitry Andric // There are two important parts to the build ID. 19670b57cec5SDimitry Andric // 1) If building with debug info, the COFF debug directory contains a 19680b57cec5SDimitry Andric // timestamp as well as a Guid and Age of the PDB. 19690b57cec5SDimitry Andric // 2) In all cases, the PE COFF file header also contains a timestamp. 
19700b57cec5SDimitry Andric // For reproducibility, instead of a timestamp we want to use a hash of the 19710b57cec5SDimitry Andric // PE contents. 1972*bdd1243dSDimitry Andric Configuration *config = &ctx.config; 1973*bdd1243dSDimitry Andric 19740b57cec5SDimitry Andric if (config->debug) { 19750b57cec5SDimitry Andric assert(buildId && "BuildId is not set!"); 19760b57cec5SDimitry Andric // BuildId->BuildId was filled in when the PDB was written. 19770b57cec5SDimitry Andric } 19780b57cec5SDimitry Andric 19790b57cec5SDimitry Andric // At this point the only fields in the COFF file which remain unset are the 19800b57cec5SDimitry Andric // "timestamp" in the COFF file header, and the ones in the coff debug 19810b57cec5SDimitry Andric // directory. Now we can hash the file and write that hash to the various 19820b57cec5SDimitry Andric // timestamp fields in the file. 19830b57cec5SDimitry Andric StringRef outputFileData( 19840b57cec5SDimitry Andric reinterpret_cast<const char *>(buffer->getBufferStart()), 19850b57cec5SDimitry Andric buffer->getBufferSize()); 19860b57cec5SDimitry Andric 19870b57cec5SDimitry Andric uint32_t timestamp = config->timestamp; 19880b57cec5SDimitry Andric uint64_t hash = 0; 19890b57cec5SDimitry Andric bool generateSyntheticBuildId = 19900b57cec5SDimitry Andric config->mingw && config->debug && config->pdbPath.empty(); 19910b57cec5SDimitry Andric 19920b57cec5SDimitry Andric if (config->repro || generateSyntheticBuildId) 19930b57cec5SDimitry Andric hash = xxHash64(outputFileData); 19940b57cec5SDimitry Andric 19950b57cec5SDimitry Andric if (config->repro) 19960b57cec5SDimitry Andric timestamp = static_cast<uint32_t>(hash); 19970b57cec5SDimitry Andric 19980b57cec5SDimitry Andric if (generateSyntheticBuildId) { 19990b57cec5SDimitry Andric // For MinGW builds without a PDB file, we still generate a build id 20000b57cec5SDimitry Andric // to allow associating a crash dump to the executable. 
20010b57cec5SDimitry Andric buildId->buildId->PDB70.CVSignature = OMF::Signature::PDB70; 20020b57cec5SDimitry Andric buildId->buildId->PDB70.Age = 1; 20030b57cec5SDimitry Andric memcpy(buildId->buildId->PDB70.Signature, &hash, 8); 20040b57cec5SDimitry Andric // xxhash only gives us 8 bytes, so put some fixed data in the other half. 20050b57cec5SDimitry Andric memcpy(&buildId->buildId->PDB70.Signature[8], "LLD PDB.", 8); 20060b57cec5SDimitry Andric } 20070b57cec5SDimitry Andric 20080b57cec5SDimitry Andric if (debugDirectory) 20090b57cec5SDimitry Andric debugDirectory->setTimeDateStamp(timestamp); 20100b57cec5SDimitry Andric 20110b57cec5SDimitry Andric uint8_t *buf = buffer->getBufferStart(); 20120b57cec5SDimitry Andric buf += dosStubSize + sizeof(PEMagic); 20130b57cec5SDimitry Andric object::coff_file_header *coffHeader = 20140b57cec5SDimitry Andric reinterpret_cast<coff_file_header *>(buf); 20150b57cec5SDimitry Andric coffHeader->TimeDateStamp = timestamp; 20160b57cec5SDimitry Andric } 20170b57cec5SDimitry Andric 20180b57cec5SDimitry Andric // Sort .pdata section contents according to PE/COFF spec 5.5. 20190b57cec5SDimitry Andric void Writer::sortExceptionTable() { 20200b57cec5SDimitry Andric if (!firstPdata) 20210b57cec5SDimitry Andric return; 20220b57cec5SDimitry Andric // We assume .pdata contains function table entries only. 
20230b57cec5SDimitry Andric auto bufAddr = [&](Chunk *c) { 2024349cc55cSDimitry Andric OutputSection *os = ctx.getOutputSection(c); 20250b57cec5SDimitry Andric return buffer->getBufferStart() + os->getFileOff() + c->getRVA() - 20260b57cec5SDimitry Andric os->getRVA(); 20270b57cec5SDimitry Andric }; 20280b57cec5SDimitry Andric uint8_t *begin = bufAddr(firstPdata); 20290b57cec5SDimitry Andric uint8_t *end = bufAddr(lastPdata) + lastPdata->getSize(); 2030*bdd1243dSDimitry Andric if (ctx.config.machine == AMD64) { 20310b57cec5SDimitry Andric struct Entry { ulittle32_t begin, end, unwind; }; 20325ffd83dbSDimitry Andric if ((end - begin) % sizeof(Entry) != 0) { 20335ffd83dbSDimitry Andric fatal("unexpected .pdata size: " + Twine(end - begin) + 20345ffd83dbSDimitry Andric " is not a multiple of " + Twine(sizeof(Entry))); 20355ffd83dbSDimitry Andric } 20360b57cec5SDimitry Andric parallelSort( 20370b57cec5SDimitry Andric MutableArrayRef<Entry>((Entry *)begin, (Entry *)end), 20380b57cec5SDimitry Andric [](const Entry &a, const Entry &b) { return a.begin < b.begin; }); 20390b57cec5SDimitry Andric return; 20400b57cec5SDimitry Andric } 2041*bdd1243dSDimitry Andric if (ctx.config.machine == ARMNT || ctx.config.machine == ARM64) { 20420b57cec5SDimitry Andric struct Entry { ulittle32_t begin, unwind; }; 20435ffd83dbSDimitry Andric if ((end - begin) % sizeof(Entry) != 0) { 20445ffd83dbSDimitry Andric fatal("unexpected .pdata size: " + Twine(end - begin) + 20455ffd83dbSDimitry Andric " is not a multiple of " + Twine(sizeof(Entry))); 20465ffd83dbSDimitry Andric } 20470b57cec5SDimitry Andric parallelSort( 20480b57cec5SDimitry Andric MutableArrayRef<Entry>((Entry *)begin, (Entry *)end), 20490b57cec5SDimitry Andric [](const Entry &a, const Entry &b) { return a.begin < b.begin; }); 20500b57cec5SDimitry Andric return; 20510b57cec5SDimitry Andric } 2052480093f4SDimitry Andric lld::errs() << "warning: don't know how to handle .pdata.\n"; 20530b57cec5SDimitry Andric } 20540b57cec5SDimitry 
Andric 20550b57cec5SDimitry Andric // The CRT section contains, among other things, the array of function 20560b57cec5SDimitry Andric // pointers that initialize every global variable that is not trivially 20570b57cec5SDimitry Andric // constructed. The CRT calls them one after the other prior to invoking 20580b57cec5SDimitry Andric // main(). 20590b57cec5SDimitry Andric // 20600b57cec5SDimitry Andric // As per C++ spec, 3.6.2/2.3, 20610b57cec5SDimitry Andric // "Variables with ordered initialization defined within a single 20620b57cec5SDimitry Andric // translation unit shall be initialized in the order of their definitions 20630b57cec5SDimitry Andric // in the translation unit" 20640b57cec5SDimitry Andric // 20650b57cec5SDimitry Andric // It is therefore critical to sort the chunks containing the function 20660b57cec5SDimitry Andric // pointers in the order that they are listed in the object file (top to 20670b57cec5SDimitry Andric // bottom), otherwise global objects might not be initialized in the 20680b57cec5SDimitry Andric // correct order. 
20690b57cec5SDimitry Andric void Writer::sortCRTSectionChunks(std::vector<Chunk *> &chunks) { 20700b57cec5SDimitry Andric auto sectionChunkOrder = [](const Chunk *a, const Chunk *b) { 20710b57cec5SDimitry Andric auto sa = dyn_cast<SectionChunk>(a); 20720b57cec5SDimitry Andric auto sb = dyn_cast<SectionChunk>(b); 20730b57cec5SDimitry Andric assert(sa && sb && "Non-section chunks in CRT section!"); 20740b57cec5SDimitry Andric 20750b57cec5SDimitry Andric StringRef sAObj = sa->file->mb.getBufferIdentifier(); 20760b57cec5SDimitry Andric StringRef sBObj = sb->file->mb.getBufferIdentifier(); 20770b57cec5SDimitry Andric 20780b57cec5SDimitry Andric return sAObj == sBObj && sa->getSectionNumber() < sb->getSectionNumber(); 20790b57cec5SDimitry Andric }; 20800b57cec5SDimitry Andric llvm::stable_sort(chunks, sectionChunkOrder); 20810b57cec5SDimitry Andric 2082*bdd1243dSDimitry Andric if (ctx.config.verbose) { 20830b57cec5SDimitry Andric for (auto &c : chunks) { 20840b57cec5SDimitry Andric auto sc = dyn_cast<SectionChunk>(c); 20850b57cec5SDimitry Andric log(" " + sc->file->mb.getBufferIdentifier().str() + 20860b57cec5SDimitry Andric ", SectionID: " + Twine(sc->getSectionNumber())); 20870b57cec5SDimitry Andric } 20880b57cec5SDimitry Andric } 20890b57cec5SDimitry Andric } 20900b57cec5SDimitry Andric 20910b57cec5SDimitry Andric OutputSection *Writer::findSection(StringRef name) { 2092349cc55cSDimitry Andric for (OutputSection *sec : ctx.outputSections) 20930b57cec5SDimitry Andric if (sec->name == name) 20940b57cec5SDimitry Andric return sec; 20950b57cec5SDimitry Andric return nullptr; 20960b57cec5SDimitry Andric } 20970b57cec5SDimitry Andric 20980b57cec5SDimitry Andric uint32_t Writer::getSizeOfInitializedData() { 20990b57cec5SDimitry Andric uint32_t res = 0; 2100349cc55cSDimitry Andric for (OutputSection *s : ctx.outputSections) 21010b57cec5SDimitry Andric if (s->header.Characteristics & IMAGE_SCN_CNT_INITIALIZED_DATA) 21020b57cec5SDimitry Andric res += s->getRawSize(); 
21030b57cec5SDimitry Andric return res; 21040b57cec5SDimitry Andric } 21050b57cec5SDimitry Andric 21060b57cec5SDimitry Andric // Add base relocations to .reloc section. 21070b57cec5SDimitry Andric void Writer::addBaserels() { 2108*bdd1243dSDimitry Andric if (!ctx.config.relocatable) 21090b57cec5SDimitry Andric return; 21100b57cec5SDimitry Andric relocSec->chunks.clear(); 21110b57cec5SDimitry Andric std::vector<Baserel> v; 2112349cc55cSDimitry Andric for (OutputSection *sec : ctx.outputSections) { 21130b57cec5SDimitry Andric if (sec->header.Characteristics & IMAGE_SCN_MEM_DISCARDABLE) 21140b57cec5SDimitry Andric continue; 21150b57cec5SDimitry Andric // Collect all locations for base relocations. 21160b57cec5SDimitry Andric for (Chunk *c : sec->chunks) 21170b57cec5SDimitry Andric c->getBaserels(&v); 21180b57cec5SDimitry Andric // Add the addresses to .reloc section. 21190b57cec5SDimitry Andric if (!v.empty()) 21200b57cec5SDimitry Andric addBaserelBlocks(v); 21210b57cec5SDimitry Andric v.clear(); 21220b57cec5SDimitry Andric } 21230b57cec5SDimitry Andric } 21240b57cec5SDimitry Andric 21250b57cec5SDimitry Andric // Add addresses to .reloc section. Note that addresses are grouped by page. 
21260b57cec5SDimitry Andric void Writer::addBaserelBlocks(std::vector<Baserel> &v) { 21270b57cec5SDimitry Andric const uint32_t mask = ~uint32_t(pageSize - 1); 21280b57cec5SDimitry Andric uint32_t page = v[0].rva & mask; 21290b57cec5SDimitry Andric size_t i = 0, j = 1; 21300b57cec5SDimitry Andric for (size_t e = v.size(); j < e; ++j) { 21310b57cec5SDimitry Andric uint32_t p = v[j].rva & mask; 21320b57cec5SDimitry Andric if (p == page) 21330b57cec5SDimitry Andric continue; 21340b57cec5SDimitry Andric relocSec->addChunk(make<BaserelChunk>(page, &v[i], &v[0] + j)); 21350b57cec5SDimitry Andric i = j; 21360b57cec5SDimitry Andric page = p; 21370b57cec5SDimitry Andric } 21380b57cec5SDimitry Andric if (i == j) 21390b57cec5SDimitry Andric return; 21400b57cec5SDimitry Andric relocSec->addChunk(make<BaserelChunk>(page, &v[i], &v[0] + j)); 21410b57cec5SDimitry Andric } 21420b57cec5SDimitry Andric 21430b57cec5SDimitry Andric PartialSection *Writer::createPartialSection(StringRef name, 21440b57cec5SDimitry Andric uint32_t outChars) { 21450b57cec5SDimitry Andric PartialSection *&pSec = partialSections[{name, outChars}]; 21460b57cec5SDimitry Andric if (pSec) 21470b57cec5SDimitry Andric return pSec; 21480b57cec5SDimitry Andric pSec = make<PartialSection>(name, outChars); 21490b57cec5SDimitry Andric return pSec; 21500b57cec5SDimitry Andric } 21510b57cec5SDimitry Andric 21520b57cec5SDimitry Andric PartialSection *Writer::findPartialSection(StringRef name, uint32_t outChars) { 21530b57cec5SDimitry Andric auto it = partialSections.find({name, outChars}); 21540b57cec5SDimitry Andric if (it != partialSections.end()) 21550b57cec5SDimitry Andric return it->second; 21560b57cec5SDimitry Andric return nullptr; 21570b57cec5SDimitry Andric } 2158e8d8bef9SDimitry Andric 2159e8d8bef9SDimitry Andric void Writer::fixTlsAlignment() { 2160e8d8bef9SDimitry Andric Defined *tlsSym = 2161349cc55cSDimitry Andric dyn_cast_or_null<Defined>(ctx.symtab.findUnderscore("_tls_used")); 2162e8d8bef9SDimitry Andric 
if (!tlsSym) 2163e8d8bef9SDimitry Andric return; 2164e8d8bef9SDimitry Andric 2165349cc55cSDimitry Andric OutputSection *sec = ctx.getOutputSection(tlsSym->getChunk()); 2166e8d8bef9SDimitry Andric assert(sec && tlsSym->getRVA() >= sec->getRVA() && 2167e8d8bef9SDimitry Andric "no output section for _tls_used"); 2168e8d8bef9SDimitry Andric 2169e8d8bef9SDimitry Andric uint8_t *secBuf = buffer->getBufferStart() + sec->getFileOff(); 2170e8d8bef9SDimitry Andric uint64_t tlsOffset = tlsSym->getRVA() - sec->getRVA(); 2171*bdd1243dSDimitry Andric uint64_t directorySize = ctx.config.is64() 2172e8d8bef9SDimitry Andric ? sizeof(object::coff_tls_directory64) 2173e8d8bef9SDimitry Andric : sizeof(object::coff_tls_directory32); 2174e8d8bef9SDimitry Andric 2175e8d8bef9SDimitry Andric if (tlsOffset + directorySize > sec->getRawSize()) 2176e8d8bef9SDimitry Andric fatal("_tls_used sym is malformed"); 2177e8d8bef9SDimitry Andric 2178*bdd1243dSDimitry Andric if (ctx.config.is64()) { 2179e8d8bef9SDimitry Andric object::coff_tls_directory64 *tlsDir = 2180e8d8bef9SDimitry Andric reinterpret_cast<object::coff_tls_directory64 *>(&secBuf[tlsOffset]); 2181e8d8bef9SDimitry Andric tlsDir->setAlignment(tlsAlignment); 2182e8d8bef9SDimitry Andric } else { 2183e8d8bef9SDimitry Andric object::coff_tls_directory32 *tlsDir = 2184e8d8bef9SDimitry Andric reinterpret_cast<object::coff_tls_directory32 *>(&secBuf[tlsOffset]); 2185e8d8bef9SDimitry Andric tlsDir->setAlignment(tlsAlignment); 2186e8d8bef9SDimitry Andric } 2187e8d8bef9SDimitry Andric } 2188*bdd1243dSDimitry Andric 2189*bdd1243dSDimitry Andric void Writer::checkLoadConfig() { 2190*bdd1243dSDimitry Andric Symbol *sym = ctx.symtab.findUnderscore("_load_config_used"); 2191*bdd1243dSDimitry Andric auto *b = cast_if_present<DefinedRegular>(sym); 2192*bdd1243dSDimitry Andric if (!b) { 2193*bdd1243dSDimitry Andric if (ctx.config.guardCF != GuardCFLevel::Off) 2194*bdd1243dSDimitry Andric warn("Control Flow Guard is enabled but '_load_config_used' is 
missing"); 2195*bdd1243dSDimitry Andric return; 2196*bdd1243dSDimitry Andric } 2197*bdd1243dSDimitry Andric 2198*bdd1243dSDimitry Andric OutputSection *sec = ctx.getOutputSection(b->getChunk()); 2199*bdd1243dSDimitry Andric uint8_t *buf = buffer->getBufferStart(); 2200*bdd1243dSDimitry Andric uint8_t *secBuf = buf + sec->getFileOff(); 2201*bdd1243dSDimitry Andric uint8_t *symBuf = secBuf + (b->getRVA() - sec->getRVA()); 2202*bdd1243dSDimitry Andric uint32_t expectedAlign = ctx.config.is64() ? 8 : 4; 2203*bdd1243dSDimitry Andric if (b->getChunk()->getAlignment() < expectedAlign) 2204*bdd1243dSDimitry Andric warn("'_load_config_used' is misaligned (expected alignment to be " + 2205*bdd1243dSDimitry Andric Twine(expectedAlign) + " bytes, got " + 2206*bdd1243dSDimitry Andric Twine(b->getChunk()->getAlignment()) + " instead)"); 2207*bdd1243dSDimitry Andric else if (!isAligned(Align(expectedAlign), b->getRVA())) 2208*bdd1243dSDimitry Andric warn("'_load_config_used' is misaligned (RVA is 0x" + 2209*bdd1243dSDimitry Andric Twine::utohexstr(b->getRVA()) + " not aligned to " + 2210*bdd1243dSDimitry Andric Twine(expectedAlign) + " bytes)"); 2211*bdd1243dSDimitry Andric 2212*bdd1243dSDimitry Andric if (ctx.config.is64()) 2213*bdd1243dSDimitry Andric checkLoadConfigGuardData( 2214*bdd1243dSDimitry Andric reinterpret_cast<const coff_load_configuration64 *>(symBuf)); 2215*bdd1243dSDimitry Andric else 2216*bdd1243dSDimitry Andric checkLoadConfigGuardData( 2217*bdd1243dSDimitry Andric reinterpret_cast<const coff_load_configuration32 *>(symBuf)); 2218*bdd1243dSDimitry Andric } 2219*bdd1243dSDimitry Andric 2220*bdd1243dSDimitry Andric template <typename T> 2221*bdd1243dSDimitry Andric void Writer::checkLoadConfigGuardData(const T *loadConfig) { 2222*bdd1243dSDimitry Andric size_t loadConfigSize = loadConfig->Size; 2223*bdd1243dSDimitry Andric 2224*bdd1243dSDimitry Andric #define RETURN_IF_NOT_CONTAINS(field) \ 2225*bdd1243dSDimitry Andric if (loadConfigSize < offsetof(T, field) + 
sizeof(T::field)) { \ 2226*bdd1243dSDimitry Andric warn("'_load_config_used' structure too small to include " #field); \ 2227*bdd1243dSDimitry Andric return; \ 2228*bdd1243dSDimitry Andric } 2229*bdd1243dSDimitry Andric 2230*bdd1243dSDimitry Andric #define IF_CONTAINS(field) \ 2231*bdd1243dSDimitry Andric if (loadConfigSize >= offsetof(T, field) + sizeof(T::field)) 2232*bdd1243dSDimitry Andric 2233*bdd1243dSDimitry Andric #define CHECK_VA(field, sym) \ 2234*bdd1243dSDimitry Andric if (auto *s = dyn_cast<DefinedSynthetic>(ctx.symtab.findUnderscore(sym))) \ 2235*bdd1243dSDimitry Andric if (loadConfig->field != ctx.config.imageBase + s->getRVA()) \ 2236*bdd1243dSDimitry Andric warn(#field " not set correctly in '_load_config_used'"); 2237*bdd1243dSDimitry Andric 2238*bdd1243dSDimitry Andric #define CHECK_ABSOLUTE(field, sym) \ 2239*bdd1243dSDimitry Andric if (auto *s = dyn_cast<DefinedAbsolute>(ctx.symtab.findUnderscore(sym))) \ 2240*bdd1243dSDimitry Andric if (loadConfig->field != s->getVA()) \ 2241*bdd1243dSDimitry Andric warn(#field " not set correctly in '_load_config_used'"); 2242*bdd1243dSDimitry Andric 2243*bdd1243dSDimitry Andric if (ctx.config.guardCF == GuardCFLevel::Off) 2244*bdd1243dSDimitry Andric return; 2245*bdd1243dSDimitry Andric RETURN_IF_NOT_CONTAINS(GuardFlags) 2246*bdd1243dSDimitry Andric CHECK_VA(GuardCFFunctionTable, "__guard_fids_table") 2247*bdd1243dSDimitry Andric CHECK_ABSOLUTE(GuardCFFunctionCount, "__guard_fids_count") 2248*bdd1243dSDimitry Andric CHECK_ABSOLUTE(GuardFlags, "__guard_flags") 2249*bdd1243dSDimitry Andric IF_CONTAINS(GuardAddressTakenIatEntryCount) { 2250*bdd1243dSDimitry Andric CHECK_VA(GuardAddressTakenIatEntryTable, "__guard_iat_table") 2251*bdd1243dSDimitry Andric CHECK_ABSOLUTE(GuardAddressTakenIatEntryCount, "__guard_iat_count") 2252*bdd1243dSDimitry Andric } 2253*bdd1243dSDimitry Andric 2254*bdd1243dSDimitry Andric if (!(ctx.config.guardCF & GuardCFLevel::LongJmp)) 2255*bdd1243dSDimitry Andric return; 
2256*bdd1243dSDimitry Andric RETURN_IF_NOT_CONTAINS(GuardLongJumpTargetCount) 2257*bdd1243dSDimitry Andric CHECK_VA(GuardLongJumpTargetTable, "__guard_longjmp_table") 2258*bdd1243dSDimitry Andric CHECK_ABSOLUTE(GuardLongJumpTargetCount, "__guard_longjmp_count") 2259*bdd1243dSDimitry Andric 2260*bdd1243dSDimitry Andric if (!(ctx.config.guardCF & GuardCFLevel::EHCont)) 2261*bdd1243dSDimitry Andric return; 2262*bdd1243dSDimitry Andric RETURN_IF_NOT_CONTAINS(GuardEHContinuationCount) 2263*bdd1243dSDimitry Andric CHECK_VA(GuardEHContinuationTable, "__guard_eh_cont_table") 2264*bdd1243dSDimitry Andric CHECK_ABSOLUTE(GuardEHContinuationCount, "__guard_eh_cont_count") 2265*bdd1243dSDimitry Andric 2266*bdd1243dSDimitry Andric #undef RETURN_IF_NOT_CONTAINS 2267*bdd1243dSDimitry Andric #undef IF_CONTAINS 2268*bdd1243dSDimitry Andric #undef CHECK_VA 2269*bdd1243dSDimitry Andric #undef CHECK_ABSOLUTE 2270*bdd1243dSDimitry Andric } 2271