1 //===- COFFWriter.cpp -----------------------------------------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 9 #include "COFFWriter.h" 10 #include "COFFObject.h" 11 #include "llvm/ADT/ArrayRef.h" 12 #include "llvm/ADT/StringRef.h" 13 #include "llvm/BinaryFormat/COFF.h" 14 #include "llvm/Object/COFF.h" 15 #include "llvm/Support/Errc.h" 16 #include "llvm/Support/ErrorHandling.h" 17 #include <cstddef> 18 #include <cstdint> 19 20 namespace llvm { 21 namespace objcopy { 22 namespace coff { 23 24 using namespace object; 25 using namespace COFF; 26 27 Error COFFWriter::finalizeRelocTargets() { 28 for (Section &Sec : Obj.getMutableSections()) { 29 for (Relocation &R : Sec.Relocs) { 30 const Symbol *Sym = Obj.findSymbol(R.Target); 31 if (Sym == nullptr) 32 return createStringError(object_error::invalid_symbol_index, 33 "relocation target '%s' (%zu) not found", 34 R.TargetName.str().c_str(), R.Target); 35 R.Reloc.SymbolTableIndex = Sym->RawIndex; 36 } 37 } 38 return Error::success(); 39 } 40 41 Error COFFWriter::finalizeSymbolContents() { 42 for (Symbol &Sym : Obj.getMutableSymbols()) { 43 if (Sym.TargetSectionId <= 0) { 44 // Undefined, or a special kind of symbol. These negative values 45 // are stored in the SectionNumber field which is unsigned. 46 Sym.Sym.SectionNumber = static_cast<uint32_t>(Sym.TargetSectionId); 47 } else { 48 const Section *Sec = Obj.findSection(Sym.TargetSectionId); 49 if (Sec == nullptr) 50 return createStringError(object_error::invalid_symbol_index, 51 "symbol '%s' points to a removed section", 52 Sym.Name.str().c_str()); 53 Sym.Sym.SectionNumber = Sec->Index; 54 55 if (Sym.Sym.NumberOfAuxSymbols == 1 && 56 Sym.Sym.StorageClass == IMAGE_SYM_CLASS_STATIC) { 57 coff_aux_section_definition *SD = 58 reinterpret_cast<coff_aux_section_definition *>( 59 Sym.AuxData[0].Opaque); 60 uint32_t SDSectionNumber; 61 if (Sym.AssociativeComdatTargetSectionId == 0) { 62 // Not a comdat associative section; just set the Number field to 63 // the number of the section itself. 64 SDSectionNumber = Sec->Index; 65 } else { 66 Sec = Obj.findSection(Sym.AssociativeComdatTargetSectionId); 67 if (Sec == nullptr) 68 return createStringError( 69 object_error::invalid_symbol_index, 70 "symbol '%s' is associative to a removed section", 71 Sym.Name.str().c_str()); 72 SDSectionNumber = Sec->Index; 73 } 74 // Update the section definition with the new section number. 75 SD->NumberLowPart = static_cast<uint16_t>(SDSectionNumber); 76 SD->NumberHighPart = static_cast<uint16_t>(SDSectionNumber >> 16); 77 } 78 } 79 // Check that we actually have got AuxData to match the weak symbol target 80 // we want to set. Only >= 1 would be required, but only == 1 makes sense. 81 if (Sym.WeakTargetSymbolId && Sym.Sym.NumberOfAuxSymbols == 1) { 82 coff_aux_weak_external *WE = 83 reinterpret_cast<coff_aux_weak_external *>(Sym.AuxData[0].Opaque); 84 const Symbol *Target = Obj.findSymbol(*Sym.WeakTargetSymbolId); 85 if (Target == nullptr) 86 return createStringError(object_error::invalid_symbol_index, 87 "symbol '%s' is missing its weak target", 88 Sym.Name.str().c_str()); 89 WE->TagIndex = Target->RawIndex; 90 } 91 } 92 return Error::success(); 93 } 94 95 void COFFWriter::layoutSections() { 96 for (auto &S : Obj.getMutableSections()) { 97 if (S.Header.SizeOfRawData > 0) 98 S.Header.PointerToRawData = FileSize; 99 FileSize += S.Header.SizeOfRawData; // For executables, this is already 100 // aligned to FileAlignment. 101 if (S.Relocs.size() >= 0xffff) { 102 S.Header.Characteristics |= COFF::IMAGE_SCN_LNK_NRELOC_OVFL; 103 S.Header.NumberOfRelocations = 0xffff; 104 S.Header.PointerToRelocations = FileSize; 105 FileSize += sizeof(coff_relocation); 106 } else { 107 S.Header.NumberOfRelocations = S.Relocs.size(); 108 S.Header.PointerToRelocations = S.Relocs.size() ? FileSize : 0; 109 } 110 111 FileSize += S.Relocs.size() * sizeof(coff_relocation); 112 FileSize = alignTo(FileSize, FileAlignment); 113 114 if (S.Header.Characteristics & IMAGE_SCN_CNT_INITIALIZED_DATA) 115 SizeOfInitializedData += S.Header.SizeOfRawData; 116 } 117 } 118 119 Expected<size_t> COFFWriter::finalizeStringTable() { 120 for (const auto &S : Obj.getSections()) 121 if (S.Name.size() > COFF::NameSize) 122 StrTabBuilder.add(S.Name); 123 124 for (const auto &S : Obj.getSymbols()) 125 if (S.Name.size() > COFF::NameSize) 126 StrTabBuilder.add(S.Name); 127 128 StrTabBuilder.finalize(); 129 130 for (auto &S : Obj.getMutableSections()) { 131 memset(S.Header.Name, 0, sizeof(S.Header.Name)); 132 if (S.Name.size() <= COFF::NameSize) { 133 // Short names can go in the field directly. 134 memcpy(S.Header.Name, S.Name.data(), S.Name.size()); 135 } else { 136 // Offset of the section name in the string table. 137 size_t Offset = StrTabBuilder.getOffset(S.Name); 138 if (!COFF::encodeSectionName(S.Header.Name, Offset)) 139 return createStringError(object_error::invalid_section_index, 140 "COFF string table is greater than 64GB, " 141 "unable to encode section name offset"); 142 } 143 } 144 for (auto &S : Obj.getMutableSymbols()) { 145 if (S.Name.size() > COFF::NameSize) { 146 S.Sym.Name.Offset.Zeroes = 0; 147 S.Sym.Name.Offset.Offset = StrTabBuilder.getOffset(S.Name); 148 } else { 149 strncpy(S.Sym.Name.ShortName, S.Name.data(), COFF::NameSize); 150 } 151 } 152 return StrTabBuilder.getSize(); 153 } 154 155 template <class SymbolTy> 156 std::pair<size_t, size_t> COFFWriter::finalizeSymbolTable() { 157 size_t RawSymIndex = 0; 158 for (auto &S : Obj.getMutableSymbols()) { 159 // Symbols normally have NumberOfAuxSymbols set correctly all the time. 160 // For file symbols, we need to know the output file's symbol size to be 161 // able to calculate the number of slots it occupies. 162 if (!S.AuxFile.empty()) 163 S.Sym.NumberOfAuxSymbols = 164 alignTo(S.AuxFile.size(), sizeof(SymbolTy)) / sizeof(SymbolTy); 165 S.RawIndex = RawSymIndex; 166 RawSymIndex += 1 + S.Sym.NumberOfAuxSymbols; 167 } 168 return std::make_pair(RawSymIndex * sizeof(SymbolTy), sizeof(SymbolTy)); 169 } 170 171 Error COFFWriter::finalize(bool IsBigObj) { 172 size_t SymTabSize, SymbolSize; 173 std::tie(SymTabSize, SymbolSize) = IsBigObj 174 ? finalizeSymbolTable<coff_symbol32>() 175 : finalizeSymbolTable<coff_symbol16>(); 176 177 if (Error E = finalizeRelocTargets()) 178 return E; 179 if (Error E = finalizeSymbolContents()) 180 return E; 181 182 size_t SizeOfHeaders = 0; 183 FileAlignment = 1; 184 size_t PeHeaderSize = 0; 185 if (Obj.IsPE) { 186 Obj.DosHeader.AddressOfNewExeHeader = 187 sizeof(Obj.DosHeader) + Obj.DosStub.size(); 188 SizeOfHeaders += Obj.DosHeader.AddressOfNewExeHeader + sizeof(PEMagic); 189 190 FileAlignment = Obj.PeHeader.FileAlignment; 191 Obj.PeHeader.NumberOfRvaAndSize = Obj.DataDirectories.size(); 192 193 PeHeaderSize = Obj.Is64 ? sizeof(pe32plus_header) : sizeof(pe32_header); 194 SizeOfHeaders += 195 PeHeaderSize + sizeof(data_directory) * Obj.DataDirectories.size(); 196 } 197 Obj.CoffFileHeader.NumberOfSections = Obj.getSections().size(); 198 SizeOfHeaders += 199 IsBigObj ? sizeof(coff_bigobj_file_header) : sizeof(coff_file_header); 200 SizeOfHeaders += sizeof(coff_section) * Obj.getSections().size(); 201 SizeOfHeaders = alignTo(SizeOfHeaders, FileAlignment); 202 203 Obj.CoffFileHeader.SizeOfOptionalHeader = 204 PeHeaderSize + sizeof(data_directory) * Obj.DataDirectories.size(); 205 206 FileSize = SizeOfHeaders; 207 SizeOfInitializedData = 0; 208 209 layoutSections(); 210 211 if (Obj.IsPE) { 212 Obj.PeHeader.SizeOfHeaders = SizeOfHeaders; 213 Obj.PeHeader.SizeOfInitializedData = SizeOfInitializedData; 214 215 if (!Obj.getSections().empty()) { 216 const Section &S = Obj.getSections().back(); 217 Obj.PeHeader.SizeOfImage = 218 alignTo(S.Header.VirtualAddress + S.Header.VirtualSize, 219 Obj.PeHeader.SectionAlignment); 220 } 221 222 // If the PE header had a checksum, clear it, since it isn't valid 223 // any longer. (We don't calculate a new one.) 224 Obj.PeHeader.CheckSum = 0; 225 } 226 227 Expected<size_t> StrTabSizeOrErr = finalizeStringTable(); 228 if (!StrTabSizeOrErr) 229 return StrTabSizeOrErr.takeError(); 230 231 size_t StrTabSize = *StrTabSizeOrErr; 232 233 size_t PointerToSymbolTable = FileSize; 234 // StrTabSize <= 4 is the size of an empty string table, only consisting 235 // of the length field. 236 if (SymTabSize == 0 && StrTabSize <= 4 && Obj.IsPE) { 237 // For executables, don't point to the symbol table and skip writing 238 // the length field, if both the symbol and string tables are empty. 239 PointerToSymbolTable = 0; 240 StrTabSize = 0; 241 } 242 243 size_t NumRawSymbols = SymTabSize / SymbolSize; 244 Obj.CoffFileHeader.PointerToSymbolTable = PointerToSymbolTable; 245 Obj.CoffFileHeader.NumberOfSymbols = NumRawSymbols; 246 FileSize += SymTabSize + StrTabSize; 247 FileSize = alignTo(FileSize, FileAlignment); 248 249 return Error::success(); 250 } 251 252 void COFFWriter::writeHeaders(bool IsBigObj) { 253 uint8_t *Ptr = reinterpret_cast<uint8_t *>(Buf->getBufferStart()); 254 if (Obj.IsPE) { 255 memcpy(Ptr, &Obj.DosHeader, sizeof(Obj.DosHeader)); 256 Ptr += sizeof(Obj.DosHeader); 257 memcpy(Ptr, Obj.DosStub.data(), Obj.DosStub.size()); 258 Ptr += Obj.DosStub.size(); 259 memcpy(Ptr, PEMagic, sizeof(PEMagic)); 260 Ptr += sizeof(PEMagic); 261 } 262 if (!IsBigObj) { 263 memcpy(Ptr, &Obj.CoffFileHeader, sizeof(Obj.CoffFileHeader)); 264 Ptr += sizeof(Obj.CoffFileHeader); 265 } else { 266 // Generate a coff_bigobj_file_header, filling it in with the values 267 // from Obj.CoffFileHeader. All extra fields that don't exist in 268 // coff_file_header can be set to hardcoded values. 269 coff_bigobj_file_header BigObjHeader; 270 BigObjHeader.Sig1 = IMAGE_FILE_MACHINE_UNKNOWN; 271 BigObjHeader.Sig2 = 0xffff; 272 BigObjHeader.Version = BigObjHeader::MinBigObjectVersion; 273 BigObjHeader.Machine = Obj.CoffFileHeader.Machine; 274 BigObjHeader.TimeDateStamp = Obj.CoffFileHeader.TimeDateStamp; 275 memcpy(BigObjHeader.UUID, BigObjMagic, sizeof(BigObjMagic)); 276 BigObjHeader.unused1 = 0; 277 BigObjHeader.unused2 = 0; 278 BigObjHeader.unused3 = 0; 279 BigObjHeader.unused4 = 0; 280 // The value in Obj.CoffFileHeader.NumberOfSections is truncated, thus 281 // get the original one instead. 282 BigObjHeader.NumberOfSections = Obj.getSections().size(); 283 BigObjHeader.PointerToSymbolTable = Obj.CoffFileHeader.PointerToSymbolTable; 284 BigObjHeader.NumberOfSymbols = Obj.CoffFileHeader.NumberOfSymbols; 285 286 memcpy(Ptr, &BigObjHeader, sizeof(BigObjHeader)); 287 Ptr += sizeof(BigObjHeader); 288 } 289 if (Obj.IsPE) { 290 if (Obj.Is64) { 291 memcpy(Ptr, &Obj.PeHeader, sizeof(Obj.PeHeader)); 292 Ptr += sizeof(Obj.PeHeader); 293 } else { 294 pe32_header PeHeader; 295 copyPeHeader(PeHeader, Obj.PeHeader); 296 // The pe32plus_header (stored in Object) lacks the BaseOfData field. 297 PeHeader.BaseOfData = Obj.BaseOfData; 298 299 memcpy(Ptr, &PeHeader, sizeof(PeHeader)); 300 Ptr += sizeof(PeHeader); 301 } 302 for (const auto &DD : Obj.DataDirectories) { 303 memcpy(Ptr, &DD, sizeof(DD)); 304 Ptr += sizeof(DD); 305 } 306 } 307 for (const auto &S : Obj.getSections()) { 308 memcpy(Ptr, &S.Header, sizeof(S.Header)); 309 Ptr += sizeof(S.Header); 310 } 311 } 312 313 void COFFWriter::writeSections() { 314 for (const auto &S : Obj.getSections()) { 315 uint8_t *Ptr = reinterpret_cast<uint8_t *>(Buf->getBufferStart()) + 316 S.Header.PointerToRawData; 317 ArrayRef<uint8_t> Contents = S.getContents(); 318 std::copy(Contents.begin(), Contents.end(), Ptr); 319 320 // For executable sections, pad the remainder of the raw data size with 321 // 0xcc, which is int3 on x86. 322 if ((S.Header.Characteristics & IMAGE_SCN_CNT_CODE) && 323 S.Header.SizeOfRawData > Contents.size()) 324 memset(Ptr + Contents.size(), 0xcc, 325 S.Header.SizeOfRawData - Contents.size()); 326 327 Ptr += S.Header.SizeOfRawData; 328 329 if (S.Relocs.size() >= 0xffff) { 330 object::coff_relocation R; 331 R.VirtualAddress = S.Relocs.size() + 1; 332 R.SymbolTableIndex = 0; 333 R.Type = 0; 334 memcpy(Ptr, &R, sizeof(R)); 335 Ptr += sizeof(R); 336 } 337 for (const auto &R : S.Relocs) { 338 memcpy(Ptr, &R.Reloc, sizeof(R.Reloc)); 339 Ptr += sizeof(R.Reloc); 340 } 341 } 342 } 343 344 template <class SymbolTy> void COFFWriter::writeSymbolStringTables() { 345 uint8_t *Ptr = reinterpret_cast<uint8_t *>(Buf->getBufferStart()) + 346 Obj.CoffFileHeader.PointerToSymbolTable; 347 for (const auto &S : Obj.getSymbols()) { 348 // Convert symbols back to the right size, from coff_symbol32. 349 copySymbol<SymbolTy, coff_symbol32>(*reinterpret_cast<SymbolTy *>(Ptr), 350 S.Sym); 351 Ptr += sizeof(SymbolTy); 352 if (!S.AuxFile.empty()) { 353 // For file symbols, just write the string into the aux symbol slots, 354 // assuming that the unwritten parts are initialized to zero in the memory 355 // mapped file. 356 std::copy(S.AuxFile.begin(), S.AuxFile.end(), Ptr); 357 Ptr += S.Sym.NumberOfAuxSymbols * sizeof(SymbolTy); 358 } else { 359 // For other auxillary symbols, write their opaque payload into one symbol 360 // table slot each. For big object files, the symbols are larger than the 361 // opaque auxillary symbol struct and we leave padding at the end of each 362 // entry. 363 for (const AuxSymbol &AuxSym : S.AuxData) { 364 ArrayRef<uint8_t> Ref = AuxSym.getRef(); 365 std::copy(Ref.begin(), Ref.end(), Ptr); 366 Ptr += sizeof(SymbolTy); 367 } 368 } 369 } 370 if (StrTabBuilder.getSize() > 4 || !Obj.IsPE) { 371 // Always write a string table in object files, even an empty one. 372 StrTabBuilder.write(Ptr); 373 Ptr += StrTabBuilder.getSize(); 374 } 375 } 376 377 Error COFFWriter::write(bool IsBigObj) { 378 if (Error E = finalize(IsBigObj)) 379 return E; 380 381 Buf = WritableMemoryBuffer::getNewMemBuffer(FileSize); 382 if (!Buf) 383 return createStringError(llvm::errc::not_enough_memory, 384 "failed to allocate memory buffer of " + 385 Twine::utohexstr(FileSize) + " bytes."); 386 387 writeHeaders(IsBigObj); 388 writeSections(); 389 if (IsBigObj) 390 writeSymbolStringTables<coff_symbol32>(); 391 else 392 writeSymbolStringTables<coff_symbol16>(); 393 394 if (Obj.IsPE) 395 if (Error E = patchDebugDirectory()) 396 return E; 397 398 // TODO: Implement direct writing to the output stream (without intermediate 399 // memory buffer Buf). 400 Out.write(Buf->getBufferStart(), Buf->getBufferSize()); 401 return Error::success(); 402 } 403 404 Expected<uint32_t> COFFWriter::virtualAddressToFileAddress(uint32_t RVA) { 405 for (const auto &S : Obj.getSections()) { 406 if (RVA >= S.Header.VirtualAddress && 407 RVA < S.Header.VirtualAddress + S.Header.SizeOfRawData) 408 return S.Header.PointerToRawData + RVA - S.Header.VirtualAddress; 409 } 410 return createStringError(object_error::parse_failed, 411 "debug directory payload not found"); 412 } 413 414 // Locate which sections contain the debug directories, iterate over all 415 // the debug_directory structs in there, and set the PointerToRawData field 416 // in all of them, according to their new physical location in the file. 417 Error COFFWriter::patchDebugDirectory() { 418 if (Obj.DataDirectories.size() <= DEBUG_DIRECTORY) 419 return Error::success(); 420 const data_directory *Dir = &Obj.DataDirectories[DEBUG_DIRECTORY]; 421 if (Dir->Size <= 0) 422 return Error::success(); 423 for (const auto &S : Obj.getSections()) { 424 if (Dir->RelativeVirtualAddress >= S.Header.VirtualAddress && 425 Dir->RelativeVirtualAddress < 426 S.Header.VirtualAddress + S.Header.SizeOfRawData) { 427 if (Dir->RelativeVirtualAddress + Dir->Size > 428 S.Header.VirtualAddress + S.Header.SizeOfRawData) 429 return createStringError(object_error::parse_failed, 430 "debug directory extends past end of section"); 431 432 size_t Offset = Dir->RelativeVirtualAddress - S.Header.VirtualAddress; 433 uint8_t *Ptr = reinterpret_cast<uint8_t *>(Buf->getBufferStart()) + 434 S.Header.PointerToRawData + Offset; 435 uint8_t *End = Ptr + Dir->Size; 436 while (Ptr < End) { 437 debug_directory *Debug = reinterpret_cast<debug_directory *>(Ptr); 438 if (Debug->PointerToRawData) { 439 if (Expected<uint32_t> FilePosOrErr = 440 virtualAddressToFileAddress(Debug->AddressOfRawData)) 441 Debug->PointerToRawData = *FilePosOrErr; 442 else 443 return FilePosOrErr.takeError(); 444 } 445 Ptr += sizeof(debug_directory); 446 Offset += sizeof(debug_directory); 447 } 448 // Debug directory found and patched, all done. 449 return Error::success(); 450 } 451 } 452 return createStringError(object_error::parse_failed, 453 "debug directory not found"); 454 } 455 456 Error COFFWriter::write() { 457 bool IsBigObj = Obj.getSections().size() > MaxNumberOfSections16; 458 if (IsBigObj && Obj.IsPE) 459 return createStringError(object_error::parse_failed, 460 "too many sections for executable"); 461 return write(IsBigObj); 462 } 463 464 } // end namespace coff 465 } // end namespace objcopy 466 } // end namespace llvm 467