xref: /freebsd/contrib/llvm-project/llvm/lib/ObjCopy/COFF/COFFWriter.cpp (revision d9a42747950146bf03cda7f6e25d219253f8a57a)
1 //===- COFFWriter.cpp -----------------------------------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 #include "COFFWriter.h"
10 #include "COFFObject.h"
11 #include "llvm/ADT/ArrayRef.h"
12 #include "llvm/ADT/StringRef.h"
13 #include "llvm/BinaryFormat/COFF.h"
14 #include "llvm/Object/COFF.h"
15 #include "llvm/Support/Errc.h"
16 #include "llvm/Support/ErrorHandling.h"
17 #include <cstddef>
18 #include <cstdint>
19 
20 namespace llvm {
21 namespace objcopy {
22 namespace coff {
23 
24 using namespace object;
25 using namespace COFF;
26 
27 Error COFFWriter::finalizeRelocTargets() {
28   for (Section &Sec : Obj.getMutableSections()) {
29     for (Relocation &R : Sec.Relocs) {
30       const Symbol *Sym = Obj.findSymbol(R.Target);
31       if (Sym == nullptr)
32         return createStringError(object_error::invalid_symbol_index,
33                                  "relocation target '%s' (%zu) not found",
34                                  R.TargetName.str().c_str(), R.Target);
35       R.Reloc.SymbolTableIndex = Sym->RawIndex;
36     }
37   }
38   return Error::success();
39 }
40 
41 Error COFFWriter::finalizeSymbolContents() {
42   for (Symbol &Sym : Obj.getMutableSymbols()) {
43     if (Sym.TargetSectionId <= 0) {
44       // Undefined, or a special kind of symbol. These negative values
45       // are stored in the SectionNumber field which is unsigned.
46       Sym.Sym.SectionNumber = static_cast<uint32_t>(Sym.TargetSectionId);
47     } else {
48       const Section *Sec = Obj.findSection(Sym.TargetSectionId);
49       if (Sec == nullptr)
50         return createStringError(object_error::invalid_symbol_index,
51                                  "symbol '%s' points to a removed section",
52                                  Sym.Name.str().c_str());
53       Sym.Sym.SectionNumber = Sec->Index;
54 
55       if (Sym.Sym.NumberOfAuxSymbols == 1 &&
56           Sym.Sym.StorageClass == IMAGE_SYM_CLASS_STATIC) {
57         coff_aux_section_definition *SD =
58             reinterpret_cast<coff_aux_section_definition *>(
59                 Sym.AuxData[0].Opaque);
60         uint32_t SDSectionNumber;
61         if (Sym.AssociativeComdatTargetSectionId == 0) {
62           // Not a comdat associative section; just set the Number field to
63           // the number of the section itself.
64           SDSectionNumber = Sec->Index;
65         } else {
66           Sec = Obj.findSection(Sym.AssociativeComdatTargetSectionId);
67           if (Sec == nullptr)
68             return createStringError(
69                 object_error::invalid_symbol_index,
70                 "symbol '%s' is associative to a removed section",
71                 Sym.Name.str().c_str());
72           SDSectionNumber = Sec->Index;
73         }
74         // Update the section definition with the new section number.
75         SD->NumberLowPart = static_cast<uint16_t>(SDSectionNumber);
76         SD->NumberHighPart = static_cast<uint16_t>(SDSectionNumber >> 16);
77       }
78     }
79     // Check that we actually have got AuxData to match the weak symbol target
80     // we want to set. Only >= 1 would be required, but only == 1 makes sense.
81     if (Sym.WeakTargetSymbolId && Sym.Sym.NumberOfAuxSymbols == 1) {
82       coff_aux_weak_external *WE =
83           reinterpret_cast<coff_aux_weak_external *>(Sym.AuxData[0].Opaque);
84       const Symbol *Target = Obj.findSymbol(*Sym.WeakTargetSymbolId);
85       if (Target == nullptr)
86         return createStringError(object_error::invalid_symbol_index,
87                                  "symbol '%s' is missing its weak target",
88                                  Sym.Name.str().c_str());
89       WE->TagIndex = Target->RawIndex;
90     }
91   }
92   return Error::success();
93 }
94 
95 void COFFWriter::layoutSections() {
96   for (auto &S : Obj.getMutableSections()) {
97     if (S.Header.SizeOfRawData > 0)
98       S.Header.PointerToRawData = FileSize;
99     FileSize += S.Header.SizeOfRawData; // For executables, this is already
100                                         // aligned to FileAlignment.
101     if (S.Relocs.size() >= 0xffff) {
102       S.Header.Characteristics |= COFF::IMAGE_SCN_LNK_NRELOC_OVFL;
103       S.Header.NumberOfRelocations = 0xffff;
104       S.Header.PointerToRelocations = FileSize;
105       FileSize += sizeof(coff_relocation);
106     } else {
107       S.Header.NumberOfRelocations = S.Relocs.size();
108       S.Header.PointerToRelocations = S.Relocs.size() ? FileSize : 0;
109     }
110 
111     FileSize += S.Relocs.size() * sizeof(coff_relocation);
112     FileSize = alignTo(FileSize, FileAlignment);
113 
114     if (S.Header.Characteristics & IMAGE_SCN_CNT_INITIALIZED_DATA)
115       SizeOfInitializedData += S.Header.SizeOfRawData;
116   }
117 }
118 
119 Expected<size_t> COFFWriter::finalizeStringTable() {
120   for (const auto &S : Obj.getSections())
121     if (S.Name.size() > COFF::NameSize)
122       StrTabBuilder.add(S.Name);
123 
124   for (const auto &S : Obj.getSymbols())
125     if (S.Name.size() > COFF::NameSize)
126       StrTabBuilder.add(S.Name);
127 
128   StrTabBuilder.finalize();
129 
130   for (auto &S : Obj.getMutableSections()) {
131     memset(S.Header.Name, 0, sizeof(S.Header.Name));
132     if (S.Name.size() <= COFF::NameSize) {
133       // Short names can go in the field directly.
134       memcpy(S.Header.Name, S.Name.data(), S.Name.size());
135     } else {
136       // Offset of the section name in the string table.
137       size_t Offset = StrTabBuilder.getOffset(S.Name);
138       if (!COFF::encodeSectionName(S.Header.Name, Offset))
139         return createStringError(object_error::invalid_section_index,
140                                  "COFF string table is greater than 64GB, "
141                                  "unable to encode section name offset");
142     }
143   }
144   for (auto &S : Obj.getMutableSymbols()) {
145     if (S.Name.size() > COFF::NameSize) {
146       S.Sym.Name.Offset.Zeroes = 0;
147       S.Sym.Name.Offset.Offset = StrTabBuilder.getOffset(S.Name);
148     } else {
149       strncpy(S.Sym.Name.ShortName, S.Name.data(), COFF::NameSize);
150     }
151   }
152   return StrTabBuilder.getSize();
153 }
154 
155 template <class SymbolTy>
156 std::pair<size_t, size_t> COFFWriter::finalizeSymbolTable() {
157   size_t RawSymIndex = 0;
158   for (auto &S : Obj.getMutableSymbols()) {
159     // Symbols normally have NumberOfAuxSymbols set correctly all the time.
160     // For file symbols, we need to know the output file's symbol size to be
161     // able to calculate the number of slots it occupies.
162     if (!S.AuxFile.empty())
163       S.Sym.NumberOfAuxSymbols =
164           alignTo(S.AuxFile.size(), sizeof(SymbolTy)) / sizeof(SymbolTy);
165     S.RawIndex = RawSymIndex;
166     RawSymIndex += 1 + S.Sym.NumberOfAuxSymbols;
167   }
168   return std::make_pair(RawSymIndex * sizeof(SymbolTy), sizeof(SymbolTy));
169 }
170 
171 Error COFFWriter::finalize(bool IsBigObj) {
172   size_t SymTabSize, SymbolSize;
173   std::tie(SymTabSize, SymbolSize) = IsBigObj
174                                          ? finalizeSymbolTable<coff_symbol32>()
175                                          : finalizeSymbolTable<coff_symbol16>();
176 
177   if (Error E = finalizeRelocTargets())
178     return E;
179   if (Error E = finalizeSymbolContents())
180     return E;
181 
182   size_t SizeOfHeaders = 0;
183   FileAlignment = 1;
184   size_t PeHeaderSize = 0;
185   if (Obj.IsPE) {
186     Obj.DosHeader.AddressOfNewExeHeader =
187         sizeof(Obj.DosHeader) + Obj.DosStub.size();
188     SizeOfHeaders += Obj.DosHeader.AddressOfNewExeHeader + sizeof(PEMagic);
189 
190     FileAlignment = Obj.PeHeader.FileAlignment;
191     Obj.PeHeader.NumberOfRvaAndSize = Obj.DataDirectories.size();
192 
193     PeHeaderSize = Obj.Is64 ? sizeof(pe32plus_header) : sizeof(pe32_header);
194     SizeOfHeaders +=
195         PeHeaderSize + sizeof(data_directory) * Obj.DataDirectories.size();
196   }
197   Obj.CoffFileHeader.NumberOfSections = Obj.getSections().size();
198   SizeOfHeaders +=
199       IsBigObj ? sizeof(coff_bigobj_file_header) : sizeof(coff_file_header);
200   SizeOfHeaders += sizeof(coff_section) * Obj.getSections().size();
201   SizeOfHeaders = alignTo(SizeOfHeaders, FileAlignment);
202 
203   Obj.CoffFileHeader.SizeOfOptionalHeader =
204       PeHeaderSize + sizeof(data_directory) * Obj.DataDirectories.size();
205 
206   FileSize = SizeOfHeaders;
207   SizeOfInitializedData = 0;
208 
209   layoutSections();
210 
211   if (Obj.IsPE) {
212     Obj.PeHeader.SizeOfHeaders = SizeOfHeaders;
213     Obj.PeHeader.SizeOfInitializedData = SizeOfInitializedData;
214 
215     if (!Obj.getSections().empty()) {
216       const Section &S = Obj.getSections().back();
217       Obj.PeHeader.SizeOfImage =
218           alignTo(S.Header.VirtualAddress + S.Header.VirtualSize,
219                   Obj.PeHeader.SectionAlignment);
220     }
221 
222     // If the PE header had a checksum, clear it, since it isn't valid
223     // any longer. (We don't calculate a new one.)
224     Obj.PeHeader.CheckSum = 0;
225   }
226 
227   Expected<size_t> StrTabSizeOrErr = finalizeStringTable();
228   if (!StrTabSizeOrErr)
229     return StrTabSizeOrErr.takeError();
230 
231   size_t StrTabSize = *StrTabSizeOrErr;
232 
233   size_t PointerToSymbolTable = FileSize;
234   // StrTabSize <= 4 is the size of an empty string table, only consisting
235   // of the length field.
236   if (SymTabSize == 0 && StrTabSize <= 4 && Obj.IsPE) {
237     // For executables, don't point to the symbol table and skip writing
238     // the length field, if both the symbol and string tables are empty.
239     PointerToSymbolTable = 0;
240     StrTabSize = 0;
241   }
242 
243   size_t NumRawSymbols = SymTabSize / SymbolSize;
244   Obj.CoffFileHeader.PointerToSymbolTable = PointerToSymbolTable;
245   Obj.CoffFileHeader.NumberOfSymbols = NumRawSymbols;
246   FileSize += SymTabSize + StrTabSize;
247   FileSize = alignTo(FileSize, FileAlignment);
248 
249   return Error::success();
250 }
251 
252 void COFFWriter::writeHeaders(bool IsBigObj) {
253   uint8_t *Ptr = reinterpret_cast<uint8_t *>(Buf->getBufferStart());
254   if (Obj.IsPE) {
255     memcpy(Ptr, &Obj.DosHeader, sizeof(Obj.DosHeader));
256     Ptr += sizeof(Obj.DosHeader);
257     memcpy(Ptr, Obj.DosStub.data(), Obj.DosStub.size());
258     Ptr += Obj.DosStub.size();
259     memcpy(Ptr, PEMagic, sizeof(PEMagic));
260     Ptr += sizeof(PEMagic);
261   }
262   if (!IsBigObj) {
263     memcpy(Ptr, &Obj.CoffFileHeader, sizeof(Obj.CoffFileHeader));
264     Ptr += sizeof(Obj.CoffFileHeader);
265   } else {
266     // Generate a coff_bigobj_file_header, filling it in with the values
267     // from Obj.CoffFileHeader. All extra fields that don't exist in
268     // coff_file_header can be set to hardcoded values.
269     coff_bigobj_file_header BigObjHeader;
270     BigObjHeader.Sig1 = IMAGE_FILE_MACHINE_UNKNOWN;
271     BigObjHeader.Sig2 = 0xffff;
272     BigObjHeader.Version = BigObjHeader::MinBigObjectVersion;
273     BigObjHeader.Machine = Obj.CoffFileHeader.Machine;
274     BigObjHeader.TimeDateStamp = Obj.CoffFileHeader.TimeDateStamp;
275     memcpy(BigObjHeader.UUID, BigObjMagic, sizeof(BigObjMagic));
276     BigObjHeader.unused1 = 0;
277     BigObjHeader.unused2 = 0;
278     BigObjHeader.unused3 = 0;
279     BigObjHeader.unused4 = 0;
280     // The value in Obj.CoffFileHeader.NumberOfSections is truncated, thus
281     // get the original one instead.
282     BigObjHeader.NumberOfSections = Obj.getSections().size();
283     BigObjHeader.PointerToSymbolTable = Obj.CoffFileHeader.PointerToSymbolTable;
284     BigObjHeader.NumberOfSymbols = Obj.CoffFileHeader.NumberOfSymbols;
285 
286     memcpy(Ptr, &BigObjHeader, sizeof(BigObjHeader));
287     Ptr += sizeof(BigObjHeader);
288   }
289   if (Obj.IsPE) {
290     if (Obj.Is64) {
291       memcpy(Ptr, &Obj.PeHeader, sizeof(Obj.PeHeader));
292       Ptr += sizeof(Obj.PeHeader);
293     } else {
294       pe32_header PeHeader;
295       copyPeHeader(PeHeader, Obj.PeHeader);
296       // The pe32plus_header (stored in Object) lacks the BaseOfData field.
297       PeHeader.BaseOfData = Obj.BaseOfData;
298 
299       memcpy(Ptr, &PeHeader, sizeof(PeHeader));
300       Ptr += sizeof(PeHeader);
301     }
302     for (const auto &DD : Obj.DataDirectories) {
303       memcpy(Ptr, &DD, sizeof(DD));
304       Ptr += sizeof(DD);
305     }
306   }
307   for (const auto &S : Obj.getSections()) {
308     memcpy(Ptr, &S.Header, sizeof(S.Header));
309     Ptr += sizeof(S.Header);
310   }
311 }
312 
313 void COFFWriter::writeSections() {
314   for (const auto &S : Obj.getSections()) {
315     uint8_t *Ptr = reinterpret_cast<uint8_t *>(Buf->getBufferStart()) +
316                    S.Header.PointerToRawData;
317     ArrayRef<uint8_t> Contents = S.getContents();
318     std::copy(Contents.begin(), Contents.end(), Ptr);
319 
320     // For executable sections, pad the remainder of the raw data size with
321     // 0xcc, which is int3 on x86.
322     if ((S.Header.Characteristics & IMAGE_SCN_CNT_CODE) &&
323         S.Header.SizeOfRawData > Contents.size())
324       memset(Ptr + Contents.size(), 0xcc,
325              S.Header.SizeOfRawData - Contents.size());
326 
327     Ptr += S.Header.SizeOfRawData;
328 
329     if (S.Relocs.size() >= 0xffff) {
330       object::coff_relocation R;
331       R.VirtualAddress = S.Relocs.size() + 1;
332       R.SymbolTableIndex = 0;
333       R.Type = 0;
334       memcpy(Ptr, &R, sizeof(R));
335       Ptr += sizeof(R);
336     }
337     for (const auto &R : S.Relocs) {
338       memcpy(Ptr, &R.Reloc, sizeof(R.Reloc));
339       Ptr += sizeof(R.Reloc);
340     }
341   }
342 }
343 
344 template <class SymbolTy> void COFFWriter::writeSymbolStringTables() {
345   uint8_t *Ptr = reinterpret_cast<uint8_t *>(Buf->getBufferStart()) +
346                  Obj.CoffFileHeader.PointerToSymbolTable;
347   for (const auto &S : Obj.getSymbols()) {
348     // Convert symbols back to the right size, from coff_symbol32.
349     copySymbol<SymbolTy, coff_symbol32>(*reinterpret_cast<SymbolTy *>(Ptr),
350                                         S.Sym);
351     Ptr += sizeof(SymbolTy);
352     if (!S.AuxFile.empty()) {
353       // For file symbols, just write the string into the aux symbol slots,
354       // assuming that the unwritten parts are initialized to zero in the memory
355       // mapped file.
356       std::copy(S.AuxFile.begin(), S.AuxFile.end(), Ptr);
357       Ptr += S.Sym.NumberOfAuxSymbols * sizeof(SymbolTy);
358     } else {
359       // For other auxillary symbols, write their opaque payload into one symbol
360       // table slot each. For big object files, the symbols are larger than the
361       // opaque auxillary symbol struct and we leave padding at the end of each
362       // entry.
363       for (const AuxSymbol &AuxSym : S.AuxData) {
364         ArrayRef<uint8_t> Ref = AuxSym.getRef();
365         std::copy(Ref.begin(), Ref.end(), Ptr);
366         Ptr += sizeof(SymbolTy);
367       }
368     }
369   }
370   if (StrTabBuilder.getSize() > 4 || !Obj.IsPE) {
371     // Always write a string table in object files, even an empty one.
372     StrTabBuilder.write(Ptr);
373     Ptr += StrTabBuilder.getSize();
374   }
375 }
376 
377 Error COFFWriter::write(bool IsBigObj) {
378   if (Error E = finalize(IsBigObj))
379     return E;
380 
381   Buf = WritableMemoryBuffer::getNewMemBuffer(FileSize);
382   if (!Buf)
383     return createStringError(llvm::errc::not_enough_memory,
384                              "failed to allocate memory buffer of " +
385                                  Twine::utohexstr(FileSize) + " bytes.");
386 
387   writeHeaders(IsBigObj);
388   writeSections();
389   if (IsBigObj)
390     writeSymbolStringTables<coff_symbol32>();
391   else
392     writeSymbolStringTables<coff_symbol16>();
393 
394   if (Obj.IsPE)
395     if (Error E = patchDebugDirectory())
396       return E;
397 
398   // TODO: Implement direct writing to the output stream (without intermediate
399   // memory buffer Buf).
400   Out.write(Buf->getBufferStart(), Buf->getBufferSize());
401   return Error::success();
402 }
403 
404 Expected<uint32_t> COFFWriter::virtualAddressToFileAddress(uint32_t RVA) {
405   for (const auto &S : Obj.getSections()) {
406     if (RVA >= S.Header.VirtualAddress &&
407         RVA < S.Header.VirtualAddress + S.Header.SizeOfRawData)
408       return S.Header.PointerToRawData + RVA - S.Header.VirtualAddress;
409   }
410   return createStringError(object_error::parse_failed,
411                            "debug directory payload not found");
412 }
413 
414 // Locate which sections contain the debug directories, iterate over all
415 // the debug_directory structs in there, and set the PointerToRawData field
416 // in all of them, according to their new physical location in the file.
417 Error COFFWriter::patchDebugDirectory() {
418   if (Obj.DataDirectories.size() <= DEBUG_DIRECTORY)
419     return Error::success();
420   const data_directory *Dir = &Obj.DataDirectories[DEBUG_DIRECTORY];
421   if (Dir->Size <= 0)
422     return Error::success();
423   for (const auto &S : Obj.getSections()) {
424     if (Dir->RelativeVirtualAddress >= S.Header.VirtualAddress &&
425         Dir->RelativeVirtualAddress <
426             S.Header.VirtualAddress + S.Header.SizeOfRawData) {
427       if (Dir->RelativeVirtualAddress + Dir->Size >
428           S.Header.VirtualAddress + S.Header.SizeOfRawData)
429         return createStringError(object_error::parse_failed,
430                                  "debug directory extends past end of section");
431 
432       size_t Offset = Dir->RelativeVirtualAddress - S.Header.VirtualAddress;
433       uint8_t *Ptr = reinterpret_cast<uint8_t *>(Buf->getBufferStart()) +
434                      S.Header.PointerToRawData + Offset;
435       uint8_t *End = Ptr + Dir->Size;
436       while (Ptr < End) {
437         debug_directory *Debug = reinterpret_cast<debug_directory *>(Ptr);
438         if (Debug->PointerToRawData) {
439           if (Expected<uint32_t> FilePosOrErr =
440                   virtualAddressToFileAddress(Debug->AddressOfRawData))
441             Debug->PointerToRawData = *FilePosOrErr;
442           else
443             return FilePosOrErr.takeError();
444         }
445         Ptr += sizeof(debug_directory);
446         Offset += sizeof(debug_directory);
447       }
448       // Debug directory found and patched, all done.
449       return Error::success();
450     }
451   }
452   return createStringError(object_error::parse_failed,
453                            "debug directory not found");
454 }
455 
456 Error COFFWriter::write() {
457   bool IsBigObj = Obj.getSections().size() > MaxNumberOfSections16;
458   if (IsBigObj && Obj.IsPE)
459     return createStringError(object_error::parse_failed,
460                              "too many sections for executable");
461   return write(IsBigObj);
462 }
463 
464 } // end namespace coff
465 } // end namespace objcopy
466 } // end namespace llvm
467