xref: /freebsd/contrib/llvm-project/clang/lib/CodeGen/Targets/PPC.cpp (revision 8311bc5f17dec348749f763b82dfe2737bc53cd7)
1 //===- PPC.cpp ------------------------------------------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 #include "ABIInfoImpl.h"
10 #include "TargetInfo.h"
11 
12 using namespace clang;
13 using namespace clang::CodeGen;
14 
15 static Address complexTempStructure(CodeGenFunction &CGF, Address VAListAddr,
16                                     QualType Ty, CharUnits SlotSize,
17                                     CharUnits EltSize, const ComplexType *CTy) {
18   Address Addr =
19       emitVoidPtrDirectVAArg(CGF, VAListAddr, CGF.Int8Ty, SlotSize * 2,
20                              SlotSize, SlotSize, /*AllowHigher*/ true);
21 
22   Address RealAddr = Addr;
23   Address ImagAddr = RealAddr;
24   if (CGF.CGM.getDataLayout().isBigEndian()) {
25     RealAddr =
26         CGF.Builder.CreateConstInBoundsByteGEP(RealAddr, SlotSize - EltSize);
27     ImagAddr = CGF.Builder.CreateConstInBoundsByteGEP(ImagAddr,
28                                                       2 * SlotSize - EltSize);
29   } else {
30     ImagAddr = CGF.Builder.CreateConstInBoundsByteGEP(RealAddr, SlotSize);
31   }
32 
33   llvm::Type *EltTy = CGF.ConvertTypeForMem(CTy->getElementType());
34   RealAddr = RealAddr.withElementType(EltTy);
35   ImagAddr = ImagAddr.withElementType(EltTy);
36   llvm::Value *Real = CGF.Builder.CreateLoad(RealAddr, ".vareal");
37   llvm::Value *Imag = CGF.Builder.CreateLoad(ImagAddr, ".vaimag");
38 
39   Address Temp = CGF.CreateMemTemp(Ty, "vacplx");
40   CGF.EmitStoreOfComplex({Real, Imag}, CGF.MakeAddrLValue(Temp, Ty),
41                          /*init*/ true);
42   return Temp;
43 }
44 
45 static bool PPC_initDwarfEHRegSizeTable(CodeGen::CodeGenFunction &CGF,
46                                         llvm::Value *Address, bool Is64Bit,
47                                         bool IsAIX) {
48   // This is calculated from the LLVM and GCC tables and verified
49   // against gcc output.  AFAIK all PPC ABIs use the same encoding.
50 
51   CodeGen::CGBuilderTy &Builder = CGF.Builder;
52 
53   llvm::IntegerType *i8 = CGF.Int8Ty;
54   llvm::Value *Four8 = llvm::ConstantInt::get(i8, 4);
55   llvm::Value *Eight8 = llvm::ConstantInt::get(i8, 8);
56   llvm::Value *Sixteen8 = llvm::ConstantInt::get(i8, 16);
57 
58   // 0-31: r0-31, the 4-byte or 8-byte general-purpose registers
59   AssignToArrayRange(Builder, Address, Is64Bit ? Eight8 : Four8, 0, 31);
60 
61   // 32-63: fp0-31, the 8-byte floating-point registers
62   AssignToArrayRange(Builder, Address, Eight8, 32, 63);
63 
64   // 64-67 are various 4-byte or 8-byte special-purpose registers:
65   // 64: mq
66   // 65: lr
67   // 66: ctr
68   // 67: ap
69   AssignToArrayRange(Builder, Address, Is64Bit ? Eight8 : Four8, 64, 67);
70 
71   // 68-76 are various 4-byte special-purpose registers:
72   // 68-75 cr0-7
73   // 76: xer
74   AssignToArrayRange(Builder, Address, Four8, 68, 76);
75 
76   // 77-108: v0-31, the 16-byte vector registers
77   AssignToArrayRange(Builder, Address, Sixteen8, 77, 108);
78 
79   // 109: vrsave
80   // 110: vscr
81   AssignToArrayRange(Builder, Address, Is64Bit ? Eight8 : Four8, 109, 110);
82 
83   // AIX does not utilize the rest of the registers.
84   if (IsAIX)
85     return false;
86 
87   // 111: spe_acc
88   // 112: spefscr
89   // 113: sfp
90   AssignToArrayRange(Builder, Address, Is64Bit ? Eight8 : Four8, 111, 113);
91 
92   if (!Is64Bit)
93     return false;
94 
95   // TODO: Need to verify if these registers are used on 64 bit AIX with Power8
96   // or above CPU.
97   // 64-bit only registers:
98   // 114: tfhar
99   // 115: tfiar
100   // 116: texasr
101   AssignToArrayRange(Builder, Address, Eight8, 114, 116);
102 
103   return false;
104 }
105 
106 // AIX
107 namespace {
108 /// AIXABIInfo - The AIX XCOFF ABI information.
109 class AIXABIInfo : public ABIInfo {
110   const bool Is64Bit;
111   const unsigned PtrByteSize;
112   CharUnits getParamTypeAlignment(QualType Ty) const;
113 
114 public:
115   AIXABIInfo(CodeGen::CodeGenTypes &CGT, bool Is64Bit)
116       : ABIInfo(CGT), Is64Bit(Is64Bit), PtrByteSize(Is64Bit ? 8 : 4) {}
117 
118   bool isPromotableTypeForABI(QualType Ty) const;
119 
120   ABIArgInfo classifyReturnType(QualType RetTy) const;
121   ABIArgInfo classifyArgumentType(QualType Ty) const;
122 
123   void computeInfo(CGFunctionInfo &FI) const override {
124     if (!getCXXABI().classifyReturnType(FI))
125       FI.getReturnInfo() = classifyReturnType(FI.getReturnType());
126 
127     for (auto &I : FI.arguments())
128       I.info = classifyArgumentType(I.type);
129   }
130 
131   Address EmitVAArg(CodeGenFunction &CGF, Address VAListAddr,
132                     QualType Ty) const override;
133 };
134 
135 class AIXTargetCodeGenInfo : public TargetCodeGenInfo {
136   const bool Is64Bit;
137 
138 public:
139   AIXTargetCodeGenInfo(CodeGen::CodeGenTypes &CGT, bool Is64Bit)
140       : TargetCodeGenInfo(std::make_unique<AIXABIInfo>(CGT, Is64Bit)),
141         Is64Bit(Is64Bit) {}
142   int getDwarfEHStackPointer(CodeGen::CodeGenModule &M) const override {
143     return 1; // r1 is the dedicated stack pointer
144   }
145 
146   bool initDwarfEHRegSizeTable(CodeGen::CodeGenFunction &CGF,
147                                llvm::Value *Address) const override;
148 };
149 } // namespace
150 
151 // Return true if the ABI requires Ty to be passed sign- or zero-
152 // extended to 32/64 bits.
153 bool AIXABIInfo::isPromotableTypeForABI(QualType Ty) const {
154   // Treat an enum type as its underlying type.
155   if (const EnumType *EnumTy = Ty->getAs<EnumType>())
156     Ty = EnumTy->getDecl()->getIntegerType();
157 
158   // Promotable integer types are required to be promoted by the ABI.
159   if (getContext().isPromotableIntegerType(Ty))
160     return true;
161 
162   if (!Is64Bit)
163     return false;
164 
165   // For 64 bit mode, in addition to the usual promotable integer types, we also
166   // need to extend all 32-bit types, since the ABI requires promotion to 64
167   // bits.
168   if (const BuiltinType *BT = Ty->getAs<BuiltinType>())
169     switch (BT->getKind()) {
170     case BuiltinType::Int:
171     case BuiltinType::UInt:
172       return true;
173     default:
174       break;
175     }
176 
177   return false;
178 }
179 
180 ABIArgInfo AIXABIInfo::classifyReturnType(QualType RetTy) const {
181   if (RetTy->isAnyComplexType())
182     return ABIArgInfo::getDirect();
183 
184   if (RetTy->isVectorType())
185     return ABIArgInfo::getDirect();
186 
187   if (RetTy->isVoidType())
188     return ABIArgInfo::getIgnore();
189 
190   if (isAggregateTypeForABI(RetTy))
191     return getNaturalAlignIndirect(RetTy);
192 
193   return (isPromotableTypeForABI(RetTy) ? ABIArgInfo::getExtend(RetTy)
194                                         : ABIArgInfo::getDirect());
195 }
196 
197 ABIArgInfo AIXABIInfo::classifyArgumentType(QualType Ty) const {
198   Ty = useFirstFieldIfTransparentUnion(Ty);
199 
200   if (Ty->isAnyComplexType())
201     return ABIArgInfo::getDirect();
202 
203   if (Ty->isVectorType())
204     return ABIArgInfo::getDirect();
205 
206   if (isAggregateTypeForABI(Ty)) {
207     // Records with non-trivial destructors/copy-constructors should not be
208     // passed by value.
209     if (CGCXXABI::RecordArgABI RAA = getRecordArgABI(Ty, getCXXABI()))
210       return getNaturalAlignIndirect(Ty, RAA == CGCXXABI::RAA_DirectInMemory);
211 
212     CharUnits CCAlign = getParamTypeAlignment(Ty);
213     CharUnits TyAlign = getContext().getTypeAlignInChars(Ty);
214 
215     return ABIArgInfo::getIndirect(CCAlign, /*ByVal*/ true,
216                                    /*Realign*/ TyAlign > CCAlign);
217   }
218 
219   return (isPromotableTypeForABI(Ty) ? ABIArgInfo::getExtend(Ty)
220                                      : ABIArgInfo::getDirect());
221 }
222 
223 CharUnits AIXABIInfo::getParamTypeAlignment(QualType Ty) const {
224   // Complex types are passed just like their elements.
225   if (const ComplexType *CTy = Ty->getAs<ComplexType>())
226     Ty = CTy->getElementType();
227 
228   if (Ty->isVectorType())
229     return CharUnits::fromQuantity(16);
230 
231   // If the structure contains a vector type, the alignment is 16.
232   if (isRecordWithSIMDVectorType(getContext(), Ty))
233     return CharUnits::fromQuantity(16);
234 
235   return CharUnits::fromQuantity(PtrByteSize);
236 }
237 
238 Address AIXABIInfo::EmitVAArg(CodeGenFunction &CGF, Address VAListAddr,
239                               QualType Ty) const {
240 
241   auto TypeInfo = getContext().getTypeInfoInChars(Ty);
242   TypeInfo.Align = getParamTypeAlignment(Ty);
243 
244   CharUnits SlotSize = CharUnits::fromQuantity(PtrByteSize);
245 
246   // If we have a complex type and the base type is smaller than the register
247   // size, the ABI calls for the real and imaginary parts to be right-adjusted
248   // in separate words in 32bit mode or doublewords in 64bit mode. However,
249   // Clang expects us to produce a pointer to a structure with the two parts
250   // packed tightly. So generate loads of the real and imaginary parts relative
251   // to the va_list pointer, and store them to a temporary structure. We do the
252   // same as the PPC64ABI here.
253   if (const ComplexType *CTy = Ty->getAs<ComplexType>()) {
254     CharUnits EltSize = TypeInfo.Width / 2;
255     if (EltSize < SlotSize)
256       return complexTempStructure(CGF, VAListAddr, Ty, SlotSize, EltSize, CTy);
257   }
258 
259   return emitVoidPtrVAArg(CGF, VAListAddr, Ty, /*Indirect*/ false, TypeInfo,
260                           SlotSize, /*AllowHigher*/ true);
261 }
262 
263 bool AIXTargetCodeGenInfo::initDwarfEHRegSizeTable(
264     CodeGen::CodeGenFunction &CGF, llvm::Value *Address) const {
265   return PPC_initDwarfEHRegSizeTable(CGF, Address, Is64Bit, /*IsAIX*/ true);
266 }
267 
268 // PowerPC-32
269 namespace {
270 /// PPC32_SVR4_ABIInfo - The 32-bit PowerPC ELF (SVR4) ABI information.
271 class PPC32_SVR4_ABIInfo : public DefaultABIInfo {
272   bool IsSoftFloatABI;
273   bool IsRetSmallStructInRegABI;
274 
275   CharUnits getParamTypeAlignment(QualType Ty) const;
276 
277 public:
278   PPC32_SVR4_ABIInfo(CodeGen::CodeGenTypes &CGT, bool SoftFloatABI,
279                      bool RetSmallStructInRegABI)
280       : DefaultABIInfo(CGT), IsSoftFloatABI(SoftFloatABI),
281         IsRetSmallStructInRegABI(RetSmallStructInRegABI) {}
282 
283   ABIArgInfo classifyReturnType(QualType RetTy) const;
284 
285   void computeInfo(CGFunctionInfo &FI) const override {
286     if (!getCXXABI().classifyReturnType(FI))
287       FI.getReturnInfo() = classifyReturnType(FI.getReturnType());
288     for (auto &I : FI.arguments())
289       I.info = classifyArgumentType(I.type);
290   }
291 
292   Address EmitVAArg(CodeGenFunction &CGF, Address VAListAddr,
293                     QualType Ty) const override;
294 };
295 
296 class PPC32TargetCodeGenInfo : public TargetCodeGenInfo {
297 public:
298   PPC32TargetCodeGenInfo(CodeGenTypes &CGT, bool SoftFloatABI,
299                          bool RetSmallStructInRegABI)
300       : TargetCodeGenInfo(std::make_unique<PPC32_SVR4_ABIInfo>(
301             CGT, SoftFloatABI, RetSmallStructInRegABI)) {}
302 
303   static bool isStructReturnInRegABI(const llvm::Triple &Triple,
304                                      const CodeGenOptions &Opts);
305 
306   int getDwarfEHStackPointer(CodeGen::CodeGenModule &M) const override {
307     // This is recovered from gcc output.
308     return 1; // r1 is the dedicated stack pointer
309   }
310 
311   bool initDwarfEHRegSizeTable(CodeGen::CodeGenFunction &CGF,
312                                llvm::Value *Address) const override;
313 };
314 }
315 
316 CharUnits PPC32_SVR4_ABIInfo::getParamTypeAlignment(QualType Ty) const {
317   // Complex types are passed just like their elements.
318   if (const ComplexType *CTy = Ty->getAs<ComplexType>())
319     Ty = CTy->getElementType();
320 
321   if (Ty->isVectorType())
322     return CharUnits::fromQuantity(getContext().getTypeSize(Ty) == 128 ? 16
323                                                                        : 4);
324 
325   // For single-element float/vector structs, we consider the whole type
326   // to have the same alignment requirements as its single element.
327   const Type *AlignTy = nullptr;
328   if (const Type *EltType = isSingleElementStruct(Ty, getContext())) {
329     const BuiltinType *BT = EltType->getAs<BuiltinType>();
330     if ((EltType->isVectorType() && getContext().getTypeSize(EltType) == 128) ||
331         (BT && BT->isFloatingPoint()))
332       AlignTy = EltType;
333   }
334 
335   if (AlignTy)
336     return CharUnits::fromQuantity(AlignTy->isVectorType() ? 16 : 4);
337   return CharUnits::fromQuantity(4);
338 }
339 
340 ABIArgInfo PPC32_SVR4_ABIInfo::classifyReturnType(QualType RetTy) const {
341   uint64_t Size;
342 
343   // -msvr4-struct-return puts small aggregates in GPR3 and GPR4.
344   if (isAggregateTypeForABI(RetTy) && IsRetSmallStructInRegABI &&
345       (Size = getContext().getTypeSize(RetTy)) <= 64) {
346     // System V ABI (1995), page 3-22, specified:
347     // > A structure or union whose size is less than or equal to 8 bytes
348     // > shall be returned in r3 and r4, as if it were first stored in the
349     // > 8-byte aligned memory area and then the low addressed word were
350     // > loaded into r3 and the high-addressed word into r4.  Bits beyond
351     // > the last member of the structure or union are not defined.
352     //
353     // GCC for big-endian PPC32 inserts the pad before the first member,
354     // not "beyond the last member" of the struct.  To stay compatible
355     // with GCC, we coerce the struct to an integer of the same size.
356     // LLVM will extend it and return i32 in r3, or i64 in r3:r4.
357     if (Size == 0)
358       return ABIArgInfo::getIgnore();
359     else {
360       llvm::Type *CoerceTy = llvm::Type::getIntNTy(getVMContext(), Size);
361       return ABIArgInfo::getDirect(CoerceTy);
362     }
363   }
364 
365   return DefaultABIInfo::classifyReturnType(RetTy);
366 }
367 
368 // TODO: this implementation is now likely redundant with
369 // DefaultABIInfo::EmitVAArg.
370 Address PPC32_SVR4_ABIInfo::EmitVAArg(CodeGenFunction &CGF, Address VAList,
371                                       QualType Ty) const {
372   if (getTarget().getTriple().isOSDarwin()) {
373     auto TI = getContext().getTypeInfoInChars(Ty);
374     TI.Align = getParamTypeAlignment(Ty);
375 
376     CharUnits SlotSize = CharUnits::fromQuantity(4);
377     return emitVoidPtrVAArg(CGF, VAList, Ty,
378                             classifyArgumentType(Ty).isIndirect(), TI, SlotSize,
379                             /*AllowHigherAlign=*/true);
380   }
381 
382   const unsigned OverflowLimit = 8;
383   if (const ComplexType *CTy = Ty->getAs<ComplexType>()) {
384     // TODO: Implement this. For now ignore.
385     (void)CTy;
386     return Address::invalid(); // FIXME?
387   }
388 
389   // struct __va_list_tag {
390   //   unsigned char gpr;
391   //   unsigned char fpr;
392   //   unsigned short reserved;
393   //   void *overflow_arg_area;
394   //   void *reg_save_area;
395   // };
396 
397   bool isI64 = Ty->isIntegerType() && getContext().getTypeSize(Ty) == 64;
398   bool isInt = !Ty->isFloatingType();
399   bool isF64 = Ty->isFloatingType() && getContext().getTypeSize(Ty) == 64;
400 
401   // All aggregates are passed indirectly?  That doesn't seem consistent
402   // with the argument-lowering code.
403   bool isIndirect = isAggregateTypeForABI(Ty);
404 
405   CGBuilderTy &Builder = CGF.Builder;
406 
407   // The calling convention either uses 1-2 GPRs or 1 FPR.
408   Address NumRegsAddr = Address::invalid();
409   if (isInt || IsSoftFloatABI) {
410     NumRegsAddr = Builder.CreateStructGEP(VAList, 0, "gpr");
411   } else {
412     NumRegsAddr = Builder.CreateStructGEP(VAList, 1, "fpr");
413   }
414 
415   llvm::Value *NumRegs = Builder.CreateLoad(NumRegsAddr, "numUsedRegs");
416 
417   // "Align" the register count when TY is i64.
418   if (isI64 || (isF64 && IsSoftFloatABI)) {
419     NumRegs = Builder.CreateAdd(NumRegs, Builder.getInt8(1));
420     NumRegs = Builder.CreateAnd(NumRegs, Builder.getInt8((uint8_t) ~1U));
421   }
422 
423   llvm::Value *CC =
424       Builder.CreateICmpULT(NumRegs, Builder.getInt8(OverflowLimit), "cond");
425 
426   llvm::BasicBlock *UsingRegs = CGF.createBasicBlock("using_regs");
427   llvm::BasicBlock *UsingOverflow = CGF.createBasicBlock("using_overflow");
428   llvm::BasicBlock *Cont = CGF.createBasicBlock("cont");
429 
430   Builder.CreateCondBr(CC, UsingRegs, UsingOverflow);
431 
432   llvm::Type *DirectTy = CGF.ConvertType(Ty), *ElementTy = DirectTy;
433   if (isIndirect)
434     DirectTy = llvm::PointerType::getUnqual(CGF.getLLVMContext());
435 
436   // Case 1: consume registers.
437   Address RegAddr = Address::invalid();
438   {
439     CGF.EmitBlock(UsingRegs);
440 
441     Address RegSaveAreaPtr = Builder.CreateStructGEP(VAList, 4);
442     RegAddr = Address(Builder.CreateLoad(RegSaveAreaPtr), CGF.Int8Ty,
443                       CharUnits::fromQuantity(8));
444     assert(RegAddr.getElementType() == CGF.Int8Ty);
445 
446     // Floating-point registers start after the general-purpose registers.
447     if (!(isInt || IsSoftFloatABI)) {
448       RegAddr = Builder.CreateConstInBoundsByteGEP(RegAddr,
449                                                    CharUnits::fromQuantity(32));
450     }
451 
452     // Get the address of the saved value by scaling the number of
453     // registers we've used by the number of
454     CharUnits RegSize = CharUnits::fromQuantity((isInt || IsSoftFloatABI) ? 4 : 8);
455     llvm::Value *RegOffset =
456         Builder.CreateMul(NumRegs, Builder.getInt8(RegSize.getQuantity()));
457     RegAddr = Address(
458         Builder.CreateInBoundsGEP(CGF.Int8Ty, RegAddr.getPointer(), RegOffset),
459         DirectTy, RegAddr.getAlignment().alignmentOfArrayElement(RegSize));
460 
461     // Increase the used-register count.
462     NumRegs =
463       Builder.CreateAdd(NumRegs,
464                         Builder.getInt8((isI64 || (isF64 && IsSoftFloatABI)) ? 2 : 1));
465     Builder.CreateStore(NumRegs, NumRegsAddr);
466 
467     CGF.EmitBranch(Cont);
468   }
469 
470   // Case 2: consume space in the overflow area.
471   Address MemAddr = Address::invalid();
472   {
473     CGF.EmitBlock(UsingOverflow);
474 
475     Builder.CreateStore(Builder.getInt8(OverflowLimit), NumRegsAddr);
476 
477     // Everything in the overflow area is rounded up to a size of at least 4.
478     CharUnits OverflowAreaAlign = CharUnits::fromQuantity(4);
479 
480     CharUnits Size;
481     if (!isIndirect) {
482       auto TypeInfo = CGF.getContext().getTypeInfoInChars(Ty);
483       Size = TypeInfo.Width.alignTo(OverflowAreaAlign);
484     } else {
485       Size = CGF.getPointerSize();
486     }
487 
488     Address OverflowAreaAddr = Builder.CreateStructGEP(VAList, 3);
489     Address OverflowArea =
490         Address(Builder.CreateLoad(OverflowAreaAddr, "argp.cur"), CGF.Int8Ty,
491                 OverflowAreaAlign);
492     // Round up address of argument to alignment
493     CharUnits Align = CGF.getContext().getTypeAlignInChars(Ty);
494     if (Align > OverflowAreaAlign) {
495       llvm::Value *Ptr = OverflowArea.getPointer();
496       OverflowArea = Address(emitRoundPointerUpToAlignment(CGF, Ptr, Align),
497                              OverflowArea.getElementType(), Align);
498     }
499 
500     MemAddr = OverflowArea.withElementType(DirectTy);
501 
502     // Increase the overflow area.
503     OverflowArea = Builder.CreateConstInBoundsByteGEP(OverflowArea, Size);
504     Builder.CreateStore(OverflowArea.getPointer(), OverflowAreaAddr);
505     CGF.EmitBranch(Cont);
506   }
507 
508   CGF.EmitBlock(Cont);
509 
510   // Merge the cases with a phi.
511   Address Result = emitMergePHI(CGF, RegAddr, UsingRegs, MemAddr, UsingOverflow,
512                                 "vaarg.addr");
513 
514   // Load the pointer if the argument was passed indirectly.
515   if (isIndirect) {
516     Result = Address(Builder.CreateLoad(Result, "aggr"), ElementTy,
517                      getContext().getTypeAlignInChars(Ty));
518   }
519 
520   return Result;
521 }
522 
523 bool PPC32TargetCodeGenInfo::isStructReturnInRegABI(
524     const llvm::Triple &Triple, const CodeGenOptions &Opts) {
525   assert(Triple.isPPC32());
526 
527   switch (Opts.getStructReturnConvention()) {
528   case CodeGenOptions::SRCK_Default:
529     break;
530   case CodeGenOptions::SRCK_OnStack: // -maix-struct-return
531     return false;
532   case CodeGenOptions::SRCK_InRegs: // -msvr4-struct-return
533     return true;
534   }
535 
536   if (Triple.isOSBinFormatELF() && !Triple.isOSLinux())
537     return true;
538 
539   return false;
540 }
541 
542 bool
543 PPC32TargetCodeGenInfo::initDwarfEHRegSizeTable(CodeGen::CodeGenFunction &CGF,
544                                                 llvm::Value *Address) const {
545   return PPC_initDwarfEHRegSizeTable(CGF, Address, /*Is64Bit*/ false,
546                                      /*IsAIX*/ false);
547 }
548 
549 // PowerPC-64
550 
551 namespace {
552 
553 /// PPC64_SVR4_ABIInfo - The 64-bit PowerPC ELF (SVR4) ABI information.
554 class PPC64_SVR4_ABIInfo : public ABIInfo {
555   static const unsigned GPRBits = 64;
556   PPC64_SVR4_ABIKind Kind;
557   bool IsSoftFloatABI;
558 
559 public:
560   PPC64_SVR4_ABIInfo(CodeGen::CodeGenTypes &CGT, PPC64_SVR4_ABIKind Kind,
561                      bool SoftFloatABI)
562       : ABIInfo(CGT), Kind(Kind), IsSoftFloatABI(SoftFloatABI) {}
563 
564   bool isPromotableTypeForABI(QualType Ty) const;
565   CharUnits getParamTypeAlignment(QualType Ty) const;
566 
567   ABIArgInfo classifyReturnType(QualType RetTy) const;
568   ABIArgInfo classifyArgumentType(QualType Ty) const;
569 
570   bool isHomogeneousAggregateBaseType(QualType Ty) const override;
571   bool isHomogeneousAggregateSmallEnough(const Type *Ty,
572                                          uint64_t Members) const override;
573 
574   // TODO: We can add more logic to computeInfo to improve performance.
575   // Example: For aggregate arguments that fit in a register, we could
576   // use getDirectInReg (as is done below for structs containing a single
577   // floating-point value) to avoid pushing them to memory on function
578   // entry.  This would require changing the logic in PPCISelLowering
579   // when lowering the parameters in the caller and args in the callee.
580   void computeInfo(CGFunctionInfo &FI) const override {
581     if (!getCXXABI().classifyReturnType(FI))
582       FI.getReturnInfo() = classifyReturnType(FI.getReturnType());
583     for (auto &I : FI.arguments()) {
584       // We rely on the default argument classification for the most part.
585       // One exception:  An aggregate containing a single floating-point
586       // or vector item must be passed in a register if one is available.
587       const Type *T = isSingleElementStruct(I.type, getContext());
588       if (T) {
589         const BuiltinType *BT = T->getAs<BuiltinType>();
590         if ((T->isVectorType() && getContext().getTypeSize(T) == 128) ||
591             (BT && BT->isFloatingPoint())) {
592           QualType QT(T, 0);
593           I.info = ABIArgInfo::getDirectInReg(CGT.ConvertType(QT));
594           continue;
595         }
596       }
597       I.info = classifyArgumentType(I.type);
598     }
599   }
600 
601   Address EmitVAArg(CodeGenFunction &CGF, Address VAListAddr,
602                     QualType Ty) const override;
603 };
604 
605 class PPC64_SVR4_TargetCodeGenInfo : public TargetCodeGenInfo {
606 
607 public:
608   PPC64_SVR4_TargetCodeGenInfo(CodeGenTypes &CGT, PPC64_SVR4_ABIKind Kind,
609                                bool SoftFloatABI)
610       : TargetCodeGenInfo(
611             std::make_unique<PPC64_SVR4_ABIInfo>(CGT, Kind, SoftFloatABI)) {
612     SwiftInfo =
613         std::make_unique<SwiftABIInfo>(CGT, /*SwiftErrorInRegister=*/false);
614   }
615 
616   int getDwarfEHStackPointer(CodeGen::CodeGenModule &M) const override {
617     // This is recovered from gcc output.
618     return 1; // r1 is the dedicated stack pointer
619   }
620 
621   bool initDwarfEHRegSizeTable(CodeGen::CodeGenFunction &CGF,
622                                llvm::Value *Address) const override;
623 };
624 
625 class PPC64TargetCodeGenInfo : public TargetCodeGenInfo {
626 public:
627   PPC64TargetCodeGenInfo(CodeGenTypes &CGT)
628       : TargetCodeGenInfo(std::make_unique<DefaultABIInfo>(CGT)) {}
629 
630   int getDwarfEHStackPointer(CodeGen::CodeGenModule &M) const override {
631     // This is recovered from gcc output.
632     return 1; // r1 is the dedicated stack pointer
633   }
634 
635   bool initDwarfEHRegSizeTable(CodeGen::CodeGenFunction &CGF,
636                                llvm::Value *Address) const override;
637 };
638 }
639 
640 // Return true if the ABI requires Ty to be passed sign- or zero-
641 // extended to 64 bits.
642 bool
643 PPC64_SVR4_ABIInfo::isPromotableTypeForABI(QualType Ty) const {
644   // Treat an enum type as its underlying type.
645   if (const EnumType *EnumTy = Ty->getAs<EnumType>())
646     Ty = EnumTy->getDecl()->getIntegerType();
647 
648   // Promotable integer types are required to be promoted by the ABI.
649   if (isPromotableIntegerTypeForABI(Ty))
650     return true;
651 
652   // In addition to the usual promotable integer types, we also need to
653   // extend all 32-bit types, since the ABI requires promotion to 64 bits.
654   if (const BuiltinType *BT = Ty->getAs<BuiltinType>())
655     switch (BT->getKind()) {
656     case BuiltinType::Int:
657     case BuiltinType::UInt:
658       return true;
659     default:
660       break;
661     }
662 
663   if (const auto *EIT = Ty->getAs<BitIntType>())
664     if (EIT->getNumBits() < 64)
665       return true;
666 
667   return false;
668 }
669 
670 /// isAlignedParamType - Determine whether a type requires 16-byte or
671 /// higher alignment in the parameter area.  Always returns at least 8.
672 CharUnits PPC64_SVR4_ABIInfo::getParamTypeAlignment(QualType Ty) const {
673   // Complex types are passed just like their elements.
674   if (const ComplexType *CTy = Ty->getAs<ComplexType>())
675     Ty = CTy->getElementType();
676 
677   auto FloatUsesVector = [this](QualType Ty){
678     return Ty->isRealFloatingType() && &getContext().getFloatTypeSemantics(
679                                            Ty) == &llvm::APFloat::IEEEquad();
680   };
681 
682   // Only vector types of size 16 bytes need alignment (larger types are
683   // passed via reference, smaller types are not aligned).
684   if (Ty->isVectorType()) {
685     return CharUnits::fromQuantity(getContext().getTypeSize(Ty) == 128 ? 16 : 8);
686   } else if (FloatUsesVector(Ty)) {
687     // According to ABI document section 'Optional Save Areas': If extended
688     // precision floating-point values in IEEE BINARY 128 QUADRUPLE PRECISION
689     // format are supported, map them to a single quadword, quadword aligned.
690     return CharUnits::fromQuantity(16);
691   }
692 
693   // For single-element float/vector structs, we consider the whole type
694   // to have the same alignment requirements as its single element.
695   const Type *AlignAsType = nullptr;
696   const Type *EltType = isSingleElementStruct(Ty, getContext());
697   if (EltType) {
698     const BuiltinType *BT = EltType->getAs<BuiltinType>();
699     if ((EltType->isVectorType() && getContext().getTypeSize(EltType) == 128) ||
700         (BT && BT->isFloatingPoint()))
701       AlignAsType = EltType;
702   }
703 
704   // Likewise for ELFv2 homogeneous aggregates.
705   const Type *Base = nullptr;
706   uint64_t Members = 0;
707   if (!AlignAsType && Kind == PPC64_SVR4_ABIKind::ELFv2 &&
708       isAggregateTypeForABI(Ty) && isHomogeneousAggregate(Ty, Base, Members))
709     AlignAsType = Base;
710 
711   // With special case aggregates, only vector base types need alignment.
712   if (AlignAsType) {
713     bool UsesVector = AlignAsType->isVectorType() ||
714                       FloatUsesVector(QualType(AlignAsType, 0));
715     return CharUnits::fromQuantity(UsesVector ? 16 : 8);
716   }
717 
718   // Otherwise, we only need alignment for any aggregate type that
719   // has an alignment requirement of >= 16 bytes.
720   if (isAggregateTypeForABI(Ty) && getContext().getTypeAlign(Ty) >= 128) {
721     return CharUnits::fromQuantity(16);
722   }
723 
724   return CharUnits::fromQuantity(8);
725 }
726 
727 bool PPC64_SVR4_ABIInfo::isHomogeneousAggregateBaseType(QualType Ty) const {
728   // Homogeneous aggregates for ELFv2 must have base types of float,
729   // double, long double, or 128-bit vectors.
730   if (const BuiltinType *BT = Ty->getAs<BuiltinType>()) {
731     if (BT->getKind() == BuiltinType::Float ||
732         BT->getKind() == BuiltinType::Double ||
733         BT->getKind() == BuiltinType::LongDouble ||
734         BT->getKind() == BuiltinType::Ibm128 ||
735         (getContext().getTargetInfo().hasFloat128Type() &&
736          (BT->getKind() == BuiltinType::Float128))) {
737       if (IsSoftFloatABI)
738         return false;
739       return true;
740     }
741   }
742   if (const VectorType *VT = Ty->getAs<VectorType>()) {
743     if (getContext().getTypeSize(VT) == 128)
744       return true;
745   }
746   return false;
747 }
748 
749 bool PPC64_SVR4_ABIInfo::isHomogeneousAggregateSmallEnough(
750     const Type *Base, uint64_t Members) const {
751   // Vector and fp128 types require one register, other floating point types
752   // require one or two registers depending on their size.
753   uint32_t NumRegs =
754       ((getContext().getTargetInfo().hasFloat128Type() &&
755           Base->isFloat128Type()) ||
756         Base->isVectorType()) ? 1
757                               : (getContext().getTypeSize(Base) + 63) / 64;
758 
759   // Homogeneous Aggregates may occupy at most 8 registers.
760   return Members * NumRegs <= 8;
761 }
762 
763 ABIArgInfo
764 PPC64_SVR4_ABIInfo::classifyArgumentType(QualType Ty) const {
765   Ty = useFirstFieldIfTransparentUnion(Ty);
766 
767   if (Ty->isAnyComplexType())
768     return ABIArgInfo::getDirect();
769 
770   // Non-Altivec vector types are passed in GPRs (smaller than 16 bytes)
771   // or via reference (larger than 16 bytes).
772   if (Ty->isVectorType()) {
773     uint64_t Size = getContext().getTypeSize(Ty);
774     if (Size > 128)
775       return getNaturalAlignIndirect(Ty, /*ByVal=*/false);
776     else if (Size < 128) {
777       llvm::Type *CoerceTy = llvm::IntegerType::get(getVMContext(), Size);
778       return ABIArgInfo::getDirect(CoerceTy);
779     }
780   }
781 
782   if (const auto *EIT = Ty->getAs<BitIntType>())
783     if (EIT->getNumBits() > 128)
784       return getNaturalAlignIndirect(Ty, /*ByVal=*/true);
785 
786   if (isAggregateTypeForABI(Ty)) {
787     if (CGCXXABI::RecordArgABI RAA = getRecordArgABI(Ty, getCXXABI()))
788       return getNaturalAlignIndirect(Ty, RAA == CGCXXABI::RAA_DirectInMemory);
789 
790     uint64_t ABIAlign = getParamTypeAlignment(Ty).getQuantity();
791     uint64_t TyAlign = getContext().getTypeAlignInChars(Ty).getQuantity();
792 
793     // ELFv2 homogeneous aggregates are passed as array types.
794     const Type *Base = nullptr;
795     uint64_t Members = 0;
796     if (Kind == PPC64_SVR4_ABIKind::ELFv2 &&
797         isHomogeneousAggregate(Ty, Base, Members)) {
798       llvm::Type *BaseTy = CGT.ConvertType(QualType(Base, 0));
799       llvm::Type *CoerceTy = llvm::ArrayType::get(BaseTy, Members);
800       return ABIArgInfo::getDirect(CoerceTy);
801     }
802 
803     // If an aggregate may end up fully in registers, we do not
804     // use the ByVal method, but pass the aggregate as array.
805     // This is usually beneficial since we avoid forcing the
806     // back-end to store the argument to memory.
807     uint64_t Bits = getContext().getTypeSize(Ty);
808     if (Bits > 0 && Bits <= 8 * GPRBits) {
809       llvm::Type *CoerceTy;
810 
811       // Types up to 8 bytes are passed as integer type (which will be
812       // properly aligned in the argument save area doubleword).
813       if (Bits <= GPRBits)
814         CoerceTy =
815             llvm::IntegerType::get(getVMContext(), llvm::alignTo(Bits, 8));
816       // Larger types are passed as arrays, with the base type selected
817       // according to the required alignment in the save area.
818       else {
819         uint64_t RegBits = ABIAlign * 8;
820         uint64_t NumRegs = llvm::alignTo(Bits, RegBits) / RegBits;
821         llvm::Type *RegTy = llvm::IntegerType::get(getVMContext(), RegBits);
822         CoerceTy = llvm::ArrayType::get(RegTy, NumRegs);
823       }
824 
825       return ABIArgInfo::getDirect(CoerceTy);
826     }
827 
828     // All other aggregates are passed ByVal.
829     return ABIArgInfo::getIndirect(CharUnits::fromQuantity(ABIAlign),
830                                    /*ByVal=*/true,
831                                    /*Realign=*/TyAlign > ABIAlign);
832   }
833 
834   return (isPromotableTypeForABI(Ty) ? ABIArgInfo::getExtend(Ty)
835                                      : ABIArgInfo::getDirect());
836 }
837 
838 ABIArgInfo
839 PPC64_SVR4_ABIInfo::classifyReturnType(QualType RetTy) const {
840   if (RetTy->isVoidType())
841     return ABIArgInfo::getIgnore();
842 
843   if (RetTy->isAnyComplexType())
844     return ABIArgInfo::getDirect();
845 
846   // Non-Altivec vector types are returned in GPRs (smaller than 16 bytes)
847   // or via reference (larger than 16 bytes).
848   if (RetTy->isVectorType()) {
849     uint64_t Size = getContext().getTypeSize(RetTy);
850     if (Size > 128)
851       return getNaturalAlignIndirect(RetTy);
852     else if (Size < 128) {
853       llvm::Type *CoerceTy = llvm::IntegerType::get(getVMContext(), Size);
854       return ABIArgInfo::getDirect(CoerceTy);
855     }
856   }
857 
858   if (const auto *EIT = RetTy->getAs<BitIntType>())
859     if (EIT->getNumBits() > 128)
860       return getNaturalAlignIndirect(RetTy, /*ByVal=*/false);
861 
862   if (isAggregateTypeForABI(RetTy)) {
863     // ELFv2 homogeneous aggregates are returned as array types.
864     const Type *Base = nullptr;
865     uint64_t Members = 0;
866     if (Kind == PPC64_SVR4_ABIKind::ELFv2 &&
867         isHomogeneousAggregate(RetTy, Base, Members)) {
868       llvm::Type *BaseTy = CGT.ConvertType(QualType(Base, 0));
869       llvm::Type *CoerceTy = llvm::ArrayType::get(BaseTy, Members);
870       return ABIArgInfo::getDirect(CoerceTy);
871     }
872 
873     // ELFv2 small aggregates are returned in up to two registers.
874     uint64_t Bits = getContext().getTypeSize(RetTy);
875     if (Kind == PPC64_SVR4_ABIKind::ELFv2 && Bits <= 2 * GPRBits) {
876       if (Bits == 0)
877         return ABIArgInfo::getIgnore();
878 
879       llvm::Type *CoerceTy;
880       if (Bits > GPRBits) {
881         CoerceTy = llvm::IntegerType::get(getVMContext(), GPRBits);
882         CoerceTy = llvm::StructType::get(CoerceTy, CoerceTy);
883       } else
884         CoerceTy =
885             llvm::IntegerType::get(getVMContext(), llvm::alignTo(Bits, 8));
886       return ABIArgInfo::getDirect(CoerceTy);
887     }
888 
889     // All other aggregates are returned indirectly.
890     return getNaturalAlignIndirect(RetTy);
891   }
892 
893   return (isPromotableTypeForABI(RetTy) ? ABIArgInfo::getExtend(RetTy)
894                                         : ABIArgInfo::getDirect());
895 }
896 
897 // Based on ARMABIInfo::EmitVAArg, adjusted for 64-bit machine.
898 Address PPC64_SVR4_ABIInfo::EmitVAArg(CodeGenFunction &CGF, Address VAListAddr,
899                                       QualType Ty) const {
900   auto TypeInfo = getContext().getTypeInfoInChars(Ty);
901   TypeInfo.Align = getParamTypeAlignment(Ty);
902 
903   CharUnits SlotSize = CharUnits::fromQuantity(8);
904 
905   // If we have a complex type and the base type is smaller than 8 bytes,
906   // the ABI calls for the real and imaginary parts to be right-adjusted
907   // in separate doublewords.  However, Clang expects us to produce a
908   // pointer to a structure with the two parts packed tightly.  So generate
909   // loads of the real and imaginary parts relative to the va_list pointer,
910   // and store them to a temporary structure.
911   if (const ComplexType *CTy = Ty->getAs<ComplexType>()) {
912     CharUnits EltSize = TypeInfo.Width / 2;
913     if (EltSize < SlotSize)
914       return complexTempStructure(CGF, VAListAddr, Ty, SlotSize, EltSize, CTy);
915   }
916 
917   // Otherwise, just use the general rule.
918   //
919   // The PPC64 ABI passes some arguments in integer registers, even to variadic
920   // functions. To allow va_list to use the simple "void*" representation,
921   // variadic calls allocate space in the argument area for the integer argument
922   // registers, and variadic functions spill their integer argument registers to
923   // this area in their prologues. When aggregates smaller than a register are
924   // passed this way, they are passed in the least significant bits of the
925   // register, which means that after spilling on big-endian targets they will
926   // be right-aligned in their argument slot. This is uncommon; for a variety of
927   // reasons, other big-endian targets don't end up right-aligning aggregate
928   // types this way, and so right-alignment only applies to fundamental types.
929   // So on PPC64, we must force the use of right-alignment even for aggregates.
930   return emitVoidPtrVAArg(CGF, VAListAddr, Ty, /*Indirect*/ false, TypeInfo,
931                           SlotSize, /*AllowHigher*/ true,
932                           /*ForceRightAdjust*/ true);
933 }
934 
935 bool
936 PPC64_SVR4_TargetCodeGenInfo::initDwarfEHRegSizeTable(
937   CodeGen::CodeGenFunction &CGF,
938   llvm::Value *Address) const {
939   return PPC_initDwarfEHRegSizeTable(CGF, Address, /*Is64Bit*/ true,
940                                      /*IsAIX*/ false);
941 }
942 
943 bool
944 PPC64TargetCodeGenInfo::initDwarfEHRegSizeTable(CodeGen::CodeGenFunction &CGF,
945                                                 llvm::Value *Address) const {
946   return PPC_initDwarfEHRegSizeTable(CGF, Address, /*Is64Bit*/ true,
947                                      /*IsAIX*/ false);
948 }
949 
950 std::unique_ptr<TargetCodeGenInfo>
951 CodeGen::createAIXTargetCodeGenInfo(CodeGenModule &CGM, bool Is64Bit) {
952   return std::make_unique<AIXTargetCodeGenInfo>(CGM.getTypes(), Is64Bit);
953 }
954 
955 std::unique_ptr<TargetCodeGenInfo>
956 CodeGen::createPPC32TargetCodeGenInfo(CodeGenModule &CGM, bool SoftFloatABI) {
957   bool RetSmallStructInRegABI = PPC32TargetCodeGenInfo::isStructReturnInRegABI(
958       CGM.getTriple(), CGM.getCodeGenOpts());
959   return std::make_unique<PPC32TargetCodeGenInfo>(CGM.getTypes(), SoftFloatABI,
960                                                   RetSmallStructInRegABI);
961 }
962 
963 std::unique_ptr<TargetCodeGenInfo>
964 CodeGen::createPPC64TargetCodeGenInfo(CodeGenModule &CGM) {
965   return std::make_unique<PPC64TargetCodeGenInfo>(CGM.getTypes());
966 }
967 
968 std::unique_ptr<TargetCodeGenInfo> CodeGen::createPPC64_SVR4_TargetCodeGenInfo(
969     CodeGenModule &CGM, PPC64_SVR4_ABIKind Kind, bool SoftFloatABI) {
970   return std::make_unique<PPC64_SVR4_TargetCodeGenInfo>(CGM.getTypes(), Kind,
971                                                         SoftFloatABI);
972 }
973