1 //===- PPCInstructionSelector.cpp --------------------------------*- C++ -*-==// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 /// \file 9 /// This file implements the targeting of the InstructionSelector class for 10 /// PowerPC. 11 //===----------------------------------------------------------------------===// 12 13 #include "PPC.h" 14 #include "PPCInstrInfo.h" 15 #include "PPCMachineFunctionInfo.h" 16 #include "PPCRegisterBankInfo.h" 17 #include "PPCSubtarget.h" 18 #include "PPCTargetMachine.h" 19 #include "llvm/CodeGen/GlobalISel/GIMatchTableExecutorImpl.h" 20 #include "llvm/CodeGen/GlobalISel/GenericMachineInstrs.h" 21 #include "llvm/CodeGen/GlobalISel/InstructionSelector.h" 22 #include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h" 23 #include "llvm/CodeGen/MachineConstantPool.h" 24 #include "llvm/CodeGen/MachineFunction.h" 25 #include "llvm/IR/IntrinsicsPowerPC.h" 26 #include "llvm/Support/Debug.h" 27 28 #define DEBUG_TYPE "ppc-gisel" 29 30 using namespace llvm; 31 32 namespace { 33 34 #define GET_GLOBALISEL_PREDICATE_BITSET 35 #include "PPCGenGlobalISel.inc" 36 #undef GET_GLOBALISEL_PREDICATE_BITSET 37 38 class PPCInstructionSelector : public InstructionSelector { 39 public: 40 PPCInstructionSelector(const PPCTargetMachine &TM, const PPCSubtarget &STI, 41 const PPCRegisterBankInfo &RBI); 42 43 bool select(MachineInstr &I) override; 44 static const char *getName() { return DEBUG_TYPE; } 45 46 private: 47 /// tblgen generated 'select' implementation that is used as the initial 48 /// selector for the patterns that do not require complex C++. 49 bool selectImpl(MachineInstr &I, CodeGenCoverage &CoverageInfo) const; 50 51 bool selectFPToInt(MachineInstr &I, MachineBasicBlock &MBB, 52 MachineRegisterInfo &MRI) const; 53 bool selectIntToFP(MachineInstr &I, MachineBasicBlock &MBB, 54 MachineRegisterInfo &MRI) const; 55 56 bool selectZExt(MachineInstr &I, MachineBasicBlock &MBB, 57 MachineRegisterInfo &MRI) const; 58 bool selectConstantPool(MachineInstr &I, MachineBasicBlock &MBB, 59 MachineRegisterInfo &MRI) const; 60 61 std::optional<bool> selectI64ImmDirect(MachineInstr &I, 62 MachineBasicBlock &MBB, 63 MachineRegisterInfo &MRI, Register Reg, 64 uint64_t Imm) const; 65 bool selectI64Imm(MachineInstr &I, MachineBasicBlock &MBB, 66 MachineRegisterInfo &MRI) const; 67 68 const PPCTargetMachine &TM; 69 const PPCSubtarget &STI; 70 const PPCInstrInfo &TII; 71 const PPCRegisterInfo &TRI; 72 const PPCRegisterBankInfo &RBI; 73 74 #define GET_GLOBALISEL_PREDICATES_DECL 75 #include "PPCGenGlobalISel.inc" 76 #undef GET_GLOBALISEL_PREDICATES_DECL 77 78 #define GET_GLOBALISEL_TEMPORARIES_DECL 79 #include "PPCGenGlobalISel.inc" 80 #undef GET_GLOBALISEL_TEMPORARIES_DECL 81 }; 82 83 } // end anonymous namespace 84 85 #define GET_GLOBALISEL_IMPL 86 #include "PPCGenGlobalISel.inc" 87 #undef GET_GLOBALISEL_IMPL 88 89 PPCInstructionSelector::PPCInstructionSelector(const PPCTargetMachine &TM, 90 const PPCSubtarget &STI, 91 const PPCRegisterBankInfo &RBI) 92 : TM(TM), STI(STI), TII(*STI.getInstrInfo()), TRI(*STI.getRegisterInfo()), 93 RBI(RBI), 94 #define GET_GLOBALISEL_PREDICATES_INIT 95 #include "PPCGenGlobalISel.inc" 96 #undef GET_GLOBALISEL_PREDICATES_INIT 97 #define GET_GLOBALISEL_TEMPORARIES_INIT 98 #include "PPCGenGlobalISel.inc" 99 #undef GET_GLOBALISEL_TEMPORARIES_INIT 100 { 101 } 102 103 static const TargetRegisterClass *getRegClass(LLT Ty, const RegisterBank *RB) { 104 if (RB->getID() == PPC::GPRRegBankID) { 105 if (Ty.getSizeInBits() == 64) 106 return &PPC::G8RCRegClass; 107 if (Ty.getSizeInBits() <= 32) 108 return &PPC::GPRCRegClass; 109 } 110 if (RB->getID() == PPC::FPRRegBankID) { 111 if (Ty.getSizeInBits() == 32) 112 return &PPC::F4RCRegClass; 113 if (Ty.getSizeInBits() == 64) 114 return &PPC::F8RCRegClass; 115 } 116 if (RB->getID() == PPC::VECRegBankID) { 117 if (Ty.getSizeInBits() == 128) 118 return &PPC::VSRCRegClass; 119 } 120 if (RB->getID() == PPC::CRRegBankID) { 121 if (Ty.getSizeInBits() == 1) 122 return &PPC::CRBITRCRegClass; 123 if (Ty.getSizeInBits() == 4) 124 return &PPC::CRRCRegClass; 125 } 126 127 llvm_unreachable("Unknown RegBank!"); 128 } 129 130 static bool selectCopy(MachineInstr &I, const TargetInstrInfo &TII, 131 MachineRegisterInfo &MRI, const TargetRegisterInfo &TRI, 132 const RegisterBankInfo &RBI) { 133 Register DstReg = I.getOperand(0).getReg(); 134 135 if (DstReg.isPhysical()) 136 return true; 137 138 const RegisterBank *DstRegBank = RBI.getRegBank(DstReg, MRI, TRI); 139 const TargetRegisterClass *DstRC = 140 getRegClass(MRI.getType(DstReg), DstRegBank); 141 142 // No need to constrain SrcReg. It will get constrained when we hit another of 143 // its use or its defs. 144 // Copies do not have constraints. 145 if (!RBI.constrainGenericRegister(DstReg, *DstRC, MRI)) { 146 LLVM_DEBUG(dbgs() << "Failed to constrain " << TII.getName(I.getOpcode()) 147 << " operand\n"); 148 return false; 149 } 150 151 return true; 152 } 153 154 static unsigned selectLoadStoreOp(unsigned GenericOpc, unsigned RegBankID, 155 unsigned OpSize) { 156 const bool IsStore = GenericOpc == TargetOpcode::G_STORE; 157 switch (RegBankID) { 158 case PPC::GPRRegBankID: 159 switch (OpSize) { 160 case 32: 161 return IsStore ? PPC::STW : PPC::LWZ; 162 case 64: 163 return IsStore ? PPC::STD : PPC::LD; 164 default: 165 llvm_unreachable("Unexpected size!"); 166 } 167 break; 168 case PPC::FPRRegBankID: 169 switch (OpSize) { 170 case 32: 171 return IsStore ? PPC::STFS : PPC::LFS; 172 case 64: 173 return IsStore ? PPC::STFD : PPC::LFD; 174 default: 175 llvm_unreachable("Unexpected size!"); 176 } 177 break; 178 default: 179 llvm_unreachable("Unexpected register bank!"); 180 } 181 return GenericOpc; 182 } 183 184 bool PPCInstructionSelector::selectIntToFP(MachineInstr &I, 185 MachineBasicBlock &MBB, 186 MachineRegisterInfo &MRI) const { 187 if (!STI.hasDirectMove() || !STI.isPPC64() || !STI.hasFPCVT()) 188 return false; 189 190 const DebugLoc &DbgLoc = I.getDebugLoc(); 191 const Register DstReg = I.getOperand(0).getReg(); 192 const Register SrcReg = I.getOperand(1).getReg(); 193 194 Register MoveReg = MRI.createVirtualRegister(&PPC::VSFRCRegClass); 195 196 // For now, only handle the case for 64 bit integer. 197 BuildMI(MBB, I, DbgLoc, TII.get(PPC::MTVSRD), MoveReg).addReg(SrcReg); 198 199 bool IsSingle = MRI.getType(DstReg).getSizeInBits() == 32; 200 bool IsSigned = I.getOpcode() == TargetOpcode::G_SITOFP; 201 unsigned ConvOp = IsSingle ? (IsSigned ? PPC::XSCVSXDSP : PPC::XSCVUXDSP) 202 : (IsSigned ? PPC::XSCVSXDDP : PPC::XSCVUXDDP); 203 204 MachineInstr *MI = 205 BuildMI(MBB, I, DbgLoc, TII.get(ConvOp), DstReg).addReg(MoveReg); 206 207 I.eraseFromParent(); 208 return constrainSelectedInstRegOperands(*MI, TII, TRI, RBI); 209 } 210 211 bool PPCInstructionSelector::selectFPToInt(MachineInstr &I, 212 MachineBasicBlock &MBB, 213 MachineRegisterInfo &MRI) const { 214 if (!STI.hasDirectMove() || !STI.isPPC64() || !STI.hasFPCVT()) 215 return false; 216 217 const DebugLoc &DbgLoc = I.getDebugLoc(); 218 const Register DstReg = I.getOperand(0).getReg(); 219 const Register SrcReg = I.getOperand(1).getReg(); 220 221 Register CopyReg = MRI.createVirtualRegister(&PPC::VSFRCRegClass); 222 BuildMI(MBB, I, DbgLoc, TII.get(TargetOpcode::COPY), CopyReg).addReg(SrcReg); 223 224 Register ConvReg = MRI.createVirtualRegister(&PPC::VSFRCRegClass); 225 226 bool IsSigned = I.getOpcode() == TargetOpcode::G_FPTOSI; 227 228 // single-precision is stored as double-precision on PPC in registers, so 229 // always use double-precision convertions. 230 unsigned ConvOp = IsSigned ? PPC::XSCVDPSXDS : PPC::XSCVDPUXDS; 231 232 BuildMI(MBB, I, DbgLoc, TII.get(ConvOp), ConvReg).addReg(CopyReg); 233 234 MachineInstr *MI = 235 BuildMI(MBB, I, DbgLoc, TII.get(PPC::MFVSRD), DstReg).addReg(ConvReg); 236 237 I.eraseFromParent(); 238 return constrainSelectedInstRegOperands(*MI, TII, TRI, RBI); 239 } 240 241 bool PPCInstructionSelector::selectZExt(MachineInstr &I, MachineBasicBlock &MBB, 242 MachineRegisterInfo &MRI) const { 243 const Register DstReg = I.getOperand(0).getReg(); 244 const LLT DstTy = MRI.getType(DstReg); 245 const RegisterBank *DstRegBank = RBI.getRegBank(DstReg, MRI, TRI); 246 247 const Register SrcReg = I.getOperand(1).getReg(); 248 249 assert(DstTy.getSizeInBits() == 64 && "Unexpected dest size!"); 250 assert(MRI.getType(SrcReg).getSizeInBits() == 32 && "Unexpected src size!"); 251 252 Register ImpDefReg = 253 MRI.createVirtualRegister(getRegClass(DstTy, DstRegBank)); 254 BuildMI(MBB, I, I.getDebugLoc(), TII.get(TargetOpcode::IMPLICIT_DEF), 255 ImpDefReg); 256 257 Register NewDefReg = 258 MRI.createVirtualRegister(getRegClass(DstTy, DstRegBank)); 259 BuildMI(MBB, I, I.getDebugLoc(), TII.get(TargetOpcode::INSERT_SUBREG), 260 NewDefReg) 261 .addReg(ImpDefReg) 262 .addReg(SrcReg) 263 .addImm(PPC::sub_32); 264 265 MachineInstr *MI = 266 BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDICL), DstReg) 267 .addReg(NewDefReg) 268 .addImm(0) 269 .addImm(32); 270 271 I.eraseFromParent(); 272 return constrainSelectedInstRegOperands(*MI, TII, TRI, RBI); 273 } 274 275 // For any 32 < Num < 64, check if the Imm contains at least Num consecutive 276 // zeros and return the number of bits by the left of these consecutive zeros. 277 static uint32_t findContiguousZerosAtLeast(uint64_t Imm, unsigned Num) { 278 uint32_t HiTZ = llvm::countr_zero<uint32_t>(Hi_32(Imm)); 279 uint32_t LoLZ = llvm::countl_zero<uint32_t>(Lo_32(Imm)); 280 if ((HiTZ + LoLZ) >= Num) 281 return (32 + HiTZ); 282 return 0; 283 } 284 285 // Direct materialization of 64-bit constants by enumerated patterns. 286 // Similar to PPCISelDAGToDAG::selectI64ImmDirect(). 287 std::optional<bool> PPCInstructionSelector::selectI64ImmDirect(MachineInstr &I, 288 MachineBasicBlock &MBB, 289 MachineRegisterInfo &MRI, 290 Register Reg, 291 uint64_t Imm) const { 292 unsigned TZ = llvm::countr_zero<uint64_t>(Imm); 293 unsigned LZ = llvm::countl_zero<uint64_t>(Imm); 294 unsigned TO = llvm::countr_one<uint64_t>(Imm); 295 unsigned LO = llvm::countl_one<uint64_t>(Imm); 296 uint32_t Hi32 = Hi_32(Imm); 297 uint32_t Lo32 = Lo_32(Imm); 298 uint32_t Shift = 0; 299 300 // Following patterns use 1 instructions to materialize the Imm. 301 302 // 1-1) Patterns : {zeros}{15-bit valve} 303 // {ones}{15-bit valve} 304 if (isInt<16>(Imm)) 305 return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LI8), Reg) 306 .addImm(Imm) 307 .constrainAllUses(TII, TRI, RBI); 308 // 1-2) Patterns : {zeros}{15-bit valve}{16 zeros} 309 // {ones}{15-bit valve}{16 zeros} 310 if (TZ > 15 && (LZ > 32 || LO > 32)) 311 return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LIS8), Reg) 312 .addImm((Imm >> 16) & 0xffff) 313 .constrainAllUses(TII, TRI, RBI); 314 315 // Following patterns use 2 instructions to materialize the Imm. 316 317 assert(LZ < 64 && "Unexpected leading zeros here."); 318 // Count of ones follwing the leading zeros. 319 unsigned FO = llvm::countl_one<uint64_t>(Imm << LZ); 320 // 2-1) Patterns : {zeros}{31-bit value} 321 // {ones}{31-bit value} 322 if (isInt<32>(Imm)) { 323 uint64_t ImmHi16 = (Imm >> 16) & 0xffff; 324 unsigned Opcode = ImmHi16 ? PPC::LIS8 : PPC::LI8; 325 Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 326 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(Opcode), TmpReg) 327 .addImm((Imm >> 16) & 0xffff) 328 .constrainAllUses(TII, TRI, RBI)) 329 return false; 330 return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORI8), Reg) 331 .addReg(TmpReg, RegState::Kill) 332 .addImm(Imm & 0xffff) 333 .constrainAllUses(TII, TRI, RBI); 334 } 335 // 2-2) Patterns : {zeros}{ones}{15-bit value}{zeros} 336 // {zeros}{15-bit value}{zeros} 337 // {zeros}{ones}{15-bit value} 338 // {ones}{15-bit value}{zeros} 339 // We can take advantage of LI's sign-extension semantics to generate leading 340 // ones, and then use RLDIC to mask off the ones in both sides after rotation. 341 if ((LZ + FO + TZ) > 48) { 342 Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 343 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LI8), TmpReg) 344 .addImm((Imm >> TZ) & 0xffff) 345 .constrainAllUses(TII, TRI, RBI)) 346 return false; 347 return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDIC), Reg) 348 .addReg(TmpReg, RegState::Kill) 349 .addImm(TZ) 350 .addImm(LZ) 351 .constrainAllUses(TII, TRI, RBI); 352 } 353 // 2-3) Pattern : {zeros}{15-bit value}{ones} 354 // Shift right the Imm by (48 - LZ) bits to construct a negtive 16 bits value, 355 // therefore we can take advantage of LI's sign-extension semantics, and then 356 // mask them off after rotation. 357 // 358 // +--LZ--||-15-bit-||--TO--+ +-------------|--16-bit--+ 359 // |00000001bbbbbbbbb1111111| -> |00000000000001bbbbbbbbb1| 360 // +------------------------+ +------------------------+ 361 // 63 0 63 0 362 // Imm (Imm >> (48 - LZ) & 0xffff) 363 // +----sext-----|--16-bit--+ +clear-|-----------------+ 364 // |11111111111111bbbbbbbbb1| -> |00000001bbbbbbbbb1111111| 365 // +------------------------+ +------------------------+ 366 // 63 0 63 0 367 // LI8: sext many leading zeros RLDICL: rotate left (48 - LZ), clear left LZ 368 if ((LZ + TO) > 48) { 369 // Since the immediates with (LZ > 32) have been handled by previous 370 // patterns, here we have (LZ <= 32) to make sure we will not shift right 371 // the Imm by a negative value. 372 assert(LZ <= 32 && "Unexpected shift value."); 373 Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 374 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LI8), TmpReg) 375 .addImm(Imm >> (48 - LZ) & 0xffff) 376 .constrainAllUses(TII, TRI, RBI)) 377 return false; 378 return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDICL), Reg) 379 .addReg(TmpReg, RegState::Kill) 380 .addImm(48 - LZ) 381 .addImm(LZ) 382 .constrainAllUses(TII, TRI, RBI); 383 } 384 // 2-4) Patterns : {zeros}{ones}{15-bit value}{ones} 385 // {ones}{15-bit value}{ones} 386 // We can take advantage of LI's sign-extension semantics to generate leading 387 // ones, and then use RLDICL to mask off the ones in left sides (if required) 388 // after rotation. 389 // 390 // +-LZ-FO||-15-bit-||--TO--+ +-------------|--16-bit--+ 391 // |00011110bbbbbbbbb1111111| -> |000000000011110bbbbbbbbb| 392 // +------------------------+ +------------------------+ 393 // 63 0 63 0 394 // Imm (Imm >> TO) & 0xffff 395 // +----sext-----|--16-bit--+ +LZ|---------------------+ 396 // |111111111111110bbbbbbbbb| -> |00011110bbbbbbbbb1111111| 397 // +------------------------+ +------------------------+ 398 // 63 0 63 0 399 // LI8: sext many leading zeros RLDICL: rotate left TO, clear left LZ 400 if ((LZ + FO + TO) > 48) { 401 Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 402 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LI8), TmpReg) 403 .addImm((Imm >> TO) & 0xffff) 404 .constrainAllUses(TII, TRI, RBI)) 405 return false; 406 return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDICL), Reg) 407 .addReg(TmpReg, RegState::Kill) 408 .addImm(TO) 409 .addImm(LZ) 410 .constrainAllUses(TII, TRI, RBI); 411 } 412 // 2-5) Pattern : {32 zeros}{****}{0}{15-bit value} 413 // If Hi32 is zero and the Lo16(in Lo32) can be presented as a positive 16 bit 414 // value, we can use LI for Lo16 without generating leading ones then add the 415 // Hi16(in Lo32). 416 if (LZ == 32 && ((Lo32 & 0x8000) == 0)) { 417 Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 418 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LI8), TmpReg) 419 .addImm(Lo32 & 0xffff) 420 .constrainAllUses(TII, TRI, RBI)) 421 return false; 422 return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORIS8), Reg) 423 .addReg(TmpReg, RegState::Kill) 424 .addImm(Lo32 >> 16) 425 .constrainAllUses(TII, TRI, RBI); 426 } 427 // 2-6) Patterns : {******}{49 zeros}{******} 428 // {******}{49 ones}{******} 429 // If the Imm contains 49 consecutive zeros/ones, it means that a total of 15 430 // bits remain on both sides. Rotate right the Imm to construct an int<16> 431 // value, use LI for int<16> value and then use RLDICL without mask to rotate 432 // it back. 433 // 434 // 1) findContiguousZerosAtLeast(Imm, 49) 435 // +------|--zeros-|------+ +---ones--||---15 bit--+ 436 // |bbbbbb0000000000aaaaaa| -> |0000000000aaaaaabbbbbb| 437 // +----------------------+ +----------------------+ 438 // 63 0 63 0 439 // 440 // 2) findContiguousZerosAtLeast(~Imm, 49) 441 // +------|--ones--|------+ +---ones--||---15 bit--+ 442 // |bbbbbb1111111111aaaaaa| -> |1111111111aaaaaabbbbbb| 443 // +----------------------+ +----------------------+ 444 // 63 0 63 0 445 if ((Shift = findContiguousZerosAtLeast(Imm, 49)) || 446 (Shift = findContiguousZerosAtLeast(~Imm, 49))) { 447 uint64_t RotImm = APInt(64, Imm).rotr(Shift).getZExtValue(); 448 Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 449 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LI8), TmpReg) 450 .addImm(RotImm & 0xffff) 451 .constrainAllUses(TII, TRI, RBI)) 452 return false; 453 return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDICL), Reg) 454 .addReg(TmpReg, RegState::Kill) 455 .addImm(Shift) 456 .addImm(0) 457 .constrainAllUses(TII, TRI, RBI); 458 } 459 460 // Following patterns use 3 instructions to materialize the Imm. 461 462 // 3-1) Patterns : {zeros}{ones}{31-bit value}{zeros} 463 // {zeros}{31-bit value}{zeros} 464 // {zeros}{ones}{31-bit value} 465 // {ones}{31-bit value}{zeros} 466 // We can take advantage of LIS's sign-extension semantics to generate leading 467 // ones, add the remaining bits with ORI, and then use RLDIC to mask off the 468 // ones in both sides after rotation. 469 if ((LZ + FO + TZ) > 32) { 470 uint64_t ImmHi16 = (Imm >> (TZ + 16)) & 0xffff; 471 unsigned Opcode = ImmHi16 ? PPC::LIS8 : PPC::LI8; 472 Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 473 Register Tmp2Reg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 474 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(Opcode), TmpReg) 475 .addImm(ImmHi16) 476 .constrainAllUses(TII, TRI, RBI)) 477 return false; 478 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORI8), Tmp2Reg) 479 .addReg(TmpReg, RegState::Kill) 480 .addImm((Imm >> TZ) & 0xffff) 481 .constrainAllUses(TII, TRI, RBI)) 482 return false; 483 return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDIC), Reg) 484 .addReg(Tmp2Reg, RegState::Kill) 485 .addImm(TZ) 486 .addImm(LZ) 487 .constrainAllUses(TII, TRI, RBI); 488 } 489 // 3-2) Pattern : {zeros}{31-bit value}{ones} 490 // Shift right the Imm by (32 - LZ) bits to construct a negative 32 bits 491 // value, therefore we can take advantage of LIS's sign-extension semantics, 492 // add the remaining bits with ORI, and then mask them off after rotation. 493 // This is similar to Pattern 2-3, please refer to the diagram there. 494 if ((LZ + TO) > 32) { 495 // Since the immediates with (LZ > 32) have been handled by previous 496 // patterns, here we have (LZ <= 32) to make sure we will not shift right 497 // the Imm by a negative value. 498 assert(LZ <= 32 && "Unexpected shift value."); 499 Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 500 Register Tmp2Reg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 501 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LIS8), TmpReg) 502 .addImm((Imm >> (48 - LZ)) & 0xffff) 503 .constrainAllUses(TII, TRI, RBI)) 504 return false; 505 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORI8), Tmp2Reg) 506 .addReg(TmpReg, RegState::Kill) 507 .addImm((Imm >> (32 - LZ)) & 0xffff) 508 .constrainAllUses(TII, TRI, RBI)) 509 return false; 510 return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDICL), Reg) 511 .addReg(Tmp2Reg, RegState::Kill) 512 .addImm(32 - LZ) 513 .addImm(LZ) 514 .constrainAllUses(TII, TRI, RBI); 515 } 516 // 3-3) Patterns : {zeros}{ones}{31-bit value}{ones} 517 // {ones}{31-bit value}{ones} 518 // We can take advantage of LIS's sign-extension semantics to generate leading 519 // ones, add the remaining bits with ORI, and then use RLDICL to mask off the 520 // ones in left sides (if required) after rotation. 521 // This is similar to Pattern 2-4, please refer to the diagram there. 522 if ((LZ + FO + TO) > 32) { 523 Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 524 Register Tmp2Reg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 525 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::LIS8), TmpReg) 526 .addImm((Imm >> (TO + 16)) & 0xffff) 527 .constrainAllUses(TII, TRI, RBI)) 528 return false; 529 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORI8), Tmp2Reg) 530 .addReg(TmpReg, RegState::Kill) 531 .addImm((Imm >> TO) & 0xffff) 532 .constrainAllUses(TII, TRI, RBI)) 533 return false; 534 return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDICL), Reg) 535 .addReg(Tmp2Reg, RegState::Kill) 536 .addImm(TO) 537 .addImm(LZ) 538 .constrainAllUses(TII, TRI, RBI); 539 } 540 // 3-4) Patterns : High word == Low word 541 if (Hi32 == Lo32) { 542 // Handle the first 32 bits. 543 uint64_t ImmHi16 = (Lo32 >> 16) & 0xffff; 544 unsigned Opcode = ImmHi16 ? PPC::LIS8 : PPC::LI8; 545 Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 546 Register Tmp2Reg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 547 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(Opcode), TmpReg) 548 .addImm(ImmHi16) 549 .constrainAllUses(TII, TRI, RBI)) 550 return false; 551 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORI8), Tmp2Reg) 552 .addReg(TmpReg, RegState::Kill) 553 .addImm(Lo32 & 0xffff) 554 .constrainAllUses(TII, TRI, RBI)) 555 return false; 556 return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDIMI), Reg) 557 .addReg(Tmp2Reg) 558 .addReg(Tmp2Reg, RegState::Kill) 559 .addImm(32) 560 .addImm(0) 561 .constrainAllUses(TII, TRI, RBI); 562 } 563 // 3-5) Patterns : {******}{33 zeros}{******} 564 // {******}{33 ones}{******} 565 // If the Imm contains 33 consecutive zeros/ones, it means that a total of 31 566 // bits remain on both sides. Rotate right the Imm to construct an int<32> 567 // value, use LIS + ORI for int<32> value and then use RLDICL without mask to 568 // rotate it back. 569 // This is similar to Pattern 2-6, please refer to the diagram there. 570 if ((Shift = findContiguousZerosAtLeast(Imm, 33)) || 571 (Shift = findContiguousZerosAtLeast(~Imm, 33))) { 572 uint64_t RotImm = APInt(64, Imm).rotr(Shift).getZExtValue(); 573 uint64_t ImmHi16 = (RotImm >> 16) & 0xffff; 574 unsigned Opcode = ImmHi16 ? PPC::LIS8 : PPC::LI8; 575 Register TmpReg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 576 Register Tmp2Reg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 577 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(Opcode), TmpReg) 578 .addImm(ImmHi16) 579 .constrainAllUses(TII, TRI, RBI)) 580 return false; 581 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORI8), Tmp2Reg) 582 .addReg(TmpReg, RegState::Kill) 583 .addImm(RotImm & 0xffff) 584 .constrainAllUses(TII, TRI, RBI)) 585 return false; 586 return BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::RLDICL), Reg) 587 .addReg(Tmp2Reg, RegState::Kill) 588 .addImm(Shift) 589 .addImm(0) 590 .constrainAllUses(TII, TRI, RBI); 591 } 592 593 // If we end up here then no instructions were inserted. 594 return std::nullopt; 595 } 596 597 // Derived from PPCISelDAGToDAG::selectI64Imm(). 598 // TODO: Add support for prefixed instructions. 599 bool PPCInstructionSelector::selectI64Imm(MachineInstr &I, 600 MachineBasicBlock &MBB, 601 MachineRegisterInfo &MRI) const { 602 assert(I.getOpcode() == TargetOpcode::G_CONSTANT && "Unexpected G code"); 603 604 Register DstReg = I.getOperand(0).getReg(); 605 int64_t Imm = I.getOperand(1).getCImm()->getValue().getZExtValue(); 606 // No more than 3 instructions are used if we can select the i64 immediate 607 // directly. 608 if (std::optional<bool> Res = selectI64ImmDirect(I, MBB, MRI, DstReg, Imm)) { 609 I.eraseFromParent(); 610 return *Res; 611 } 612 613 // Calculate the last bits as required. 614 uint32_t Hi16 = (Lo_32(Imm) >> 16) & 0xffff; 615 uint32_t Lo16 = Lo_32(Imm) & 0xffff; 616 617 Register Reg = 618 (Hi16 || Lo16) ? MRI.createVirtualRegister(&PPC::G8RCRegClass) : DstReg; 619 620 // Handle the upper 32 bit value. 621 std::optional<bool> Res = 622 selectI64ImmDirect(I, MBB, MRI, Reg, Imm & 0xffffffff00000000); 623 if (!Res || !*Res) 624 return false; 625 626 // Add in the last bits as required. 627 if (Hi16) { 628 Register TmpReg = 629 Lo16 ? MRI.createVirtualRegister(&PPC::G8RCRegClass) : DstReg; 630 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORIS8), TmpReg) 631 .addReg(Reg, RegState::Kill) 632 .addImm(Hi16) 633 .constrainAllUses(TII, TRI, RBI)) 634 return false; 635 Reg = TmpReg; 636 } 637 if (Lo16) { 638 if (!BuildMI(MBB, I, I.getDebugLoc(), TII.get(PPC::ORI8), DstReg) 639 .addReg(Reg, RegState::Kill) 640 .addImm(Lo16) 641 .constrainAllUses(TII, TRI, RBI)) 642 return false; 643 } 644 I.eraseFromParent(); 645 return true; 646 } 647 648 bool PPCInstructionSelector::selectConstantPool( 649 MachineInstr &I, MachineBasicBlock &MBB, MachineRegisterInfo &MRI) const { 650 const DebugLoc &DbgLoc = I.getDebugLoc(); 651 MachineFunction *MF = MBB.getParent(); 652 653 // TODO: handle 32-bit. 654 // TODO: Enabling floating point constant pool selection on AIX requires 655 // global isel on big endian target enabled first. 656 // See CallLowering::enableBigEndian(). 657 if (!STI.isPPC64() || !STI.isLittleEndian()) 658 return false; 659 660 MF->getInfo<PPCFunctionInfo>()->setUsesTOCBasePtr(); 661 662 const Register DstReg = I.getOperand(0).getReg(); 663 unsigned CPI = I.getOperand(1).getIndex(); 664 665 // Address stored in the TOC entry. This is related to code model and the ABI 666 // we are currently using. For now we only handle 64-bit Linux LE. PowerPC 667 // only supports small, medium and large code model. 668 const CodeModel::Model CModel = TM.getCodeModel(); 669 assert(!(CModel == CodeModel::Tiny || CModel == CodeModel::Kernel) && 670 "PowerPC doesn't support tiny or kernel code models."); 671 672 const MCRegister TOCReg = STI.getTOCPointerRegister(); 673 MachineMemOperand *MMO = MF->getMachineMemOperand( 674 MachinePointerInfo::getGOT(*MF), MachineMemOperand::MOLoad, 675 MRI.getType(DstReg), MF->getDataLayout().getPointerABIAlignment(0)); 676 677 MachineInstr *MI = nullptr; 678 // For now we only handle 64-bit Linux. 679 if (CModel == CodeModel::Small) { 680 // For small code model, generate LDtocCPT(CPI, X2). 681 MI = BuildMI(MBB, I, DbgLoc, TII.get(PPC::LDtocCPT), DstReg) 682 .addConstantPoolIndex(CPI) 683 .addReg(TOCReg) 684 .addMemOperand(MMO); 685 } else { 686 Register HaAddrReg = MRI.createVirtualRegister(&PPC::G8RCRegClass); 687 BuildMI(MBB, I, DbgLoc, TII.get(PPC::ADDIStocHA8), HaAddrReg) 688 .addReg(TOCReg) 689 .addConstantPoolIndex(CPI); 690 691 if (CModel == CodeModel::Large) 692 // For large code model, generate LDtocL(CPI, ADDIStocHA8(X2, CPI)) 693 MI = BuildMI(MBB, I, DbgLoc, TII.get(PPC::LDtocL), DstReg) 694 .addConstantPoolIndex(CPI) 695 .addReg(HaAddrReg) 696 .addMemOperand(MMO); 697 else 698 // For medium code model, generate ADDItocL8(CPI, ADDIStocHA8(X2, CPI)) 699 MI = BuildMI(MBB, I, DbgLoc, TII.get(PPC::ADDItocL8), DstReg) 700 .addReg(HaAddrReg) 701 .addConstantPoolIndex(CPI); 702 } 703 704 I.eraseFromParent(); 705 return constrainSelectedInstRegOperands(*MI, TII, TRI, RBI); 706 } 707 708 bool PPCInstructionSelector::select(MachineInstr &I) { 709 auto &MBB = *I.getParent(); 710 auto &MF = *MBB.getParent(); 711 auto &MRI = MF.getRegInfo(); 712 713 if (!isPreISelGenericOpcode(I.getOpcode())) { 714 if (I.isCopy()) 715 return selectCopy(I, TII, MRI, TRI, RBI); 716 717 return true; 718 } 719 720 if (selectImpl(I, *CoverageInfo)) 721 return true; 722 723 unsigned Opcode = I.getOpcode(); 724 725 switch (Opcode) { 726 default: 727 return false; 728 case TargetOpcode::G_LOAD: 729 case TargetOpcode::G_STORE: { 730 GLoadStore &LdSt = cast<GLoadStore>(I); 731 LLT PtrTy = MRI.getType(LdSt.getPointerReg()); 732 733 if (PtrTy != LLT::pointer(0, 64)) { 734 LLVM_DEBUG(dbgs() << "Load/Store pointer has type: " << PtrTy 735 << ", expected: " << LLT::pointer(0, 64) << '\n'); 736 return false; 737 } 738 739 auto SelectLoadStoreAddressingMode = [&]() -> MachineInstr * { 740 const unsigned NewOpc = selectLoadStoreOp( 741 I.getOpcode(), RBI.getRegBank(LdSt.getReg(0), MRI, TRI)->getID(), 742 LdSt.getMemSizeInBits().getValue()); 743 744 if (NewOpc == I.getOpcode()) 745 return nullptr; 746 747 // For now, simply use DForm with load/store addr as base and 0 as imm. 748 // FIXME: optimize load/store with some specific address patterns. 749 I.setDesc(TII.get(NewOpc)); 750 Register AddrReg = I.getOperand(1).getReg(); 751 bool IsKill = I.getOperand(1).isKill(); 752 I.getOperand(1).ChangeToImmediate(0); 753 I.addOperand(*I.getParent()->getParent(), 754 MachineOperand::CreateReg(AddrReg, /* isDef */ false, 755 /* isImp */ false, IsKill)); 756 return &I; 757 }; 758 759 MachineInstr *LoadStore = SelectLoadStoreAddressingMode(); 760 if (!LoadStore) 761 return false; 762 763 return constrainSelectedInstRegOperands(*LoadStore, TII, TRI, RBI); 764 } 765 case TargetOpcode::G_SITOFP: 766 case TargetOpcode::G_UITOFP: 767 return selectIntToFP(I, MBB, MRI); 768 case TargetOpcode::G_FPTOSI: 769 case TargetOpcode::G_FPTOUI: 770 return selectFPToInt(I, MBB, MRI); 771 // G_SEXT will be selected in tb-gen pattern. 772 case TargetOpcode::G_ZEXT: 773 return selectZExt(I, MBB, MRI); 774 case TargetOpcode::G_CONSTANT: 775 return selectI64Imm(I, MBB, MRI); 776 case TargetOpcode::G_CONSTANT_POOL: 777 return selectConstantPool(I, MBB, MRI); 778 } 779 return false; 780 } 781 782 namespace llvm { 783 InstructionSelector * 784 createPPCInstructionSelector(const PPCTargetMachine &TM, 785 const PPCSubtarget &Subtarget, 786 const PPCRegisterBankInfo &RBI) { 787 return new PPCInstructionSelector(TM, Subtarget, RBI); 788 } 789 } // end namespace llvm 790