1 //===-- RISCVFrameLowering.cpp - RISC-V Frame Information -----------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This file contains the RISC-V implementation of TargetFrameLowering class. 10 // 11 //===----------------------------------------------------------------------===// 12 13 #include "RISCVFrameLowering.h" 14 #include "RISCVMachineFunctionInfo.h" 15 #include "RISCVSubtarget.h" 16 #include "llvm/BinaryFormat/Dwarf.h" 17 #include "llvm/CodeGen/MachineFrameInfo.h" 18 #include "llvm/CodeGen/MachineFunction.h" 19 #include "llvm/CodeGen/MachineInstrBuilder.h" 20 #include "llvm/CodeGen/MachineRegisterInfo.h" 21 #include "llvm/CodeGen/RegisterScavenging.h" 22 #include "llvm/IR/DiagnosticInfo.h" 23 #include "llvm/MC/MCDwarf.h" 24 #include "llvm/Support/LEB128.h" 25 26 #include <algorithm> 27 28 using namespace llvm; 29 30 static Align getABIStackAlignment(RISCVABI::ABI ABI) { 31 if (ABI == RISCVABI::ABI_ILP32E) 32 return Align(4); 33 if (ABI == RISCVABI::ABI_LP64E) 34 return Align(8); 35 return Align(16); 36 } 37 38 RISCVFrameLowering::RISCVFrameLowering(const RISCVSubtarget &STI) 39 : TargetFrameLowering( 40 StackGrowsDown, getABIStackAlignment(STI.getTargetABI()), 41 /*LocalAreaOffset=*/0, 42 /*TransientStackAlignment=*/getABIStackAlignment(STI.getTargetABI())), 43 STI(STI) {} 44 45 // Offsets which need to be scale by XLen representing locations of CSRs which 46 // are given a fixed location by save/restore libcalls or Zcmp Push/Pop. 47 static const std::pair<MCPhysReg, int8_t> FixedCSRFIMap[] = { 48 {/*ra*/ RISCV::X1, -1}, {/*s0*/ RISCV::X8, -2}, 49 {/*s1*/ RISCV::X9, -3}, {/*s2*/ RISCV::X18, -4}, 50 {/*s3*/ RISCV::X19, -5}, {/*s4*/ RISCV::X20, -6}, 51 {/*s5*/ RISCV::X21, -7}, {/*s6*/ RISCV::X22, -8}, 52 {/*s7*/ RISCV::X23, -9}, {/*s8*/ RISCV::X24, -10}, 53 {/*s9*/ RISCV::X25, -11}, {/*s10*/ RISCV::X26, -12}, 54 {/*s11*/ RISCV::X27, -13}}; 55 56 // For now we use x3, a.k.a gp, as pointer to shadow call stack. 57 // User should not use x3 in their asm. 58 static void emitSCSPrologue(MachineFunction &MF, MachineBasicBlock &MBB, 59 MachineBasicBlock::iterator MI, 60 const DebugLoc &DL) { 61 if (!MF.getFunction().hasFnAttribute(Attribute::ShadowCallStack)) 62 return; 63 64 const auto &STI = MF.getSubtarget<RISCVSubtarget>(); 65 const llvm::RISCVRegisterInfo *TRI = STI.getRegisterInfo(); 66 Register RAReg = TRI->getRARegister(); 67 68 // Do not save RA to the SCS if it's not saved to the regular stack, 69 // i.e. RA is not at risk of being overwritten. 70 std::vector<CalleeSavedInfo> &CSI = MF.getFrameInfo().getCalleeSavedInfo(); 71 if (llvm::none_of( 72 CSI, [&](CalleeSavedInfo &CSR) { return CSR.getReg() == RAReg; })) 73 return; 74 75 const RISCVInstrInfo *TII = STI.getInstrInfo(); 76 if (!STI.hasForcedSWShadowStack() && STI.hasStdExtZicfiss()) { 77 BuildMI(MBB, MI, DL, TII->get(RISCV::SSPUSH)).addReg(RAReg); 78 return; 79 } 80 81 Register SCSPReg = RISCVABI::getSCSPReg(); 82 83 bool IsRV64 = STI.hasFeature(RISCV::Feature64Bit); 84 int64_t SlotSize = STI.getXLen() / 8; 85 // Store return address to shadow call stack 86 // addi gp, gp, [4|8] 87 // s[w|d] ra, -[4|8](gp) 88 BuildMI(MBB, MI, DL, TII->get(RISCV::ADDI)) 89 .addReg(SCSPReg, RegState::Define) 90 .addReg(SCSPReg) 91 .addImm(SlotSize) 92 .setMIFlag(MachineInstr::FrameSetup); 93 BuildMI(MBB, MI, DL, TII->get(IsRV64 ? RISCV::SD : RISCV::SW)) 94 .addReg(RAReg) 95 .addReg(SCSPReg) 96 .addImm(-SlotSize) 97 .setMIFlag(MachineInstr::FrameSetup); 98 99 // Emit a CFI instruction that causes SlotSize to be subtracted from the value 100 // of the shadow stack pointer when unwinding past this frame. 101 char DwarfSCSReg = TRI->getDwarfRegNum(SCSPReg, /*IsEH*/ true); 102 assert(DwarfSCSReg < 32 && "SCS Register should be < 32 (X3)."); 103 104 char Offset = static_cast<char>(-SlotSize) & 0x7f; 105 const char CFIInst[] = { 106 dwarf::DW_CFA_val_expression, 107 DwarfSCSReg, // register 108 2, // length 109 static_cast<char>(unsigned(dwarf::DW_OP_breg0 + DwarfSCSReg)), 110 Offset, // addend (sleb128) 111 }; 112 113 unsigned CFIIndex = MF.addFrameInst(MCCFIInstruction::createEscape( 114 nullptr, StringRef(CFIInst, sizeof(CFIInst)))); 115 BuildMI(MBB, MI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION)) 116 .addCFIIndex(CFIIndex) 117 .setMIFlag(MachineInstr::FrameSetup); 118 } 119 120 static void emitSCSEpilogue(MachineFunction &MF, MachineBasicBlock &MBB, 121 MachineBasicBlock::iterator MI, 122 const DebugLoc &DL) { 123 if (!MF.getFunction().hasFnAttribute(Attribute::ShadowCallStack)) 124 return; 125 126 const auto &STI = MF.getSubtarget<RISCVSubtarget>(); 127 Register RAReg = STI.getRegisterInfo()->getRARegister(); 128 129 // See emitSCSPrologue() above. 130 std::vector<CalleeSavedInfo> &CSI = MF.getFrameInfo().getCalleeSavedInfo(); 131 if (llvm::none_of( 132 CSI, [&](CalleeSavedInfo &CSR) { return CSR.getReg() == RAReg; })) 133 return; 134 135 const RISCVInstrInfo *TII = STI.getInstrInfo(); 136 if (!STI.hasForcedSWShadowStack() && STI.hasStdExtZicfiss()) { 137 BuildMI(MBB, MI, DL, TII->get(RISCV::SSPOPCHK)).addReg(RAReg); 138 return; 139 } 140 141 Register SCSPReg = RISCVABI::getSCSPReg(); 142 143 bool IsRV64 = STI.hasFeature(RISCV::Feature64Bit); 144 int64_t SlotSize = STI.getXLen() / 8; 145 // Load return address from shadow call stack 146 // l[w|d] ra, -[4|8](gp) 147 // addi gp, gp, -[4|8] 148 BuildMI(MBB, MI, DL, TII->get(IsRV64 ? RISCV::LD : RISCV::LW)) 149 .addReg(RAReg, RegState::Define) 150 .addReg(SCSPReg) 151 .addImm(-SlotSize) 152 .setMIFlag(MachineInstr::FrameDestroy); 153 BuildMI(MBB, MI, DL, TII->get(RISCV::ADDI)) 154 .addReg(SCSPReg, RegState::Define) 155 .addReg(SCSPReg) 156 .addImm(-SlotSize) 157 .setMIFlag(MachineInstr::FrameDestroy); 158 // Restore the SCS pointer 159 unsigned CFIIndex = MF.addFrameInst(MCCFIInstruction::createRestore( 160 nullptr, STI.getRegisterInfo()->getDwarfRegNum(SCSPReg, /*IsEH*/ true))); 161 BuildMI(MBB, MI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION)) 162 .addCFIIndex(CFIIndex) 163 .setMIFlags(MachineInstr::FrameDestroy); 164 } 165 166 // Get the ID of the libcall used for spilling and restoring callee saved 167 // registers. The ID is representative of the number of registers saved or 168 // restored by the libcall, except it is zero-indexed - ID 0 corresponds to a 169 // single register. 170 static int getLibCallID(const MachineFunction &MF, 171 const std::vector<CalleeSavedInfo> &CSI) { 172 const auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>(); 173 174 if (CSI.empty() || !RVFI->useSaveRestoreLibCalls(MF)) 175 return -1; 176 177 Register MaxReg = RISCV::NoRegister; 178 for (auto &CS : CSI) 179 // assignCalleeSavedSpillSlots assigns negative frame indexes to 180 // registers which can be saved by libcall. 181 if (CS.getFrameIdx() < 0) 182 MaxReg = std::max(MaxReg.id(), CS.getReg().id()); 183 184 if (MaxReg == RISCV::NoRegister) 185 return -1; 186 187 switch (MaxReg) { 188 default: 189 llvm_unreachable("Something has gone wrong!"); 190 case /*s11*/ RISCV::X27: return 12; 191 case /*s10*/ RISCV::X26: return 11; 192 case /*s9*/ RISCV::X25: return 10; 193 case /*s8*/ RISCV::X24: return 9; 194 case /*s7*/ RISCV::X23: return 8; 195 case /*s6*/ RISCV::X22: return 7; 196 case /*s5*/ RISCV::X21: return 6; 197 case /*s4*/ RISCV::X20: return 5; 198 case /*s3*/ RISCV::X19: return 4; 199 case /*s2*/ RISCV::X18: return 3; 200 case /*s1*/ RISCV::X9: return 2; 201 case /*s0*/ RISCV::X8: return 1; 202 case /*ra*/ RISCV::X1: return 0; 203 } 204 } 205 206 // Get the name of the libcall used for spilling callee saved registers. 207 // If this function will not use save/restore libcalls, then return a nullptr. 208 static const char * 209 getSpillLibCallName(const MachineFunction &MF, 210 const std::vector<CalleeSavedInfo> &CSI) { 211 static const char *const SpillLibCalls[] = { 212 "__riscv_save_0", 213 "__riscv_save_1", 214 "__riscv_save_2", 215 "__riscv_save_3", 216 "__riscv_save_4", 217 "__riscv_save_5", 218 "__riscv_save_6", 219 "__riscv_save_7", 220 "__riscv_save_8", 221 "__riscv_save_9", 222 "__riscv_save_10", 223 "__riscv_save_11", 224 "__riscv_save_12" 225 }; 226 227 int LibCallID = getLibCallID(MF, CSI); 228 if (LibCallID == -1) 229 return nullptr; 230 return SpillLibCalls[LibCallID]; 231 } 232 233 // Get the name of the libcall used for restoring callee saved registers. 234 // If this function will not use save/restore libcalls, then return a nullptr. 235 static const char * 236 getRestoreLibCallName(const MachineFunction &MF, 237 const std::vector<CalleeSavedInfo> &CSI) { 238 static const char *const RestoreLibCalls[] = { 239 "__riscv_restore_0", 240 "__riscv_restore_1", 241 "__riscv_restore_2", 242 "__riscv_restore_3", 243 "__riscv_restore_4", 244 "__riscv_restore_5", 245 "__riscv_restore_6", 246 "__riscv_restore_7", 247 "__riscv_restore_8", 248 "__riscv_restore_9", 249 "__riscv_restore_10", 250 "__riscv_restore_11", 251 "__riscv_restore_12" 252 }; 253 254 int LibCallID = getLibCallID(MF, CSI); 255 if (LibCallID == -1) 256 return nullptr; 257 return RestoreLibCalls[LibCallID]; 258 } 259 260 // Return encoded value and register count for PUSH/POP instruction, 261 // representing registers to store/load. 262 static std::pair<unsigned, unsigned> 263 getPushPopEncodingAndNum(const Register MaxReg) { 264 switch (MaxReg) { 265 default: 266 llvm_unreachable("Unexpected Reg for Push/Pop Inst"); 267 case RISCV::X27: /*s11*/ 268 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S11, 13); 269 case RISCV::X25: /*s9*/ 270 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S9, 11); 271 case RISCV::X24: /*s8*/ 272 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S8, 10); 273 case RISCV::X23: /*s7*/ 274 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S7, 9); 275 case RISCV::X22: /*s6*/ 276 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S6, 8); 277 case RISCV::X21: /*s5*/ 278 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S5, 7); 279 case RISCV::X20: /*s4*/ 280 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S4, 6); 281 case RISCV::X19: /*s3*/ 282 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S3, 5); 283 case RISCV::X18: /*s2*/ 284 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S2, 4); 285 case RISCV::X9: /*s1*/ 286 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S1, 3); 287 case RISCV::X8: /*s0*/ 288 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0, 2); 289 case RISCV::X1: /*ra*/ 290 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA, 1); 291 } 292 } 293 294 // Get the max reg of Push/Pop for restoring callee saved registers. 295 static Register getMaxPushPopReg(const MachineFunction &MF, 296 const std::vector<CalleeSavedInfo> &CSI) { 297 Register MaxPushPopReg = RISCV::NoRegister; 298 for (auto &CS : CSI) { 299 if (llvm::find_if(FixedCSRFIMap, [&](auto P) { 300 return P.first == CS.getReg(); 301 }) != std::end(FixedCSRFIMap)) 302 MaxPushPopReg = std::max(MaxPushPopReg.id(), CS.getReg().id()); 303 } 304 assert(MaxPushPopReg != RISCV::X26 && "x26 requires x27 to also be pushed"); 305 return MaxPushPopReg; 306 } 307 308 // Return true if the specified function should have a dedicated frame 309 // pointer register. This is true if frame pointer elimination is 310 // disabled, if it needs dynamic stack realignment, if the function has 311 // variable sized allocas, or if the frame address is taken. 312 bool RISCVFrameLowering::hasFP(const MachineFunction &MF) const { 313 const TargetRegisterInfo *RegInfo = MF.getSubtarget().getRegisterInfo(); 314 315 const MachineFrameInfo &MFI = MF.getFrameInfo(); 316 return MF.getTarget().Options.DisableFramePointerElim(MF) || 317 RegInfo->hasStackRealignment(MF) || MFI.hasVarSizedObjects() || 318 MFI.isFrameAddressTaken(); 319 } 320 321 bool RISCVFrameLowering::hasBP(const MachineFunction &MF) const { 322 const MachineFrameInfo &MFI = MF.getFrameInfo(); 323 const TargetRegisterInfo *TRI = STI.getRegisterInfo(); 324 325 // If we do not reserve stack space for outgoing arguments in prologue, 326 // we will adjust the stack pointer before call instruction. After the 327 // adjustment, we can not use SP to access the stack objects for the 328 // arguments. Instead, use BP to access these stack objects. 329 return (MFI.hasVarSizedObjects() || 330 (!hasReservedCallFrame(MF) && (!MFI.isMaxCallFrameSizeComputed() || 331 MFI.getMaxCallFrameSize() != 0))) && 332 TRI->hasStackRealignment(MF); 333 } 334 335 // Determines the size of the frame and maximum call frame size. 336 void RISCVFrameLowering::determineFrameLayout(MachineFunction &MF) const { 337 MachineFrameInfo &MFI = MF.getFrameInfo(); 338 auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>(); 339 340 // Get the number of bytes to allocate from the FrameInfo. 341 uint64_t FrameSize = MFI.getStackSize(); 342 343 // Get the alignment. 344 Align StackAlign = getStackAlign(); 345 346 // Make sure the frame is aligned. 347 FrameSize = alignTo(FrameSize, StackAlign); 348 349 // Update frame info. 350 MFI.setStackSize(FrameSize); 351 352 // When using SP or BP to access stack objects, we may require extra padding 353 // to ensure the bottom of the RVV stack is correctly aligned within the main 354 // stack. We calculate this as the amount required to align the scalar local 355 // variable section up to the RVV alignment. 356 const TargetRegisterInfo *TRI = STI.getRegisterInfo(); 357 if (RVFI->getRVVStackSize() && (!hasFP(MF) || TRI->hasStackRealignment(MF))) { 358 int ScalarLocalVarSize = FrameSize - RVFI->getCalleeSavedStackSize() - 359 RVFI->getVarArgsSaveSize(); 360 if (auto RVVPadding = 361 offsetToAlignment(ScalarLocalVarSize, RVFI->getRVVStackAlign())) 362 RVFI->setRVVPadding(RVVPadding); 363 } 364 } 365 366 // Returns the stack size including RVV padding (when required), rounded back 367 // up to the required stack alignment. 368 uint64_t RISCVFrameLowering::getStackSizeWithRVVPadding( 369 const MachineFunction &MF) const { 370 const MachineFrameInfo &MFI = MF.getFrameInfo(); 371 auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>(); 372 return alignTo(MFI.getStackSize() + RVFI->getRVVPadding(), getStackAlign()); 373 } 374 375 // Returns the register used to hold the frame pointer. 376 static Register getFPReg(const RISCVSubtarget &STI) { return RISCV::X8; } 377 378 // Returns the register used to hold the stack pointer. 379 static Register getSPReg(const RISCVSubtarget &STI) { return RISCV::X2; } 380 381 static SmallVector<CalleeSavedInfo, 8> 382 getUnmanagedCSI(const MachineFunction &MF, 383 const std::vector<CalleeSavedInfo> &CSI) { 384 const MachineFrameInfo &MFI = MF.getFrameInfo(); 385 SmallVector<CalleeSavedInfo, 8> NonLibcallCSI; 386 387 for (auto &CS : CSI) { 388 int FI = CS.getFrameIdx(); 389 if (FI >= 0 && MFI.getStackID(FI) == TargetStackID::Default) 390 NonLibcallCSI.push_back(CS); 391 } 392 393 return NonLibcallCSI; 394 } 395 396 static SmallVector<CalleeSavedInfo, 8> 397 getRVVCalleeSavedInfo(const MachineFunction &MF, 398 const std::vector<CalleeSavedInfo> &CSI) { 399 const MachineFrameInfo &MFI = MF.getFrameInfo(); 400 SmallVector<CalleeSavedInfo, 8> RVVCSI; 401 402 for (auto &CS : CSI) { 403 int FI = CS.getFrameIdx(); 404 if (FI >= 0 && MFI.getStackID(FI) == TargetStackID::ScalableVector) 405 RVVCSI.push_back(CS); 406 } 407 408 return RVVCSI; 409 } 410 411 void RISCVFrameLowering::adjustStackForRVV(MachineFunction &MF, 412 MachineBasicBlock &MBB, 413 MachineBasicBlock::iterator MBBI, 414 const DebugLoc &DL, int64_t Amount, 415 MachineInstr::MIFlag Flag) const { 416 assert(Amount != 0 && "Did not need to adjust stack pointer for RVV."); 417 418 const Register SPReg = getSPReg(STI); 419 420 // Optimize compile time offset case 421 StackOffset Offset = StackOffset::getScalable(Amount); 422 if (auto VLEN = STI.getRealVLen()) { 423 // 1. Multiply the number of v-slots by the (constant) length of register 424 const int64_t VLENB = *VLEN / 8; 425 assert(Amount % 8 == 0 && 426 "Reserve the stack by the multiple of one vector size."); 427 const int64_t NumOfVReg = Amount / 8; 428 const int64_t FixedOffset = NumOfVReg * VLENB; 429 if (!isInt<32>(FixedOffset)) { 430 report_fatal_error( 431 "Frame size outside of the signed 32-bit range not supported"); 432 } 433 Offset = StackOffset::getFixed(FixedOffset); 434 } 435 436 const RISCVRegisterInfo &RI = *STI.getRegisterInfo(); 437 // We must keep the stack pointer aligned through any intermediate 438 // updates. 439 RI.adjustReg(MBB, MBBI, DL, SPReg, SPReg, Offset, 440 Flag, getStackAlign()); 441 } 442 443 static void appendScalableVectorExpression(const TargetRegisterInfo &TRI, 444 SmallVectorImpl<char> &Expr, 445 int FixedOffset, int ScalableOffset, 446 llvm::raw_string_ostream &Comment) { 447 unsigned DwarfVLenB = TRI.getDwarfRegNum(RISCV::VLENB, true); 448 uint8_t Buffer[16]; 449 if (FixedOffset) { 450 Expr.push_back(dwarf::DW_OP_consts); 451 Expr.append(Buffer, Buffer + encodeSLEB128(FixedOffset, Buffer)); 452 Expr.push_back((uint8_t)dwarf::DW_OP_plus); 453 Comment << (FixedOffset < 0 ? " - " : " + ") << std::abs(FixedOffset); 454 } 455 456 Expr.push_back((uint8_t)dwarf::DW_OP_consts); 457 Expr.append(Buffer, Buffer + encodeSLEB128(ScalableOffset, Buffer)); 458 459 Expr.push_back((uint8_t)dwarf::DW_OP_bregx); 460 Expr.append(Buffer, Buffer + encodeULEB128(DwarfVLenB, Buffer)); 461 Expr.push_back(0); 462 463 Expr.push_back((uint8_t)dwarf::DW_OP_mul); 464 Expr.push_back((uint8_t)dwarf::DW_OP_plus); 465 466 Comment << (ScalableOffset < 0 ? " - " : " + ") << std::abs(ScalableOffset) 467 << " * vlenb"; 468 } 469 470 static MCCFIInstruction createDefCFAExpression(const TargetRegisterInfo &TRI, 471 Register Reg, 472 uint64_t FixedOffset, 473 uint64_t ScalableOffset) { 474 assert(ScalableOffset != 0 && "Did not need to adjust CFA for RVV"); 475 SmallString<64> Expr; 476 std::string CommentBuffer; 477 llvm::raw_string_ostream Comment(CommentBuffer); 478 // Build up the expression (Reg + FixedOffset + ScalableOffset * VLENB). 479 unsigned DwarfReg = TRI.getDwarfRegNum(Reg, true); 480 Expr.push_back((uint8_t)(dwarf::DW_OP_breg0 + DwarfReg)); 481 Expr.push_back(0); 482 if (Reg == RISCV::X2) 483 Comment << "sp"; 484 else 485 Comment << printReg(Reg, &TRI); 486 487 appendScalableVectorExpression(TRI, Expr, FixedOffset, ScalableOffset, 488 Comment); 489 490 SmallString<64> DefCfaExpr; 491 uint8_t Buffer[16]; 492 DefCfaExpr.push_back(dwarf::DW_CFA_def_cfa_expression); 493 DefCfaExpr.append(Buffer, Buffer + encodeULEB128(Expr.size(), Buffer)); 494 DefCfaExpr.append(Expr.str()); 495 496 return MCCFIInstruction::createEscape(nullptr, DefCfaExpr.str(), SMLoc(), 497 Comment.str()); 498 } 499 500 static MCCFIInstruction createDefCFAOffset(const TargetRegisterInfo &TRI, 501 Register Reg, uint64_t FixedOffset, 502 uint64_t ScalableOffset) { 503 assert(ScalableOffset != 0 && "Did not need to adjust CFA for RVV"); 504 SmallString<64> Expr; 505 std::string CommentBuffer; 506 llvm::raw_string_ostream Comment(CommentBuffer); 507 Comment << printReg(Reg, &TRI) << " @ cfa"; 508 509 // Build up the expression (FixedOffset + ScalableOffset * VLENB). 510 appendScalableVectorExpression(TRI, Expr, FixedOffset, ScalableOffset, 511 Comment); 512 513 SmallString<64> DefCfaExpr; 514 uint8_t Buffer[16]; 515 unsigned DwarfReg = TRI.getDwarfRegNum(Reg, true); 516 DefCfaExpr.push_back(dwarf::DW_CFA_expression); 517 DefCfaExpr.append(Buffer, Buffer + encodeULEB128(DwarfReg, Buffer)); 518 DefCfaExpr.append(Buffer, Buffer + encodeULEB128(Expr.size(), Buffer)); 519 DefCfaExpr.append(Expr.str()); 520 521 return MCCFIInstruction::createEscape(nullptr, DefCfaExpr.str(), SMLoc(), 522 Comment.str()); 523 } 524 525 void RISCVFrameLowering::emitPrologue(MachineFunction &MF, 526 MachineBasicBlock &MBB) const { 527 MachineFrameInfo &MFI = MF.getFrameInfo(); 528 auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>(); 529 const RISCVRegisterInfo *RI = STI.getRegisterInfo(); 530 const RISCVInstrInfo *TII = STI.getInstrInfo(); 531 MachineBasicBlock::iterator MBBI = MBB.begin(); 532 533 Register FPReg = getFPReg(STI); 534 Register SPReg = getSPReg(STI); 535 Register BPReg = RISCVABI::getBPReg(); 536 537 // Debug location must be unknown since the first debug location is used 538 // to determine the end of the prologue. 539 DebugLoc DL; 540 541 // All calls are tail calls in GHC calling conv, and functions have no 542 // prologue/epilogue. 543 if (MF.getFunction().getCallingConv() == CallingConv::GHC) 544 return; 545 546 // Emit prologue for shadow call stack. 547 emitSCSPrologue(MF, MBB, MBBI, DL); 548 549 auto FirstFrameSetup = MBBI; 550 551 // Since spillCalleeSavedRegisters may have inserted a libcall, skip past 552 // any instructions marked as FrameSetup 553 while (MBBI != MBB.end() && MBBI->getFlag(MachineInstr::FrameSetup)) 554 ++MBBI; 555 556 // Determine the correct frame layout 557 determineFrameLayout(MF); 558 559 // If libcalls are used to spill and restore callee-saved registers, the frame 560 // has two sections; the opaque section managed by the libcalls, and the 561 // section managed by MachineFrameInfo which can also hold callee saved 562 // registers in fixed stack slots, both of which have negative frame indices. 563 // This gets even more complicated when incoming arguments are passed via the 564 // stack, as these too have negative frame indices. An example is detailed 565 // below: 566 // 567 // | incoming arg | <- FI[-3] 568 // | libcallspill | 569 // | calleespill | <- FI[-2] 570 // | calleespill | <- FI[-1] 571 // | this_frame | <- FI[0] 572 // 573 // For negative frame indices, the offset from the frame pointer will differ 574 // depending on which of these groups the frame index applies to. 575 // The following calculates the correct offset knowing the number of callee 576 // saved registers spilt by the two methods. 577 if (int LibCallRegs = getLibCallID(MF, MFI.getCalleeSavedInfo()) + 1) { 578 // Calculate the size of the frame managed by the libcall. The stack 579 // alignment of these libcalls should be the same as how we set it in 580 // getABIStackAlignment. 581 unsigned LibCallFrameSize = 582 alignTo((STI.getXLen() / 8) * LibCallRegs, getStackAlign()); 583 RVFI->setLibCallStackSize(LibCallFrameSize); 584 } 585 586 // FIXME (note copied from Lanai): This appears to be overallocating. Needs 587 // investigation. Get the number of bytes to allocate from the FrameInfo. 588 uint64_t RealStackSize = getStackSizeWithRVVPadding(MF); 589 uint64_t StackSize = RealStackSize - RVFI->getReservedSpillsSize(); 590 uint64_t RVVStackSize = RVFI->getRVVStackSize(); 591 592 // Early exit if there is no need to allocate on the stack 593 if (RealStackSize == 0 && !MFI.adjustsStack() && RVVStackSize == 0) 594 return; 595 596 // If the stack pointer has been marked as reserved, then produce an error if 597 // the frame requires stack allocation 598 if (STI.isRegisterReservedByUser(SPReg)) 599 MF.getFunction().getContext().diagnose(DiagnosticInfoUnsupported{ 600 MF.getFunction(), "Stack pointer required, but has been reserved."}); 601 602 uint64_t FirstSPAdjustAmount = getFirstSPAdjustAmount(MF); 603 // Split the SP adjustment to reduce the offsets of callee saved spill. 604 if (FirstSPAdjustAmount) { 605 StackSize = FirstSPAdjustAmount; 606 RealStackSize = FirstSPAdjustAmount; 607 } 608 609 if (RVFI->isPushable(MF) && FirstFrameSetup != MBB.end() && 610 FirstFrameSetup->getOpcode() == RISCV::CM_PUSH) { 611 // Use available stack adjustment in push instruction to allocate additional 612 // stack space. Align the stack size down to a multiple of 16. This is 613 // needed for RVE. 614 // FIXME: Can we increase the stack size to a multiple of 16 instead? 615 uint64_t Spimm = std::min(alignDown(StackSize, 16), (uint64_t)48); 616 FirstFrameSetup->getOperand(1).setImm(Spimm); 617 StackSize -= Spimm; 618 } 619 620 if (StackSize != 0) { 621 // Allocate space on the stack if necessary. 622 RI->adjustReg(MBB, MBBI, DL, SPReg, SPReg, 623 StackOffset::getFixed(-StackSize), MachineInstr::FrameSetup, 624 getStackAlign()); 625 } 626 627 // Emit ".cfi_def_cfa_offset RealStackSize" 628 unsigned CFIIndex = MF.addFrameInst( 629 MCCFIInstruction::cfiDefCfaOffset(nullptr, RealStackSize)); 630 BuildMI(MBB, MBBI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION)) 631 .addCFIIndex(CFIIndex) 632 .setMIFlag(MachineInstr::FrameSetup); 633 634 const auto &CSI = MFI.getCalleeSavedInfo(); 635 636 // The frame pointer is callee-saved, and code has been generated for us to 637 // save it to the stack. We need to skip over the storing of callee-saved 638 // registers as the frame pointer must be modified after it has been saved 639 // to the stack, not before. 640 // FIXME: assumes exactly one instruction is used to save each callee-saved 641 // register. 642 std::advance(MBBI, getUnmanagedCSI(MF, CSI).size()); 643 644 // Iterate over list of callee-saved registers and emit .cfi_offset 645 // directives. 646 for (const auto &Entry : CSI) { 647 int FrameIdx = Entry.getFrameIdx(); 648 if (FrameIdx >= 0 && 649 MFI.getStackID(FrameIdx) == TargetStackID::ScalableVector) 650 continue; 651 652 int64_t Offset = MFI.getObjectOffset(FrameIdx); 653 Register Reg = Entry.getReg(); 654 unsigned CFIIndex = MF.addFrameInst(MCCFIInstruction::createOffset( 655 nullptr, RI->getDwarfRegNum(Reg, true), Offset)); 656 BuildMI(MBB, MBBI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION)) 657 .addCFIIndex(CFIIndex) 658 .setMIFlag(MachineInstr::FrameSetup); 659 } 660 661 // Generate new FP. 662 if (hasFP(MF)) { 663 if (STI.isRegisterReservedByUser(FPReg)) 664 MF.getFunction().getContext().diagnose(DiagnosticInfoUnsupported{ 665 MF.getFunction(), "Frame pointer required, but has been reserved."}); 666 // The frame pointer does need to be reserved from register allocation. 667 assert(MF.getRegInfo().isReserved(FPReg) && "FP not reserved"); 668 669 RI->adjustReg(MBB, MBBI, DL, FPReg, SPReg, 670 StackOffset::getFixed(RealStackSize - RVFI->getVarArgsSaveSize()), 671 MachineInstr::FrameSetup, getStackAlign()); 672 673 // Emit ".cfi_def_cfa $fp, RVFI->getVarArgsSaveSize()" 674 unsigned CFIIndex = MF.addFrameInst(MCCFIInstruction::cfiDefCfa( 675 nullptr, RI->getDwarfRegNum(FPReg, true), RVFI->getVarArgsSaveSize())); 676 BuildMI(MBB, MBBI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION)) 677 .addCFIIndex(CFIIndex) 678 .setMIFlag(MachineInstr::FrameSetup); 679 } 680 681 // Emit the second SP adjustment after saving callee saved registers. 682 if (FirstSPAdjustAmount) { 683 uint64_t SecondSPAdjustAmount = 684 getStackSizeWithRVVPadding(MF) - FirstSPAdjustAmount; 685 assert(SecondSPAdjustAmount > 0 && 686 "SecondSPAdjustAmount should be greater than zero"); 687 RI->adjustReg(MBB, MBBI, DL, SPReg, SPReg, 688 StackOffset::getFixed(-SecondSPAdjustAmount), 689 MachineInstr::FrameSetup, getStackAlign()); 690 691 // If we are using a frame-pointer, and thus emitted ".cfi_def_cfa fp, 0", 692 // don't emit an sp-based .cfi_def_cfa_offset 693 if (!hasFP(MF)) { 694 // Emit ".cfi_def_cfa_offset StackSize" 695 unsigned CFIIndex = MF.addFrameInst(MCCFIInstruction::cfiDefCfaOffset( 696 nullptr, getStackSizeWithRVVPadding(MF))); 697 BuildMI(MBB, MBBI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION)) 698 .addCFIIndex(CFIIndex) 699 .setMIFlag(MachineInstr::FrameSetup); 700 } 701 } 702 703 if (RVVStackSize) { 704 adjustStackForRVV(MF, MBB, MBBI, DL, -RVVStackSize, 705 MachineInstr::FrameSetup); 706 if (!hasFP(MF)) { 707 // Emit .cfi_def_cfa_expression "sp + StackSize + RVVStackSize * vlenb". 708 unsigned CFIIndex = MF.addFrameInst(createDefCFAExpression( 709 *RI, SPReg, getStackSizeWithRVVPadding(MF), RVVStackSize / 8)); 710 BuildMI(MBB, MBBI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION)) 711 .addCFIIndex(CFIIndex) 712 .setMIFlag(MachineInstr::FrameSetup); 713 } 714 715 std::advance(MBBI, getRVVCalleeSavedInfo(MF, CSI).size()); 716 emitCalleeSavedRVVPrologCFI(MBB, MBBI, hasFP(MF)); 717 } 718 719 if (hasFP(MF)) { 720 // Realign Stack 721 const RISCVRegisterInfo *RI = STI.getRegisterInfo(); 722 if (RI->hasStackRealignment(MF)) { 723 Align MaxAlignment = MFI.getMaxAlign(); 724 725 const RISCVInstrInfo *TII = STI.getInstrInfo(); 726 if (isInt<12>(-(int)MaxAlignment.value())) { 727 BuildMI(MBB, MBBI, DL, TII->get(RISCV::ANDI), SPReg) 728 .addReg(SPReg) 729 .addImm(-(int)MaxAlignment.value()) 730 .setMIFlag(MachineInstr::FrameSetup); 731 } else { 732 unsigned ShiftAmount = Log2(MaxAlignment); 733 Register VR = 734 MF.getRegInfo().createVirtualRegister(&RISCV::GPRRegClass); 735 BuildMI(MBB, MBBI, DL, TII->get(RISCV::SRLI), VR) 736 .addReg(SPReg) 737 .addImm(ShiftAmount) 738 .setMIFlag(MachineInstr::FrameSetup); 739 BuildMI(MBB, MBBI, DL, TII->get(RISCV::SLLI), SPReg) 740 .addReg(VR) 741 .addImm(ShiftAmount) 742 .setMIFlag(MachineInstr::FrameSetup); 743 } 744 // FP will be used to restore the frame in the epilogue, so we need 745 // another base register BP to record SP after re-alignment. SP will 746 // track the current stack after allocating variable sized objects. 747 if (hasBP(MF)) { 748 // move BP, SP 749 BuildMI(MBB, MBBI, DL, TII->get(RISCV::ADDI), BPReg) 750 .addReg(SPReg) 751 .addImm(0) 752 .setMIFlag(MachineInstr::FrameSetup); 753 } 754 } 755 } 756 } 757 758 void RISCVFrameLowering::emitEpilogue(MachineFunction &MF, 759 MachineBasicBlock &MBB) const { 760 const RISCVRegisterInfo *RI = STI.getRegisterInfo(); 761 MachineFrameInfo &MFI = MF.getFrameInfo(); 762 auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>(); 763 Register FPReg = getFPReg(STI); 764 Register SPReg = getSPReg(STI); 765 766 // All calls are tail calls in GHC calling conv, and functions have no 767 // prologue/epilogue. 768 if (MF.getFunction().getCallingConv() == CallingConv::GHC) 769 return; 770 771 // Get the insert location for the epilogue. If there were no terminators in 772 // the block, get the last instruction. 773 MachineBasicBlock::iterator MBBI = MBB.end(); 774 DebugLoc DL; 775 if (!MBB.empty()) { 776 MBBI = MBB.getLastNonDebugInstr(); 777 if (MBBI != MBB.end()) 778 DL = MBBI->getDebugLoc(); 779 780 MBBI = MBB.getFirstTerminator(); 781 782 // If callee-saved registers are saved via libcall, place stack adjustment 783 // before this call. 784 while (MBBI != MBB.begin() && 785 std::prev(MBBI)->getFlag(MachineInstr::FrameDestroy)) 786 --MBBI; 787 } 788 789 const auto &CSI = getUnmanagedCSI(MF, MFI.getCalleeSavedInfo()); 790 791 // Skip to before the restores of scalar callee-saved registers 792 // FIXME: assumes exactly one instruction is used to restore each 793 // callee-saved register. 794 auto LastFrameDestroy = MBBI; 795 if (!CSI.empty()) 796 LastFrameDestroy = std::prev(MBBI, CSI.size()); 797 798 uint64_t RealStackSize = getStackSizeWithRVVPadding(MF); 799 uint64_t StackSize = RealStackSize - RVFI->getReservedSpillsSize(); 800 uint64_t FPOffset = RealStackSize - RVFI->getVarArgsSaveSize(); 801 uint64_t RVVStackSize = RVFI->getRVVStackSize(); 802 803 // Restore the stack pointer using the value of the frame pointer. Only 804 // necessary if the stack pointer was modified, meaning the stack size is 805 // unknown. 806 // 807 // In order to make sure the stack point is right through the EH region, 808 // we also need to restore stack pointer from the frame pointer if we 809 // don't preserve stack space within prologue/epilogue for outgoing variables, 810 // normally it's just checking the variable sized object is present or not 811 // is enough, but we also don't preserve that at prologue/epilogue when 812 // have vector objects in stack. 813 if (RI->hasStackRealignment(MF) || MFI.hasVarSizedObjects() || 814 !hasReservedCallFrame(MF)) { 815 assert(hasFP(MF) && "frame pointer should not have been eliminated"); 816 RI->adjustReg(MBB, LastFrameDestroy, DL, SPReg, FPReg, 817 StackOffset::getFixed(-FPOffset), 818 MachineInstr::FrameDestroy, getStackAlign()); 819 } else { 820 if (RVVStackSize) 821 adjustStackForRVV(MF, MBB, LastFrameDestroy, DL, RVVStackSize, 822 MachineInstr::FrameDestroy); 823 } 824 825 uint64_t FirstSPAdjustAmount = getFirstSPAdjustAmount(MF); 826 if (FirstSPAdjustAmount) { 827 uint64_t SecondSPAdjustAmount = 828 getStackSizeWithRVVPadding(MF) - FirstSPAdjustAmount; 829 assert(SecondSPAdjustAmount > 0 && 830 "SecondSPAdjustAmount should be greater than zero"); 831 832 RI->adjustReg(MBB, LastFrameDestroy, DL, SPReg, SPReg, 833 StackOffset::getFixed(SecondSPAdjustAmount), 834 MachineInstr::FrameDestroy, getStackAlign()); 835 } 836 837 if (FirstSPAdjustAmount) 838 StackSize = FirstSPAdjustAmount; 839 840 if (RVFI->isPushable(MF) && MBBI != MBB.end() && 841 MBBI->getOpcode() == RISCV::CM_POP) { 842 // Use available stack adjustment in pop instruction to deallocate stack 843 // space. Align the stack size down to a multiple of 16. This is needed for 844 // RVE. 845 // FIXME: Can we increase the stack size to a multiple of 16 instead? 846 uint64_t Spimm = std::min(alignDown(StackSize, 16), (uint64_t)48); 847 MBBI->getOperand(1).setImm(Spimm); 848 StackSize -= Spimm; 849 } 850 851 // Deallocate stack 852 if (StackSize != 0) { 853 RI->adjustReg(MBB, MBBI, DL, SPReg, SPReg, StackOffset::getFixed(StackSize), 854 MachineInstr::FrameDestroy, getStackAlign()); 855 } 856 857 // Emit epilogue for shadow call stack. 858 emitSCSEpilogue(MF, MBB, MBBI, DL); 859 } 860 861 StackOffset 862 RISCVFrameLowering::getFrameIndexReference(const MachineFunction &MF, int FI, 863 Register &FrameReg) const { 864 const MachineFrameInfo &MFI = MF.getFrameInfo(); 865 const TargetRegisterInfo *RI = MF.getSubtarget().getRegisterInfo(); 866 const auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>(); 867 868 // Callee-saved registers should be referenced relative to the stack 869 // pointer (positive offset), otherwise use the frame pointer (negative 870 // offset). 871 const auto &CSI = getUnmanagedCSI(MF, MFI.getCalleeSavedInfo()); 872 int MinCSFI = 0; 873 int MaxCSFI = -1; 874 StackOffset Offset; 875 auto StackID = MFI.getStackID(FI); 876 877 assert((StackID == TargetStackID::Default || 878 StackID == TargetStackID::ScalableVector) && 879 "Unexpected stack ID for the frame object."); 880 if (StackID == TargetStackID::Default) { 881 assert(getOffsetOfLocalArea() == 0 && "LocalAreaOffset is not 0!"); 882 Offset = StackOffset::getFixed(MFI.getObjectOffset(FI) + 883 MFI.getOffsetAdjustment()); 884 } else if (StackID == TargetStackID::ScalableVector) { 885 Offset = StackOffset::getScalable(MFI.getObjectOffset(FI)); 886 } 887 888 uint64_t FirstSPAdjustAmount = getFirstSPAdjustAmount(MF); 889 890 if (CSI.size()) { 891 MinCSFI = CSI[0].getFrameIdx(); 892 MaxCSFI = CSI[CSI.size() - 1].getFrameIdx(); 893 } 894 895 if (FI >= MinCSFI && FI <= MaxCSFI) { 896 FrameReg = RISCV::X2; 897 898 if (FirstSPAdjustAmount) 899 Offset += StackOffset::getFixed(FirstSPAdjustAmount); 900 else 901 Offset += StackOffset::getFixed(getStackSizeWithRVVPadding(MF)); 902 return Offset; 903 } 904 905 if (RI->hasStackRealignment(MF) && !MFI.isFixedObjectIndex(FI)) { 906 // If the stack was realigned, the frame pointer is set in order to allow 907 // SP to be restored, so we need another base register to record the stack 908 // after realignment. 909 // |--------------------------| -- <-- FP 910 // | callee-allocated save | | <----| 911 // | area for register varargs| | | 912 // |--------------------------| | | 913 // | callee-saved registers | | | 914 // |--------------------------| -- | 915 // | realignment (the size of | | | 916 // | this area is not counted | | | 917 // | in MFI.getStackSize()) | | | 918 // |--------------------------| -- |-- MFI.getStackSize() 919 // | RVV alignment padding | | | 920 // | (not counted in | | | 921 // | MFI.getStackSize() but | | | 922 // | counted in | | | 923 // | RVFI.getRVVStackSize()) | | | 924 // |--------------------------| -- | 925 // | RVV objects | | | 926 // | (not counted in | | | 927 // | MFI.getStackSize()) | | | 928 // |--------------------------| -- | 929 // | padding before RVV | | | 930 // | (not counted in | | | 931 // | MFI.getStackSize() or in | | | 932 // | RVFI.getRVVStackSize()) | | | 933 // |--------------------------| -- | 934 // | scalar local variables | | <----' 935 // |--------------------------| -- <-- BP (if var sized objects present) 936 // | VarSize objects | | 937 // |--------------------------| -- <-- SP 938 if (hasBP(MF)) { 939 FrameReg = RISCVABI::getBPReg(); 940 } else { 941 // VarSize objects must be empty in this case! 942 assert(!MFI.hasVarSizedObjects()); 943 FrameReg = RISCV::X2; 944 } 945 } else { 946 FrameReg = RI->getFrameRegister(MF); 947 } 948 949 if (FrameReg == getFPReg(STI)) { 950 Offset += StackOffset::getFixed(RVFI->getVarArgsSaveSize()); 951 // When using FP to access scalable vector objects, we need to minus 952 // the frame size. 953 // 954 // |--------------------------| -- <-- FP 955 // | callee-allocated save | | 956 // | area for register varargs| | 957 // |--------------------------| | 958 // | callee-saved registers | | 959 // |--------------------------| | MFI.getStackSize() 960 // | scalar local variables | | 961 // |--------------------------| -- (Offset of RVV objects is from here.) 962 // | RVV objects | 963 // |--------------------------| 964 // | VarSize objects | 965 // |--------------------------| <-- SP 966 if (MFI.getStackID(FI) == TargetStackID::ScalableVector) { 967 assert(!RI->hasStackRealignment(MF) && 968 "Can't index across variable sized realign"); 969 // We don't expect any extra RVV alignment padding, as the stack size 970 // and RVV object sections should be correct aligned in their own 971 // right. 972 assert(MFI.getStackSize() == getStackSizeWithRVVPadding(MF) && 973 "Inconsistent stack layout"); 974 Offset -= StackOffset::getFixed(MFI.getStackSize()); 975 } 976 return Offset; 977 } 978 979 // This case handles indexing off both SP and BP. 980 // If indexing off SP, there must not be any var sized objects 981 assert(FrameReg == RISCVABI::getBPReg() || !MFI.hasVarSizedObjects()); 982 983 // When using SP to access frame objects, we need to add RVV stack size. 984 // 985 // |--------------------------| -- <-- FP 986 // | callee-allocated save | | <----| 987 // | area for register varargs| | | 988 // |--------------------------| | | 989 // | callee-saved registers | | | 990 // |--------------------------| -- | 991 // | RVV alignment padding | | | 992 // | (not counted in | | | 993 // | MFI.getStackSize() but | | | 994 // | counted in | | | 995 // | RVFI.getRVVStackSize()) | | | 996 // |--------------------------| -- | 997 // | RVV objects | | |-- MFI.getStackSize() 998 // | (not counted in | | | 999 // | MFI.getStackSize()) | | | 1000 // |--------------------------| -- | 1001 // | padding before RVV | | | 1002 // | (not counted in | | | 1003 // | MFI.getStackSize()) | | | 1004 // |--------------------------| -- | 1005 // | scalar local variables | | <----' 1006 // |--------------------------| -- <-- BP (if var sized objects present) 1007 // | VarSize objects | | 1008 // |--------------------------| -- <-- SP 1009 // 1010 // The total amount of padding surrounding RVV objects is described by 1011 // RVV->getRVVPadding() and it can be zero. It allows us to align the RVV 1012 // objects to the required alignment. 1013 if (MFI.getStackID(FI) == TargetStackID::Default) { 1014 if (MFI.isFixedObjectIndex(FI)) { 1015 assert(!RI->hasStackRealignment(MF) && 1016 "Can't index across variable sized realign"); 1017 Offset += StackOffset::get(getStackSizeWithRVVPadding(MF), 1018 RVFI->getRVVStackSize()); 1019 } else { 1020 Offset += StackOffset::getFixed(MFI.getStackSize()); 1021 } 1022 } else if (MFI.getStackID(FI) == TargetStackID::ScalableVector) { 1023 // Ensure the base of the RVV stack is correctly aligned: add on the 1024 // alignment padding. 1025 int ScalarLocalVarSize = MFI.getStackSize() - 1026 RVFI->getCalleeSavedStackSize() - 1027 RVFI->getRVPushStackSize() - 1028 RVFI->getVarArgsSaveSize() + RVFI->getRVVPadding(); 1029 Offset += StackOffset::get(ScalarLocalVarSize, RVFI->getRVVStackSize()); 1030 } 1031 return Offset; 1032 } 1033 1034 void RISCVFrameLowering::determineCalleeSaves(MachineFunction &MF, 1035 BitVector &SavedRegs, 1036 RegScavenger *RS) const { 1037 TargetFrameLowering::determineCalleeSaves(MF, SavedRegs, RS); 1038 // Unconditionally spill RA and FP only if the function uses a frame 1039 // pointer. 1040 if (hasFP(MF)) { 1041 SavedRegs.set(RISCV::X1); 1042 SavedRegs.set(RISCV::X8); 1043 } 1044 // Mark BP as used if function has dedicated base pointer. 1045 if (hasBP(MF)) 1046 SavedRegs.set(RISCVABI::getBPReg()); 1047 1048 // When using cm.push/pop we must save X27 if we save X26. 1049 auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>(); 1050 if (RVFI->isPushable(MF) && SavedRegs.test(RISCV::X26)) 1051 SavedRegs.set(RISCV::X27); 1052 } 1053 1054 std::pair<int64_t, Align> 1055 RISCVFrameLowering::assignRVVStackObjectOffsets(MachineFunction &MF) const { 1056 MachineFrameInfo &MFI = MF.getFrameInfo(); 1057 // Create a buffer of RVV objects to allocate. 1058 SmallVector<int, 8> ObjectsToAllocate; 1059 auto pushRVVObjects = [&](int FIBegin, int FIEnd) { 1060 for (int I = FIBegin, E = FIEnd; I != E; ++I) { 1061 unsigned StackID = MFI.getStackID(I); 1062 if (StackID != TargetStackID::ScalableVector) 1063 continue; 1064 if (MFI.isDeadObjectIndex(I)) 1065 continue; 1066 1067 ObjectsToAllocate.push_back(I); 1068 } 1069 }; 1070 // First push RVV Callee Saved object, then push RVV stack object 1071 std::vector<CalleeSavedInfo> &CSI = MF.getFrameInfo().getCalleeSavedInfo(); 1072 const auto &RVVCSI = getRVVCalleeSavedInfo(MF, CSI); 1073 if (!RVVCSI.empty()) 1074 pushRVVObjects(RVVCSI[0].getFrameIdx(), 1075 RVVCSI[RVVCSI.size() - 1].getFrameIdx() + 1); 1076 pushRVVObjects(0, MFI.getObjectIndexEnd() - RVVCSI.size()); 1077 1078 // The minimum alignment is 16 bytes. 1079 Align RVVStackAlign(16); 1080 const auto &ST = MF.getSubtarget<RISCVSubtarget>(); 1081 1082 if (!ST.hasVInstructions()) { 1083 assert(ObjectsToAllocate.empty() && 1084 "Can't allocate scalable-vector objects without V instructions"); 1085 return std::make_pair(0, RVVStackAlign); 1086 } 1087 1088 // Allocate all RVV locals and spills 1089 int64_t Offset = 0; 1090 for (int FI : ObjectsToAllocate) { 1091 // ObjectSize in bytes. 1092 int64_t ObjectSize = MFI.getObjectSize(FI); 1093 auto ObjectAlign = std::max(Align(8), MFI.getObjectAlign(FI)); 1094 // If the data type is the fractional vector type, reserve one vector 1095 // register for it. 1096 if (ObjectSize < 8) 1097 ObjectSize = 8; 1098 Offset = alignTo(Offset + ObjectSize, ObjectAlign); 1099 MFI.setObjectOffset(FI, -Offset); 1100 // Update the maximum alignment of the RVV stack section 1101 RVVStackAlign = std::max(RVVStackAlign, ObjectAlign); 1102 } 1103 1104 // Ensure the alignment of the RVV stack. Since we want the most-aligned 1105 // object right at the bottom (i.e., any padding at the top of the frame), 1106 // readjust all RVV objects down by the alignment padding. 1107 uint64_t StackSize = Offset; 1108 if (auto AlignmentPadding = offsetToAlignment(StackSize, RVVStackAlign)) { 1109 StackSize += AlignmentPadding; 1110 for (int FI : ObjectsToAllocate) 1111 MFI.setObjectOffset(FI, MFI.getObjectOffset(FI) - AlignmentPadding); 1112 } 1113 1114 return std::make_pair(StackSize, RVVStackAlign); 1115 } 1116 1117 static unsigned getScavSlotsNumForRVV(MachineFunction &MF) { 1118 // For RVV spill, scalable stack offsets computing requires up to two scratch 1119 // registers 1120 static constexpr unsigned ScavSlotsNumRVVSpillScalableObject = 2; 1121 1122 // For RVV spill, non-scalable stack offsets computing requires up to one 1123 // scratch register. 1124 static constexpr unsigned ScavSlotsNumRVVSpillNonScalableObject = 1; 1125 1126 // ADDI instruction's destination register can be used for computing 1127 // offsets. So Scalable stack offsets require up to one scratch register. 1128 static constexpr unsigned ScavSlotsADDIScalableObject = 1; 1129 1130 static constexpr unsigned MaxScavSlotsNumKnown = 1131 std::max({ScavSlotsADDIScalableObject, ScavSlotsNumRVVSpillScalableObject, 1132 ScavSlotsNumRVVSpillNonScalableObject}); 1133 1134 unsigned MaxScavSlotsNum = 0; 1135 if (!MF.getSubtarget<RISCVSubtarget>().hasVInstructions()) 1136 return false; 1137 for (const MachineBasicBlock &MBB : MF) 1138 for (const MachineInstr &MI : MBB) { 1139 bool IsRVVSpill = RISCV::isRVVSpill(MI); 1140 for (auto &MO : MI.operands()) { 1141 if (!MO.isFI()) 1142 continue; 1143 bool IsScalableVectorID = MF.getFrameInfo().getStackID(MO.getIndex()) == 1144 TargetStackID::ScalableVector; 1145 if (IsRVVSpill) { 1146 MaxScavSlotsNum = std::max( 1147 MaxScavSlotsNum, IsScalableVectorID 1148 ? ScavSlotsNumRVVSpillScalableObject 1149 : ScavSlotsNumRVVSpillNonScalableObject); 1150 } else if (MI.getOpcode() == RISCV::ADDI && IsScalableVectorID) { 1151 MaxScavSlotsNum = 1152 std::max(MaxScavSlotsNum, ScavSlotsADDIScalableObject); 1153 } 1154 } 1155 if (MaxScavSlotsNum == MaxScavSlotsNumKnown) 1156 return MaxScavSlotsNumKnown; 1157 } 1158 return MaxScavSlotsNum; 1159 } 1160 1161 static bool hasRVVFrameObject(const MachineFunction &MF) { 1162 // Originally, the function will scan all the stack objects to check whether 1163 // if there is any scalable vector object on the stack or not. However, it 1164 // causes errors in the register allocator. In issue 53016, it returns false 1165 // before RA because there is no RVV stack objects. After RA, it returns true 1166 // because there are spilling slots for RVV values during RA. It will not 1167 // reserve BP during register allocation and generate BP access in the PEI 1168 // pass due to the inconsistent behavior of the function. 1169 // 1170 // The function is changed to use hasVInstructions() as the return value. It 1171 // is not precise, but it can make the register allocation correct. 1172 // 1173 // FIXME: Find a better way to make the decision or revisit the solution in 1174 // D103622. 1175 // 1176 // Refer to https://github.com/llvm/llvm-project/issues/53016. 1177 return MF.getSubtarget<RISCVSubtarget>().hasVInstructions(); 1178 } 1179 1180 static unsigned estimateFunctionSizeInBytes(const MachineFunction &MF, 1181 const RISCVInstrInfo &TII) { 1182 unsigned FnSize = 0; 1183 for (auto &MBB : MF) { 1184 for (auto &MI : MBB) { 1185 // Far branches over 20-bit offset will be relaxed in branch relaxation 1186 // pass. In the worst case, conditional branches will be relaxed into 1187 // the following instruction sequence. Unconditional branches are 1188 // relaxed in the same way, with the exception that there is no first 1189 // branch instruction. 1190 // 1191 // foo 1192 // bne t5, t6, .rev_cond # `TII->getInstSizeInBytes(MI)` bytes 1193 // sd s11, 0(sp) # 4 bytes, or 2 bytes in RVC 1194 // jump .restore, s11 # 8 bytes 1195 // .rev_cond 1196 // bar 1197 // j .dest_bb # 4 bytes, or 2 bytes in RVC 1198 // .restore: 1199 // ld s11, 0(sp) # 4 bytes, or 2 bytes in RVC 1200 // .dest: 1201 // baz 1202 if (MI.isConditionalBranch()) 1203 FnSize += TII.getInstSizeInBytes(MI); 1204 if (MI.isConditionalBranch() || MI.isUnconditionalBranch()) { 1205 if (MF.getSubtarget<RISCVSubtarget>().hasStdExtCOrZca()) 1206 FnSize += 2 + 8 + 2 + 2; 1207 else 1208 FnSize += 4 + 8 + 4 + 4; 1209 continue; 1210 } 1211 1212 FnSize += TII.getInstSizeInBytes(MI); 1213 } 1214 } 1215 return FnSize; 1216 } 1217 1218 void RISCVFrameLowering::processFunctionBeforeFrameFinalized( 1219 MachineFunction &MF, RegScavenger *RS) const { 1220 const RISCVRegisterInfo *RegInfo = 1221 MF.getSubtarget<RISCVSubtarget>().getRegisterInfo(); 1222 const RISCVInstrInfo *TII = MF.getSubtarget<RISCVSubtarget>().getInstrInfo(); 1223 MachineFrameInfo &MFI = MF.getFrameInfo(); 1224 const TargetRegisterClass *RC = &RISCV::GPRRegClass; 1225 auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>(); 1226 1227 int64_t RVVStackSize; 1228 Align RVVStackAlign; 1229 std::tie(RVVStackSize, RVVStackAlign) = assignRVVStackObjectOffsets(MF); 1230 1231 RVFI->setRVVStackSize(RVVStackSize); 1232 RVFI->setRVVStackAlign(RVVStackAlign); 1233 1234 if (hasRVVFrameObject(MF)) { 1235 // Ensure the entire stack is aligned to at least the RVV requirement: some 1236 // scalable-vector object alignments are not considered by the 1237 // target-independent code. 1238 MFI.ensureMaxAlignment(RVVStackAlign); 1239 } 1240 1241 unsigned ScavSlotsNum = 0; 1242 1243 // estimateStackSize has been observed to under-estimate the final stack 1244 // size, so give ourselves wiggle-room by checking for stack size 1245 // representable an 11-bit signed field rather than 12-bits. 1246 if (!isInt<11>(MFI.estimateStackSize(MF))) 1247 ScavSlotsNum = 1; 1248 1249 // Far branches over 20-bit offset require a spill slot for scratch register. 1250 bool IsLargeFunction = !isInt<20>(estimateFunctionSizeInBytes(MF, *TII)); 1251 if (IsLargeFunction) 1252 ScavSlotsNum = std::max(ScavSlotsNum, 1u); 1253 1254 // RVV loads & stores have no capacity to hold the immediate address offsets 1255 // so we must always reserve an emergency spill slot if the MachineFunction 1256 // contains any RVV spills. 1257 ScavSlotsNum = std::max(ScavSlotsNum, getScavSlotsNumForRVV(MF)); 1258 1259 for (unsigned I = 0; I < ScavSlotsNum; I++) { 1260 int FI = MFI.CreateStackObject(RegInfo->getSpillSize(*RC), 1261 RegInfo->getSpillAlign(*RC), false); 1262 RS->addScavengingFrameIndex(FI); 1263 1264 if (IsLargeFunction && RVFI->getBranchRelaxationScratchFrameIndex() == -1) 1265 RVFI->setBranchRelaxationScratchFrameIndex(FI); 1266 } 1267 1268 unsigned Size = RVFI->getReservedSpillsSize(); 1269 for (const auto &Info : MFI.getCalleeSavedInfo()) { 1270 int FrameIdx = Info.getFrameIdx(); 1271 if (FrameIdx < 0 || MFI.getStackID(FrameIdx) != TargetStackID::Default) 1272 continue; 1273 1274 Size += MFI.getObjectSize(FrameIdx); 1275 } 1276 RVFI->setCalleeSavedStackSize(Size); 1277 } 1278 1279 // Not preserve stack space within prologue for outgoing variables when the 1280 // function contains variable size objects or there are vector objects accessed 1281 // by the frame pointer. 1282 // Let eliminateCallFramePseudoInstr preserve stack space for it. 1283 bool RISCVFrameLowering::hasReservedCallFrame(const MachineFunction &MF) const { 1284 return !MF.getFrameInfo().hasVarSizedObjects() && 1285 !(hasFP(MF) && hasRVVFrameObject(MF)); 1286 } 1287 1288 // Eliminate ADJCALLSTACKDOWN, ADJCALLSTACKUP pseudo instructions. 1289 MachineBasicBlock::iterator RISCVFrameLowering::eliminateCallFramePseudoInstr( 1290 MachineFunction &MF, MachineBasicBlock &MBB, 1291 MachineBasicBlock::iterator MI) const { 1292 Register SPReg = RISCV::X2; 1293 DebugLoc DL = MI->getDebugLoc(); 1294 1295 if (!hasReservedCallFrame(MF)) { 1296 // If space has not been reserved for a call frame, ADJCALLSTACKDOWN and 1297 // ADJCALLSTACKUP must be converted to instructions manipulating the stack 1298 // pointer. This is necessary when there is a variable length stack 1299 // allocation (e.g. alloca), which means it's not possible to allocate 1300 // space for outgoing arguments from within the function prologue. 1301 int64_t Amount = MI->getOperand(0).getImm(); 1302 1303 if (Amount != 0) { 1304 // Ensure the stack remains aligned after adjustment. 1305 Amount = alignSPAdjust(Amount); 1306 1307 if (MI->getOpcode() == RISCV::ADJCALLSTACKDOWN) 1308 Amount = -Amount; 1309 1310 const RISCVRegisterInfo &RI = *STI.getRegisterInfo(); 1311 RI.adjustReg(MBB, MI, DL, SPReg, SPReg, StackOffset::getFixed(Amount), 1312 MachineInstr::NoFlags, getStackAlign()); 1313 } 1314 } 1315 1316 return MBB.erase(MI); 1317 } 1318 1319 // We would like to split the SP adjustment to reduce prologue/epilogue 1320 // as following instructions. In this way, the offset of the callee saved 1321 // register could fit in a single store. Supposed that the first sp adjust 1322 // amount is 2032. 1323 // add sp,sp,-2032 1324 // sw ra,2028(sp) 1325 // sw s0,2024(sp) 1326 // sw s1,2020(sp) 1327 // sw s3,2012(sp) 1328 // sw s4,2008(sp) 1329 // add sp,sp,-64 1330 uint64_t 1331 RISCVFrameLowering::getFirstSPAdjustAmount(const MachineFunction &MF) const { 1332 const auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>(); 1333 const MachineFrameInfo &MFI = MF.getFrameInfo(); 1334 const std::vector<CalleeSavedInfo> &CSI = MFI.getCalleeSavedInfo(); 1335 uint64_t StackSize = getStackSizeWithRVVPadding(MF); 1336 1337 // Disable SplitSPAdjust if save-restore libcall is used. The callee-saved 1338 // registers will be pushed by the save-restore libcalls, so we don't have to 1339 // split the SP adjustment in this case. 1340 if (RVFI->getReservedSpillsSize()) 1341 return 0; 1342 1343 // Return the FirstSPAdjustAmount if the StackSize can not fit in a signed 1344 // 12-bit and there exists a callee-saved register needing to be pushed. 1345 if (!isInt<12>(StackSize) && (CSI.size() > 0)) { 1346 // FirstSPAdjustAmount is chosen at most as (2048 - StackAlign) because 1347 // 2048 will cause sp = sp + 2048 in the epilogue to be split into multiple 1348 // instructions. Offsets smaller than 2048 can fit in a single load/store 1349 // instruction, and we have to stick with the stack alignment. 2048 has 1350 // 16-byte alignment. The stack alignment for RV32 and RV64 is 16 and for 1351 // RV32E it is 4. So (2048 - StackAlign) will satisfy the stack alignment. 1352 const uint64_t StackAlign = getStackAlign().value(); 1353 1354 // Amount of (2048 - StackAlign) will prevent callee saved and restored 1355 // instructions be compressed, so try to adjust the amount to the largest 1356 // offset that stack compression instructions accept when target supports 1357 // compression instructions. 1358 if (STI.hasStdExtCOrZca()) { 1359 // The compression extensions may support the following instructions: 1360 // riscv32: c.lwsp rd, offset[7:2] => 2^(6 + 2) 1361 // c.swsp rs2, offset[7:2] => 2^(6 + 2) 1362 // c.flwsp rd, offset[7:2] => 2^(6 + 2) 1363 // c.fswsp rs2, offset[7:2] => 2^(6 + 2) 1364 // riscv64: c.ldsp rd, offset[8:3] => 2^(6 + 3) 1365 // c.sdsp rs2, offset[8:3] => 2^(6 + 3) 1366 // c.fldsp rd, offset[8:3] => 2^(6 + 3) 1367 // c.fsdsp rs2, offset[8:3] => 2^(6 + 3) 1368 const uint64_t RVCompressLen = STI.getXLen() * 8; 1369 // Compared with amount (2048 - StackAlign), StackSize needs to 1370 // satisfy the following conditions to avoid using more instructions 1371 // to adjust the sp after adjusting the amount, such as 1372 // StackSize meets the condition (StackSize <= 2048 + RVCompressLen), 1373 // case1: Amount is 2048 - StackAlign: use addi + addi to adjust sp. 1374 // case2: Amount is RVCompressLen: use addi + addi to adjust sp. 1375 auto CanCompress = [&](uint64_t CompressLen) -> bool { 1376 if (StackSize <= 2047 + CompressLen || 1377 (StackSize > 2048 * 2 - StackAlign && 1378 StackSize <= 2047 * 2 + CompressLen) || 1379 StackSize > 2048 * 3 - StackAlign) 1380 return true; 1381 1382 return false; 1383 }; 1384 // In the epilogue, addi sp, sp, 496 is used to recover the sp and it 1385 // can be compressed(C.ADDI16SP, offset can be [-512, 496]), but 1386 // addi sp, sp, 512 can not be compressed. So try to use 496 first. 1387 const uint64_t ADDI16SPCompressLen = 496; 1388 if (STI.is64Bit() && CanCompress(ADDI16SPCompressLen)) 1389 return ADDI16SPCompressLen; 1390 if (CanCompress(RVCompressLen)) 1391 return RVCompressLen; 1392 } 1393 return 2048 - StackAlign; 1394 } 1395 return 0; 1396 } 1397 1398 bool RISCVFrameLowering::assignCalleeSavedSpillSlots( 1399 MachineFunction &MF, const TargetRegisterInfo *TRI, 1400 std::vector<CalleeSavedInfo> &CSI, unsigned &MinCSFrameIndex, 1401 unsigned &MaxCSFrameIndex) const { 1402 // Early exit if no callee saved registers are modified! 1403 if (CSI.empty()) 1404 return true; 1405 1406 auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>(); 1407 1408 if (RVFI->isPushable(MF)) { 1409 // Determine how many GPRs we need to push and save it to RVFI. 1410 Register MaxReg = getMaxPushPopReg(MF, CSI); 1411 if (MaxReg != RISCV::NoRegister) { 1412 auto [RegEnc, PushedRegNum] = getPushPopEncodingAndNum(MaxReg); 1413 RVFI->setRVPushRegs(PushedRegNum); 1414 RVFI->setRVPushStackSize(alignTo((STI.getXLen() / 8) * PushedRegNum, 16)); 1415 1416 // Use encoded number to represent registers to spill. 1417 RVFI->setRVPushRlist(RegEnc); 1418 } 1419 } 1420 1421 MachineFrameInfo &MFI = MF.getFrameInfo(); 1422 const TargetRegisterInfo *RegInfo = MF.getSubtarget().getRegisterInfo(); 1423 1424 for (auto &CS : CSI) { 1425 unsigned Reg = CS.getReg(); 1426 const TargetRegisterClass *RC = RegInfo->getMinimalPhysRegClass(Reg); 1427 unsigned Size = RegInfo->getSpillSize(*RC); 1428 1429 // This might need a fixed stack slot. 1430 if (RVFI->useSaveRestoreLibCalls(MF) || RVFI->isPushable(MF)) { 1431 const auto *FII = llvm::find_if( 1432 FixedCSRFIMap, [&](auto P) { return P.first == CS.getReg(); }); 1433 if (FII != std::end(FixedCSRFIMap)) { 1434 int64_t Offset; 1435 if (RVFI->isPushable(MF)) 1436 Offset = -((FII->second + RVFI->getRVPushRegs() + 1) * (int64_t)Size); 1437 else 1438 Offset = FII->second * (int64_t)Size; 1439 1440 int FrameIdx = MFI.CreateFixedSpillStackObject(Size, Offset); 1441 assert(FrameIdx < 0); 1442 CS.setFrameIdx(FrameIdx); 1443 continue; 1444 } 1445 } 1446 1447 // Not a fixed slot. 1448 Align Alignment = RegInfo->getSpillAlign(*RC); 1449 // We may not be able to satisfy the desired alignment specification of 1450 // the TargetRegisterClass if the stack alignment is smaller. Use the 1451 // min. 1452 Alignment = std::min(Alignment, getStackAlign()); 1453 int FrameIdx = MFI.CreateStackObject(Size, Alignment, true); 1454 if ((unsigned)FrameIdx < MinCSFrameIndex) 1455 MinCSFrameIndex = FrameIdx; 1456 if ((unsigned)FrameIdx > MaxCSFrameIndex) 1457 MaxCSFrameIndex = FrameIdx; 1458 CS.setFrameIdx(FrameIdx); 1459 } 1460 1461 // Allocate a fixed object that covers the full push or libcall size. 1462 if (RVFI->isPushable(MF)) { 1463 if (int64_t PushSize = RVFI->getRVPushStackSize()) 1464 MFI.CreateFixedSpillStackObject(PushSize, -PushSize); 1465 } else if (int LibCallRegs = getLibCallID(MF, CSI) + 1) { 1466 int64_t LibCallFrameSize = 1467 alignTo((STI.getXLen() / 8) * LibCallRegs, getStackAlign()); 1468 MFI.CreateFixedSpillStackObject(LibCallFrameSize, -LibCallFrameSize); 1469 } 1470 1471 return true; 1472 } 1473 1474 bool RISCVFrameLowering::spillCalleeSavedRegisters( 1475 MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, 1476 ArrayRef<CalleeSavedInfo> CSI, const TargetRegisterInfo *TRI) const { 1477 if (CSI.empty()) 1478 return true; 1479 1480 MachineFunction *MF = MBB.getParent(); 1481 const TargetInstrInfo &TII = *MF->getSubtarget().getInstrInfo(); 1482 DebugLoc DL; 1483 if (MI != MBB.end() && !MI->isDebugInstr()) 1484 DL = MI->getDebugLoc(); 1485 1486 // Emit CM.PUSH with base SPimm & evaluate Push stack 1487 RISCVMachineFunctionInfo *RVFI = MF->getInfo<RISCVMachineFunctionInfo>(); 1488 if (RVFI->isPushable(*MF)) { 1489 unsigned PushedRegNum = RVFI->getRVPushRegs(); 1490 if (PushedRegNum > 0) { 1491 // Use encoded number to represent registers to spill. 1492 int RegEnc = RVFI->getRVPushRlist(); 1493 MachineInstrBuilder PushBuilder = 1494 BuildMI(MBB, MI, DL, TII.get(RISCV::CM_PUSH)) 1495 .setMIFlag(MachineInstr::FrameSetup); 1496 PushBuilder.addImm((int64_t)RegEnc); 1497 PushBuilder.addImm(0); 1498 1499 for (unsigned i = 0; i < PushedRegNum; i++) 1500 PushBuilder.addUse(FixedCSRFIMap[i].first, RegState::Implicit); 1501 } 1502 } else if (const char *SpillLibCall = getSpillLibCallName(*MF, CSI)) { 1503 // Add spill libcall via non-callee-saved register t0. 1504 BuildMI(MBB, MI, DL, TII.get(RISCV::PseudoCALLReg), RISCV::X5) 1505 .addExternalSymbol(SpillLibCall, RISCVII::MO_CALL) 1506 .setMIFlag(MachineInstr::FrameSetup); 1507 1508 // Add registers spilled in libcall as liveins. 1509 for (auto &CS : CSI) 1510 MBB.addLiveIn(CS.getReg()); 1511 } 1512 1513 // Manually spill values not spilled by libcall & Push/Pop. 1514 const auto &UnmanagedCSI = getUnmanagedCSI(*MF, CSI); 1515 const auto &RVVCSI = getRVVCalleeSavedInfo(*MF, CSI); 1516 1517 auto storeRegToStackSlot = [&](decltype(UnmanagedCSI) CSInfo) { 1518 for (auto &CS : CSInfo) { 1519 // Insert the spill to the stack frame. 1520 Register Reg = CS.getReg(); 1521 const TargetRegisterClass *RC = TRI->getMinimalPhysRegClass(Reg); 1522 TII.storeRegToStackSlot(MBB, MI, Reg, !MBB.isLiveIn(Reg), 1523 CS.getFrameIdx(), RC, TRI, Register()); 1524 } 1525 }; 1526 storeRegToStackSlot(UnmanagedCSI); 1527 storeRegToStackSlot(RVVCSI); 1528 1529 return true; 1530 } 1531 1532 void RISCVFrameLowering::emitCalleeSavedRVVPrologCFI( 1533 MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, bool HasFP) const { 1534 MachineFunction *MF = MBB.getParent(); 1535 const MachineFrameInfo &MFI = MF->getFrameInfo(); 1536 RISCVMachineFunctionInfo *RVFI = MF->getInfo<RISCVMachineFunctionInfo>(); 1537 const TargetInstrInfo &TII = *STI.getInstrInfo(); 1538 DebugLoc DL = MBB.findDebugLoc(MI); 1539 1540 const auto &RVVCSI = getRVVCalleeSavedInfo(*MF, MFI.getCalleeSavedInfo()); 1541 if (RVVCSI.empty()) 1542 return; 1543 1544 uint64_t FixedSize = getStackSizeWithRVVPadding(*MF); 1545 if (!HasFP) { 1546 uint64_t ScalarLocalVarSize = 1547 MFI.getStackSize() - RVFI->getCalleeSavedStackSize() - 1548 RVFI->getRVPushStackSize() - RVFI->getVarArgsSaveSize() + 1549 RVFI->getRVVPadding(); 1550 FixedSize -= ScalarLocalVarSize; 1551 } 1552 1553 for (auto &CS : RVVCSI) { 1554 // Insert the spill to the stack frame. 1555 int FI = CS.getFrameIdx(); 1556 if (FI >= 0 && MFI.getStackID(FI) == TargetStackID::ScalableVector) { 1557 unsigned CFIIndex = MF->addFrameInst( 1558 createDefCFAOffset(*STI.getRegisterInfo(), CS.getReg(), -FixedSize, 1559 MFI.getObjectOffset(FI) / 8)); 1560 BuildMI(MBB, MI, DL, TII.get(TargetOpcode::CFI_INSTRUCTION)) 1561 .addCFIIndex(CFIIndex) 1562 .setMIFlag(MachineInstr::FrameSetup); 1563 } 1564 } 1565 } 1566 1567 bool RISCVFrameLowering::restoreCalleeSavedRegisters( 1568 MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, 1569 MutableArrayRef<CalleeSavedInfo> CSI, const TargetRegisterInfo *TRI) const { 1570 if (CSI.empty()) 1571 return true; 1572 1573 MachineFunction *MF = MBB.getParent(); 1574 const TargetInstrInfo &TII = *MF->getSubtarget().getInstrInfo(); 1575 DebugLoc DL; 1576 if (MI != MBB.end() && !MI->isDebugInstr()) 1577 DL = MI->getDebugLoc(); 1578 1579 // Manually restore values not restored by libcall & Push/Pop. 1580 // Reverse the restore order in epilog. In addition, the return 1581 // address will be restored first in the epilogue. It increases 1582 // the opportunity to avoid the load-to-use data hazard between 1583 // loading RA and return by RA. loadRegFromStackSlot can insert 1584 // multiple instructions. 1585 const auto &UnmanagedCSI = getUnmanagedCSI(*MF, CSI); 1586 const auto &RVVCSI = getRVVCalleeSavedInfo(*MF, CSI); 1587 1588 auto loadRegFromStackSlot = [&](decltype(UnmanagedCSI) CSInfo) { 1589 for (auto &CS : CSInfo) { 1590 Register Reg = CS.getReg(); 1591 const TargetRegisterClass *RC = TRI->getMinimalPhysRegClass(Reg); 1592 TII.loadRegFromStackSlot(MBB, MI, Reg, CS.getFrameIdx(), RC, TRI, 1593 Register()); 1594 assert(MI != MBB.begin() && 1595 "loadRegFromStackSlot didn't insert any code!"); 1596 } 1597 }; 1598 loadRegFromStackSlot(RVVCSI); 1599 loadRegFromStackSlot(UnmanagedCSI); 1600 1601 RISCVMachineFunctionInfo *RVFI = MF->getInfo<RISCVMachineFunctionInfo>(); 1602 if (RVFI->isPushable(*MF)) { 1603 int RegEnc = RVFI->getRVPushRlist(); 1604 if (RegEnc != llvm::RISCVZC::RLISTENCODE::INVALID_RLIST) { 1605 MachineInstrBuilder PopBuilder = 1606 BuildMI(MBB, MI, DL, TII.get(RISCV::CM_POP)) 1607 .setMIFlag(MachineInstr::FrameDestroy); 1608 // Use encoded number to represent registers to restore. 1609 PopBuilder.addImm(RegEnc); 1610 PopBuilder.addImm(0); 1611 1612 for (unsigned i = 0; i < RVFI->getRVPushRegs(); i++) 1613 PopBuilder.addDef(FixedCSRFIMap[i].first, RegState::ImplicitDefine); 1614 } 1615 } else { 1616 const char *RestoreLibCall = getRestoreLibCallName(*MF, CSI); 1617 if (RestoreLibCall) { 1618 // Add restore libcall via tail call. 1619 MachineBasicBlock::iterator NewMI = 1620 BuildMI(MBB, MI, DL, TII.get(RISCV::PseudoTAIL)) 1621 .addExternalSymbol(RestoreLibCall, RISCVII::MO_CALL) 1622 .setMIFlag(MachineInstr::FrameDestroy); 1623 1624 // Remove trailing returns, since the terminator is now a tail call to the 1625 // restore function. 1626 if (MI != MBB.end() && MI->getOpcode() == RISCV::PseudoRET) { 1627 NewMI->copyImplicitOps(*MF, *MI); 1628 MI->eraseFromParent(); 1629 } 1630 } 1631 } 1632 return true; 1633 } 1634 1635 bool RISCVFrameLowering::enableShrinkWrapping(const MachineFunction &MF) const { 1636 // Keep the conventional code flow when not optimizing. 1637 if (MF.getFunction().hasOptNone()) 1638 return false; 1639 1640 return true; 1641 } 1642 1643 bool RISCVFrameLowering::canUseAsPrologue(const MachineBasicBlock &MBB) const { 1644 MachineBasicBlock *TmpMBB = const_cast<MachineBasicBlock *>(&MBB); 1645 const MachineFunction *MF = MBB.getParent(); 1646 const auto *RVFI = MF->getInfo<RISCVMachineFunctionInfo>(); 1647 1648 if (!RVFI->useSaveRestoreLibCalls(*MF)) 1649 return true; 1650 1651 // Inserting a call to a __riscv_save libcall requires the use of the register 1652 // t0 (X5) to hold the return address. Therefore if this register is already 1653 // used we can't insert the call. 1654 1655 RegScavenger RS; 1656 RS.enterBasicBlock(*TmpMBB); 1657 return !RS.isRegUsed(RISCV::X5); 1658 } 1659 1660 bool RISCVFrameLowering::canUseAsEpilogue(const MachineBasicBlock &MBB) const { 1661 const MachineFunction *MF = MBB.getParent(); 1662 MachineBasicBlock *TmpMBB = const_cast<MachineBasicBlock *>(&MBB); 1663 const auto *RVFI = MF->getInfo<RISCVMachineFunctionInfo>(); 1664 1665 if (!RVFI->useSaveRestoreLibCalls(*MF)) 1666 return true; 1667 1668 // Using the __riscv_restore libcalls to restore CSRs requires a tail call. 1669 // This means if we still need to continue executing code within this function 1670 // the restore cannot take place in this basic block. 1671 1672 if (MBB.succ_size() > 1) 1673 return false; 1674 1675 MachineBasicBlock *SuccMBB = 1676 MBB.succ_empty() ? TmpMBB->getFallThrough() : *MBB.succ_begin(); 1677 1678 // Doing a tail call should be safe if there are no successors, because either 1679 // we have a returning block or the end of the block is unreachable, so the 1680 // restore will be eliminated regardless. 1681 if (!SuccMBB) 1682 return true; 1683 1684 // The successor can only contain a return, since we would effectively be 1685 // replacing the successor with our own tail return at the end of our block. 1686 return SuccMBB->isReturnBlock() && SuccMBB->size() == 1; 1687 } 1688 1689 bool RISCVFrameLowering::isSupportedStackID(TargetStackID::Value ID) const { 1690 switch (ID) { 1691 case TargetStackID::Default: 1692 case TargetStackID::ScalableVector: 1693 return true; 1694 case TargetStackID::NoAlloc: 1695 case TargetStackID::SGPRSpill: 1696 case TargetStackID::WasmLocal: 1697 return false; 1698 } 1699 llvm_unreachable("Invalid TargetStackID::Value"); 1700 } 1701 1702 TargetStackID::Value RISCVFrameLowering::getStackIDForScalableVectors() const { 1703 return TargetStackID::ScalableVector; 1704 } 1705