1 //===-- RISCVFrameLowering.cpp - RISC-V Frame Information -----------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file contains the RISC-V implementation of TargetFrameLowering class.
10 //
11 //===----------------------------------------------------------------------===//
12
13 #include "RISCVFrameLowering.h"
14 #include "RISCVMachineFunctionInfo.h"
15 #include "RISCVSubtarget.h"
16 #include "llvm/BinaryFormat/Dwarf.h"
17 #include "llvm/CodeGen/MachineFrameInfo.h"
18 #include "llvm/CodeGen/MachineFunction.h"
19 #include "llvm/CodeGen/MachineInstrBuilder.h"
20 #include "llvm/CodeGen/MachineRegisterInfo.h"
21 #include "llvm/CodeGen/RegisterScavenging.h"
22 #include "llvm/IR/DiagnosticInfo.h"
23 #include "llvm/MC/MCDwarf.h"
24 #include "llvm/Support/LEB128.h"
25
26 #include <algorithm>
27
28 using namespace llvm;
29
getABIStackAlignment(RISCVABI::ABI ABI)30 static Align getABIStackAlignment(RISCVABI::ABI ABI) {
31 if (ABI == RISCVABI::ABI_ILP32E)
32 return Align(4);
33 if (ABI == RISCVABI::ABI_LP64E)
34 return Align(8);
35 return Align(16);
36 }
37
RISCVFrameLowering(const RISCVSubtarget & STI)38 RISCVFrameLowering::RISCVFrameLowering(const RISCVSubtarget &STI)
39 : TargetFrameLowering(
40 StackGrowsDown, getABIStackAlignment(STI.getTargetABI()),
41 /*LocalAreaOffset=*/0,
42 /*TransientStackAlignment=*/getABIStackAlignment(STI.getTargetABI())),
43 STI(STI) {}
44
45 // Offsets which need to be scale by XLen representing locations of CSRs which
46 // are given a fixed location by save/restore libcalls or Zcmp Push/Pop.
47 static const std::pair<MCPhysReg, int8_t> FixedCSRFIMap[] = {
48 {/*ra*/ RISCV::X1, -1}, {/*s0*/ RISCV::X8, -2},
49 {/*s1*/ RISCV::X9, -3}, {/*s2*/ RISCV::X18, -4},
50 {/*s3*/ RISCV::X19, -5}, {/*s4*/ RISCV::X20, -6},
51 {/*s5*/ RISCV::X21, -7}, {/*s6*/ RISCV::X22, -8},
52 {/*s7*/ RISCV::X23, -9}, {/*s8*/ RISCV::X24, -10},
53 {/*s9*/ RISCV::X25, -11}, {/*s10*/ RISCV::X26, -12},
54 {/*s11*/ RISCV::X27, -13}};
55
56 // For now we use x3, a.k.a gp, as pointer to shadow call stack.
57 // User should not use x3 in their asm.
emitSCSPrologue(MachineFunction & MF,MachineBasicBlock & MBB,MachineBasicBlock::iterator MI,const DebugLoc & DL)58 static void emitSCSPrologue(MachineFunction &MF, MachineBasicBlock &MBB,
59 MachineBasicBlock::iterator MI,
60 const DebugLoc &DL) {
61 if (!MF.getFunction().hasFnAttribute(Attribute::ShadowCallStack))
62 return;
63
64 const auto &STI = MF.getSubtarget<RISCVSubtarget>();
65 const llvm::RISCVRegisterInfo *TRI = STI.getRegisterInfo();
66 Register RAReg = TRI->getRARegister();
67
68 // Do not save RA to the SCS if it's not saved to the regular stack,
69 // i.e. RA is not at risk of being overwritten.
70 std::vector<CalleeSavedInfo> &CSI = MF.getFrameInfo().getCalleeSavedInfo();
71 if (llvm::none_of(
72 CSI, [&](CalleeSavedInfo &CSR) { return CSR.getReg() == RAReg; }))
73 return;
74
75 const RISCVInstrInfo *TII = STI.getInstrInfo();
76 if (!STI.hasForcedSWShadowStack() && STI.hasStdExtZicfiss()) {
77 BuildMI(MBB, MI, DL, TII->get(RISCV::SSPUSH)).addReg(RAReg);
78 return;
79 }
80
81 Register SCSPReg = RISCVABI::getSCSPReg();
82
83 bool IsRV64 = STI.hasFeature(RISCV::Feature64Bit);
84 int64_t SlotSize = STI.getXLen() / 8;
85 // Store return address to shadow call stack
86 // addi gp, gp, [4|8]
87 // s[w|d] ra, -[4|8](gp)
88 BuildMI(MBB, MI, DL, TII->get(RISCV::ADDI))
89 .addReg(SCSPReg, RegState::Define)
90 .addReg(SCSPReg)
91 .addImm(SlotSize)
92 .setMIFlag(MachineInstr::FrameSetup);
93 BuildMI(MBB, MI, DL, TII->get(IsRV64 ? RISCV::SD : RISCV::SW))
94 .addReg(RAReg)
95 .addReg(SCSPReg)
96 .addImm(-SlotSize)
97 .setMIFlag(MachineInstr::FrameSetup);
98
99 // Emit a CFI instruction that causes SlotSize to be subtracted from the value
100 // of the shadow stack pointer when unwinding past this frame.
101 char DwarfSCSReg = TRI->getDwarfRegNum(SCSPReg, /*IsEH*/ true);
102 assert(DwarfSCSReg < 32 && "SCS Register should be < 32 (X3).");
103
104 char Offset = static_cast<char>(-SlotSize) & 0x7f;
105 const char CFIInst[] = {
106 dwarf::DW_CFA_val_expression,
107 DwarfSCSReg, // register
108 2, // length
109 static_cast<char>(unsigned(dwarf::DW_OP_breg0 + DwarfSCSReg)),
110 Offset, // addend (sleb128)
111 };
112
113 unsigned CFIIndex = MF.addFrameInst(MCCFIInstruction::createEscape(
114 nullptr, StringRef(CFIInst, sizeof(CFIInst))));
115 BuildMI(MBB, MI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION))
116 .addCFIIndex(CFIIndex)
117 .setMIFlag(MachineInstr::FrameSetup);
118 }
119
emitSCSEpilogue(MachineFunction & MF,MachineBasicBlock & MBB,MachineBasicBlock::iterator MI,const DebugLoc & DL)120 static void emitSCSEpilogue(MachineFunction &MF, MachineBasicBlock &MBB,
121 MachineBasicBlock::iterator MI,
122 const DebugLoc &DL) {
123 if (!MF.getFunction().hasFnAttribute(Attribute::ShadowCallStack))
124 return;
125
126 const auto &STI = MF.getSubtarget<RISCVSubtarget>();
127 Register RAReg = STI.getRegisterInfo()->getRARegister();
128
129 // See emitSCSPrologue() above.
130 std::vector<CalleeSavedInfo> &CSI = MF.getFrameInfo().getCalleeSavedInfo();
131 if (llvm::none_of(
132 CSI, [&](CalleeSavedInfo &CSR) { return CSR.getReg() == RAReg; }))
133 return;
134
135 const RISCVInstrInfo *TII = STI.getInstrInfo();
136 if (!STI.hasForcedSWShadowStack() && STI.hasStdExtZicfiss()) {
137 BuildMI(MBB, MI, DL, TII->get(RISCV::SSPOPCHK)).addReg(RAReg);
138 return;
139 }
140
141 Register SCSPReg = RISCVABI::getSCSPReg();
142
143 bool IsRV64 = STI.hasFeature(RISCV::Feature64Bit);
144 int64_t SlotSize = STI.getXLen() / 8;
145 // Load return address from shadow call stack
146 // l[w|d] ra, -[4|8](gp)
147 // addi gp, gp, -[4|8]
148 BuildMI(MBB, MI, DL, TII->get(IsRV64 ? RISCV::LD : RISCV::LW))
149 .addReg(RAReg, RegState::Define)
150 .addReg(SCSPReg)
151 .addImm(-SlotSize)
152 .setMIFlag(MachineInstr::FrameDestroy);
153 BuildMI(MBB, MI, DL, TII->get(RISCV::ADDI))
154 .addReg(SCSPReg, RegState::Define)
155 .addReg(SCSPReg)
156 .addImm(-SlotSize)
157 .setMIFlag(MachineInstr::FrameDestroy);
158 // Restore the SCS pointer
159 unsigned CFIIndex = MF.addFrameInst(MCCFIInstruction::createRestore(
160 nullptr, STI.getRegisterInfo()->getDwarfRegNum(SCSPReg, /*IsEH*/ true)));
161 BuildMI(MBB, MI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION))
162 .addCFIIndex(CFIIndex)
163 .setMIFlags(MachineInstr::FrameDestroy);
164 }
165
166 // Get the ID of the libcall used for spilling and restoring callee saved
167 // registers. The ID is representative of the number of registers saved or
168 // restored by the libcall, except it is zero-indexed - ID 0 corresponds to a
169 // single register.
getLibCallID(const MachineFunction & MF,const std::vector<CalleeSavedInfo> & CSI)170 static int getLibCallID(const MachineFunction &MF,
171 const std::vector<CalleeSavedInfo> &CSI) {
172 const auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>();
173
174 if (CSI.empty() || !RVFI->useSaveRestoreLibCalls(MF))
175 return -1;
176
177 Register MaxReg = RISCV::NoRegister;
178 for (auto &CS : CSI)
179 // assignCalleeSavedSpillSlots assigns negative frame indexes to
180 // registers which can be saved by libcall.
181 if (CS.getFrameIdx() < 0)
182 MaxReg = std::max(MaxReg.id(), CS.getReg().id());
183
184 if (MaxReg == RISCV::NoRegister)
185 return -1;
186
187 switch (MaxReg) {
188 default:
189 llvm_unreachable("Something has gone wrong!");
190 case /*s11*/ RISCV::X27: return 12;
191 case /*s10*/ RISCV::X26: return 11;
192 case /*s9*/ RISCV::X25: return 10;
193 case /*s8*/ RISCV::X24: return 9;
194 case /*s7*/ RISCV::X23: return 8;
195 case /*s6*/ RISCV::X22: return 7;
196 case /*s5*/ RISCV::X21: return 6;
197 case /*s4*/ RISCV::X20: return 5;
198 case /*s3*/ RISCV::X19: return 4;
199 case /*s2*/ RISCV::X18: return 3;
200 case /*s1*/ RISCV::X9: return 2;
201 case /*s0*/ RISCV::X8: return 1;
202 case /*ra*/ RISCV::X1: return 0;
203 }
204 }
205
206 // Get the name of the libcall used for spilling callee saved registers.
207 // If this function will not use save/restore libcalls, then return a nullptr.
208 static const char *
getSpillLibCallName(const MachineFunction & MF,const std::vector<CalleeSavedInfo> & CSI)209 getSpillLibCallName(const MachineFunction &MF,
210 const std::vector<CalleeSavedInfo> &CSI) {
211 static const char *const SpillLibCalls[] = {
212 "__riscv_save_0",
213 "__riscv_save_1",
214 "__riscv_save_2",
215 "__riscv_save_3",
216 "__riscv_save_4",
217 "__riscv_save_5",
218 "__riscv_save_6",
219 "__riscv_save_7",
220 "__riscv_save_8",
221 "__riscv_save_9",
222 "__riscv_save_10",
223 "__riscv_save_11",
224 "__riscv_save_12"
225 };
226
227 int LibCallID = getLibCallID(MF, CSI);
228 if (LibCallID == -1)
229 return nullptr;
230 return SpillLibCalls[LibCallID];
231 }
232
233 // Get the name of the libcall used for restoring callee saved registers.
234 // If this function will not use save/restore libcalls, then return a nullptr.
235 static const char *
getRestoreLibCallName(const MachineFunction & MF,const std::vector<CalleeSavedInfo> & CSI)236 getRestoreLibCallName(const MachineFunction &MF,
237 const std::vector<CalleeSavedInfo> &CSI) {
238 static const char *const RestoreLibCalls[] = {
239 "__riscv_restore_0",
240 "__riscv_restore_1",
241 "__riscv_restore_2",
242 "__riscv_restore_3",
243 "__riscv_restore_4",
244 "__riscv_restore_5",
245 "__riscv_restore_6",
246 "__riscv_restore_7",
247 "__riscv_restore_8",
248 "__riscv_restore_9",
249 "__riscv_restore_10",
250 "__riscv_restore_11",
251 "__riscv_restore_12"
252 };
253
254 int LibCallID = getLibCallID(MF, CSI);
255 if (LibCallID == -1)
256 return nullptr;
257 return RestoreLibCalls[LibCallID];
258 }
259
260 // Return encoded value and register count for PUSH/POP instruction,
261 // representing registers to store/load.
262 static std::pair<unsigned, unsigned>
getPushPopEncodingAndNum(const Register MaxReg)263 getPushPopEncodingAndNum(const Register MaxReg) {
264 switch (MaxReg) {
265 default:
266 llvm_unreachable("Unexpected Reg for Push/Pop Inst");
267 case RISCV::X27: /*s11*/
268 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S11, 13);
269 case RISCV::X25: /*s9*/
270 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S9, 11);
271 case RISCV::X24: /*s8*/
272 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S8, 10);
273 case RISCV::X23: /*s7*/
274 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S7, 9);
275 case RISCV::X22: /*s6*/
276 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S6, 8);
277 case RISCV::X21: /*s5*/
278 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S5, 7);
279 case RISCV::X20: /*s4*/
280 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S4, 6);
281 case RISCV::X19: /*s3*/
282 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S3, 5);
283 case RISCV::X18: /*s2*/
284 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S2, 4);
285 case RISCV::X9: /*s1*/
286 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0_S1, 3);
287 case RISCV::X8: /*s0*/
288 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA_S0, 2);
289 case RISCV::X1: /*ra*/
290 return std::make_pair(llvm::RISCVZC::RLISTENCODE::RA, 1);
291 }
292 }
293
294 // Get the max reg of Push/Pop for restoring callee saved registers.
getMaxPushPopReg(const MachineFunction & MF,const std::vector<CalleeSavedInfo> & CSI)295 static Register getMaxPushPopReg(const MachineFunction &MF,
296 const std::vector<CalleeSavedInfo> &CSI) {
297 Register MaxPushPopReg = RISCV::NoRegister;
298 for (auto &CS : CSI) {
299 if (llvm::find_if(FixedCSRFIMap, [&](auto P) {
300 return P.first == CS.getReg();
301 }) != std::end(FixedCSRFIMap))
302 MaxPushPopReg = std::max(MaxPushPopReg.id(), CS.getReg().id());
303 }
304 assert(MaxPushPopReg != RISCV::X26 && "x26 requires x27 to also be pushed");
305 return MaxPushPopReg;
306 }
307
308 // Return true if the specified function should have a dedicated frame
309 // pointer register. This is true if frame pointer elimination is
310 // disabled, if it needs dynamic stack realignment, if the function has
311 // variable sized allocas, or if the frame address is taken.
hasFP(const MachineFunction & MF) const312 bool RISCVFrameLowering::hasFP(const MachineFunction &MF) const {
313 const TargetRegisterInfo *RegInfo = MF.getSubtarget().getRegisterInfo();
314
315 const MachineFrameInfo &MFI = MF.getFrameInfo();
316 return MF.getTarget().Options.DisableFramePointerElim(MF) ||
317 RegInfo->hasStackRealignment(MF) || MFI.hasVarSizedObjects() ||
318 MFI.isFrameAddressTaken();
319 }
320
hasBP(const MachineFunction & MF) const321 bool RISCVFrameLowering::hasBP(const MachineFunction &MF) const {
322 const MachineFrameInfo &MFI = MF.getFrameInfo();
323 const TargetRegisterInfo *TRI = STI.getRegisterInfo();
324
325 // If we do not reserve stack space for outgoing arguments in prologue,
326 // we will adjust the stack pointer before call instruction. After the
327 // adjustment, we can not use SP to access the stack objects for the
328 // arguments. Instead, use BP to access these stack objects.
329 return (MFI.hasVarSizedObjects() ||
330 (!hasReservedCallFrame(MF) && (!MFI.isMaxCallFrameSizeComputed() ||
331 MFI.getMaxCallFrameSize() != 0))) &&
332 TRI->hasStackRealignment(MF);
333 }
334
335 // Determines the size of the frame and maximum call frame size.
determineFrameLayout(MachineFunction & MF) const336 void RISCVFrameLowering::determineFrameLayout(MachineFunction &MF) const {
337 MachineFrameInfo &MFI = MF.getFrameInfo();
338 auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>();
339
340 // Get the number of bytes to allocate from the FrameInfo.
341 uint64_t FrameSize = MFI.getStackSize();
342
343 // Get the alignment.
344 Align StackAlign = getStackAlign();
345
346 // Make sure the frame is aligned.
347 FrameSize = alignTo(FrameSize, StackAlign);
348
349 // Update frame info.
350 MFI.setStackSize(FrameSize);
351
352 // When using SP or BP to access stack objects, we may require extra padding
353 // to ensure the bottom of the RVV stack is correctly aligned within the main
354 // stack. We calculate this as the amount required to align the scalar local
355 // variable section up to the RVV alignment.
356 const TargetRegisterInfo *TRI = STI.getRegisterInfo();
357 if (RVFI->getRVVStackSize() && (!hasFP(MF) || TRI->hasStackRealignment(MF))) {
358 int ScalarLocalVarSize = FrameSize - RVFI->getCalleeSavedStackSize() -
359 RVFI->getVarArgsSaveSize();
360 if (auto RVVPadding =
361 offsetToAlignment(ScalarLocalVarSize, RVFI->getRVVStackAlign()))
362 RVFI->setRVVPadding(RVVPadding);
363 }
364 }
365
366 // Returns the stack size including RVV padding (when required), rounded back
367 // up to the required stack alignment.
getStackSizeWithRVVPadding(const MachineFunction & MF) const368 uint64_t RISCVFrameLowering::getStackSizeWithRVVPadding(
369 const MachineFunction &MF) const {
370 const MachineFrameInfo &MFI = MF.getFrameInfo();
371 auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>();
372 return alignTo(MFI.getStackSize() + RVFI->getRVVPadding(), getStackAlign());
373 }
374
375 // Returns the register used to hold the frame pointer.
getFPReg(const RISCVSubtarget & STI)376 static Register getFPReg(const RISCVSubtarget &STI) { return RISCV::X8; }
377
378 // Returns the register used to hold the stack pointer.
getSPReg(const RISCVSubtarget & STI)379 static Register getSPReg(const RISCVSubtarget &STI) { return RISCV::X2; }
380
381 static SmallVector<CalleeSavedInfo, 8>
getUnmanagedCSI(const MachineFunction & MF,const std::vector<CalleeSavedInfo> & CSI)382 getUnmanagedCSI(const MachineFunction &MF,
383 const std::vector<CalleeSavedInfo> &CSI) {
384 const MachineFrameInfo &MFI = MF.getFrameInfo();
385 SmallVector<CalleeSavedInfo, 8> NonLibcallCSI;
386
387 for (auto &CS : CSI) {
388 int FI = CS.getFrameIdx();
389 if (FI >= 0 && MFI.getStackID(FI) == TargetStackID::Default)
390 NonLibcallCSI.push_back(CS);
391 }
392
393 return NonLibcallCSI;
394 }
395
396 static SmallVector<CalleeSavedInfo, 8>
getRVVCalleeSavedInfo(const MachineFunction & MF,const std::vector<CalleeSavedInfo> & CSI)397 getRVVCalleeSavedInfo(const MachineFunction &MF,
398 const std::vector<CalleeSavedInfo> &CSI) {
399 const MachineFrameInfo &MFI = MF.getFrameInfo();
400 SmallVector<CalleeSavedInfo, 8> RVVCSI;
401
402 for (auto &CS : CSI) {
403 int FI = CS.getFrameIdx();
404 if (FI >= 0 && MFI.getStackID(FI) == TargetStackID::ScalableVector)
405 RVVCSI.push_back(CS);
406 }
407
408 return RVVCSI;
409 }
410
adjustStackForRVV(MachineFunction & MF,MachineBasicBlock & MBB,MachineBasicBlock::iterator MBBI,const DebugLoc & DL,int64_t Amount,MachineInstr::MIFlag Flag) const411 void RISCVFrameLowering::adjustStackForRVV(MachineFunction &MF,
412 MachineBasicBlock &MBB,
413 MachineBasicBlock::iterator MBBI,
414 const DebugLoc &DL, int64_t Amount,
415 MachineInstr::MIFlag Flag) const {
416 assert(Amount != 0 && "Did not need to adjust stack pointer for RVV.");
417
418 const Register SPReg = getSPReg(STI);
419
420 // Optimize compile time offset case
421 StackOffset Offset = StackOffset::getScalable(Amount);
422 if (auto VLEN = STI.getRealVLen()) {
423 // 1. Multiply the number of v-slots by the (constant) length of register
424 const int64_t VLENB = *VLEN / 8;
425 assert(Amount % 8 == 0 &&
426 "Reserve the stack by the multiple of one vector size.");
427 const int64_t NumOfVReg = Amount / 8;
428 const int64_t FixedOffset = NumOfVReg * VLENB;
429 if (!isInt<32>(FixedOffset)) {
430 report_fatal_error(
431 "Frame size outside of the signed 32-bit range not supported");
432 }
433 Offset = StackOffset::getFixed(FixedOffset);
434 }
435
436 const RISCVRegisterInfo &RI = *STI.getRegisterInfo();
437 // We must keep the stack pointer aligned through any intermediate
438 // updates.
439 RI.adjustReg(MBB, MBBI, DL, SPReg, SPReg, Offset,
440 Flag, getStackAlign());
441 }
442
appendScalableVectorExpression(const TargetRegisterInfo & TRI,SmallVectorImpl<char> & Expr,int FixedOffset,int ScalableOffset,llvm::raw_string_ostream & Comment)443 static void appendScalableVectorExpression(const TargetRegisterInfo &TRI,
444 SmallVectorImpl<char> &Expr,
445 int FixedOffset, int ScalableOffset,
446 llvm::raw_string_ostream &Comment) {
447 unsigned DwarfVLenB = TRI.getDwarfRegNum(RISCV::VLENB, true);
448 uint8_t Buffer[16];
449 if (FixedOffset) {
450 Expr.push_back(dwarf::DW_OP_consts);
451 Expr.append(Buffer, Buffer + encodeSLEB128(FixedOffset, Buffer));
452 Expr.push_back((uint8_t)dwarf::DW_OP_plus);
453 Comment << (FixedOffset < 0 ? " - " : " + ") << std::abs(FixedOffset);
454 }
455
456 Expr.push_back((uint8_t)dwarf::DW_OP_consts);
457 Expr.append(Buffer, Buffer + encodeSLEB128(ScalableOffset, Buffer));
458
459 Expr.push_back((uint8_t)dwarf::DW_OP_bregx);
460 Expr.append(Buffer, Buffer + encodeULEB128(DwarfVLenB, Buffer));
461 Expr.push_back(0);
462
463 Expr.push_back((uint8_t)dwarf::DW_OP_mul);
464 Expr.push_back((uint8_t)dwarf::DW_OP_plus);
465
466 Comment << (ScalableOffset < 0 ? " - " : " + ") << std::abs(ScalableOffset)
467 << " * vlenb";
468 }
469
createDefCFAExpression(const TargetRegisterInfo & TRI,Register Reg,uint64_t FixedOffset,uint64_t ScalableOffset)470 static MCCFIInstruction createDefCFAExpression(const TargetRegisterInfo &TRI,
471 Register Reg,
472 uint64_t FixedOffset,
473 uint64_t ScalableOffset) {
474 assert(ScalableOffset != 0 && "Did not need to adjust CFA for RVV");
475 SmallString<64> Expr;
476 std::string CommentBuffer;
477 llvm::raw_string_ostream Comment(CommentBuffer);
478 // Build up the expression (Reg + FixedOffset + ScalableOffset * VLENB).
479 unsigned DwarfReg = TRI.getDwarfRegNum(Reg, true);
480 Expr.push_back((uint8_t)(dwarf::DW_OP_breg0 + DwarfReg));
481 Expr.push_back(0);
482 if (Reg == RISCV::X2)
483 Comment << "sp";
484 else
485 Comment << printReg(Reg, &TRI);
486
487 appendScalableVectorExpression(TRI, Expr, FixedOffset, ScalableOffset,
488 Comment);
489
490 SmallString<64> DefCfaExpr;
491 uint8_t Buffer[16];
492 DefCfaExpr.push_back(dwarf::DW_CFA_def_cfa_expression);
493 DefCfaExpr.append(Buffer, Buffer + encodeULEB128(Expr.size(), Buffer));
494 DefCfaExpr.append(Expr.str());
495
496 return MCCFIInstruction::createEscape(nullptr, DefCfaExpr.str(), SMLoc(),
497 Comment.str());
498 }
499
createDefCFAOffset(const TargetRegisterInfo & TRI,Register Reg,uint64_t FixedOffset,uint64_t ScalableOffset)500 static MCCFIInstruction createDefCFAOffset(const TargetRegisterInfo &TRI,
501 Register Reg, uint64_t FixedOffset,
502 uint64_t ScalableOffset) {
503 assert(ScalableOffset != 0 && "Did not need to adjust CFA for RVV");
504 SmallString<64> Expr;
505 std::string CommentBuffer;
506 llvm::raw_string_ostream Comment(CommentBuffer);
507 Comment << printReg(Reg, &TRI) << " @ cfa";
508
509 // Build up the expression (FixedOffset + ScalableOffset * VLENB).
510 appendScalableVectorExpression(TRI, Expr, FixedOffset, ScalableOffset,
511 Comment);
512
513 SmallString<64> DefCfaExpr;
514 uint8_t Buffer[16];
515 unsigned DwarfReg = TRI.getDwarfRegNum(Reg, true);
516 DefCfaExpr.push_back(dwarf::DW_CFA_expression);
517 DefCfaExpr.append(Buffer, Buffer + encodeULEB128(DwarfReg, Buffer));
518 DefCfaExpr.append(Buffer, Buffer + encodeULEB128(Expr.size(), Buffer));
519 DefCfaExpr.append(Expr.str());
520
521 return MCCFIInstruction::createEscape(nullptr, DefCfaExpr.str(), SMLoc(),
522 Comment.str());
523 }
524
emitPrologue(MachineFunction & MF,MachineBasicBlock & MBB) const525 void RISCVFrameLowering::emitPrologue(MachineFunction &MF,
526 MachineBasicBlock &MBB) const {
527 MachineFrameInfo &MFI = MF.getFrameInfo();
528 auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>();
529 const RISCVRegisterInfo *RI = STI.getRegisterInfo();
530 const RISCVInstrInfo *TII = STI.getInstrInfo();
531 MachineBasicBlock::iterator MBBI = MBB.begin();
532
533 Register FPReg = getFPReg(STI);
534 Register SPReg = getSPReg(STI);
535 Register BPReg = RISCVABI::getBPReg();
536
537 // Debug location must be unknown since the first debug location is used
538 // to determine the end of the prologue.
539 DebugLoc DL;
540
541 // All calls are tail calls in GHC calling conv, and functions have no
542 // prologue/epilogue.
543 if (MF.getFunction().getCallingConv() == CallingConv::GHC)
544 return;
545
546 // Emit prologue for shadow call stack.
547 emitSCSPrologue(MF, MBB, MBBI, DL);
548
549 auto FirstFrameSetup = MBBI;
550
551 // Since spillCalleeSavedRegisters may have inserted a libcall, skip past
552 // any instructions marked as FrameSetup
553 while (MBBI != MBB.end() && MBBI->getFlag(MachineInstr::FrameSetup))
554 ++MBBI;
555
556 // Determine the correct frame layout
557 determineFrameLayout(MF);
558
559 // If libcalls are used to spill and restore callee-saved registers, the frame
560 // has two sections; the opaque section managed by the libcalls, and the
561 // section managed by MachineFrameInfo which can also hold callee saved
562 // registers in fixed stack slots, both of which have negative frame indices.
563 // This gets even more complicated when incoming arguments are passed via the
564 // stack, as these too have negative frame indices. An example is detailed
565 // below:
566 //
567 // | incoming arg | <- FI[-3]
568 // | libcallspill |
569 // | calleespill | <- FI[-2]
570 // | calleespill | <- FI[-1]
571 // | this_frame | <- FI[0]
572 //
573 // For negative frame indices, the offset from the frame pointer will differ
574 // depending on which of these groups the frame index applies to.
575 // The following calculates the correct offset knowing the number of callee
576 // saved registers spilt by the two methods.
577 if (int LibCallRegs = getLibCallID(MF, MFI.getCalleeSavedInfo()) + 1) {
578 // Calculate the size of the frame managed by the libcall. The stack
579 // alignment of these libcalls should be the same as how we set it in
580 // getABIStackAlignment.
581 unsigned LibCallFrameSize =
582 alignTo((STI.getXLen() / 8) * LibCallRegs, getStackAlign());
583 RVFI->setLibCallStackSize(LibCallFrameSize);
584 }
585
586 // FIXME (note copied from Lanai): This appears to be overallocating. Needs
587 // investigation. Get the number of bytes to allocate from the FrameInfo.
588 uint64_t RealStackSize = getStackSizeWithRVVPadding(MF);
589 uint64_t StackSize = RealStackSize - RVFI->getReservedSpillsSize();
590 uint64_t RVVStackSize = RVFI->getRVVStackSize();
591
592 // Early exit if there is no need to allocate on the stack
593 if (RealStackSize == 0 && !MFI.adjustsStack() && RVVStackSize == 0)
594 return;
595
596 // If the stack pointer has been marked as reserved, then produce an error if
597 // the frame requires stack allocation
598 if (STI.isRegisterReservedByUser(SPReg))
599 MF.getFunction().getContext().diagnose(DiagnosticInfoUnsupported{
600 MF.getFunction(), "Stack pointer required, but has been reserved."});
601
602 uint64_t FirstSPAdjustAmount = getFirstSPAdjustAmount(MF);
603 // Split the SP adjustment to reduce the offsets of callee saved spill.
604 if (FirstSPAdjustAmount) {
605 StackSize = FirstSPAdjustAmount;
606 RealStackSize = FirstSPAdjustAmount;
607 }
608
609 if (RVFI->isPushable(MF) && FirstFrameSetup != MBB.end() &&
610 FirstFrameSetup->getOpcode() == RISCV::CM_PUSH) {
611 // Use available stack adjustment in push instruction to allocate additional
612 // stack space. Align the stack size down to a multiple of 16. This is
613 // needed for RVE.
614 // FIXME: Can we increase the stack size to a multiple of 16 instead?
615 uint64_t Spimm = std::min(alignDown(StackSize, 16), (uint64_t)48);
616 FirstFrameSetup->getOperand(1).setImm(Spimm);
617 StackSize -= Spimm;
618 }
619
620 if (StackSize != 0) {
621 // Allocate space on the stack if necessary.
622 RI->adjustReg(MBB, MBBI, DL, SPReg, SPReg,
623 StackOffset::getFixed(-StackSize), MachineInstr::FrameSetup,
624 getStackAlign());
625 }
626
627 // Emit ".cfi_def_cfa_offset RealStackSize"
628 unsigned CFIIndex = MF.addFrameInst(
629 MCCFIInstruction::cfiDefCfaOffset(nullptr, RealStackSize));
630 BuildMI(MBB, MBBI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION))
631 .addCFIIndex(CFIIndex)
632 .setMIFlag(MachineInstr::FrameSetup);
633
634 const auto &CSI = MFI.getCalleeSavedInfo();
635
636 // The frame pointer is callee-saved, and code has been generated for us to
637 // save it to the stack. We need to skip over the storing of callee-saved
638 // registers as the frame pointer must be modified after it has been saved
639 // to the stack, not before.
640 // FIXME: assumes exactly one instruction is used to save each callee-saved
641 // register.
642 std::advance(MBBI, getUnmanagedCSI(MF, CSI).size());
643
644 // Iterate over list of callee-saved registers and emit .cfi_offset
645 // directives.
646 for (const auto &Entry : CSI) {
647 int FrameIdx = Entry.getFrameIdx();
648 if (FrameIdx >= 0 &&
649 MFI.getStackID(FrameIdx) == TargetStackID::ScalableVector)
650 continue;
651
652 int64_t Offset = MFI.getObjectOffset(FrameIdx);
653 Register Reg = Entry.getReg();
654 unsigned CFIIndex = MF.addFrameInst(MCCFIInstruction::createOffset(
655 nullptr, RI->getDwarfRegNum(Reg, true), Offset));
656 BuildMI(MBB, MBBI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION))
657 .addCFIIndex(CFIIndex)
658 .setMIFlag(MachineInstr::FrameSetup);
659 }
660
661 // Generate new FP.
662 if (hasFP(MF)) {
663 if (STI.isRegisterReservedByUser(FPReg))
664 MF.getFunction().getContext().diagnose(DiagnosticInfoUnsupported{
665 MF.getFunction(), "Frame pointer required, but has been reserved."});
666 // The frame pointer does need to be reserved from register allocation.
667 assert(MF.getRegInfo().isReserved(FPReg) && "FP not reserved");
668
669 RI->adjustReg(MBB, MBBI, DL, FPReg, SPReg,
670 StackOffset::getFixed(RealStackSize - RVFI->getVarArgsSaveSize()),
671 MachineInstr::FrameSetup, getStackAlign());
672
673 // Emit ".cfi_def_cfa $fp, RVFI->getVarArgsSaveSize()"
674 unsigned CFIIndex = MF.addFrameInst(MCCFIInstruction::cfiDefCfa(
675 nullptr, RI->getDwarfRegNum(FPReg, true), RVFI->getVarArgsSaveSize()));
676 BuildMI(MBB, MBBI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION))
677 .addCFIIndex(CFIIndex)
678 .setMIFlag(MachineInstr::FrameSetup);
679 }
680
681 // Emit the second SP adjustment after saving callee saved registers.
682 if (FirstSPAdjustAmount) {
683 uint64_t SecondSPAdjustAmount =
684 getStackSizeWithRVVPadding(MF) - FirstSPAdjustAmount;
685 assert(SecondSPAdjustAmount > 0 &&
686 "SecondSPAdjustAmount should be greater than zero");
687 RI->adjustReg(MBB, MBBI, DL, SPReg, SPReg,
688 StackOffset::getFixed(-SecondSPAdjustAmount),
689 MachineInstr::FrameSetup, getStackAlign());
690
691 // If we are using a frame-pointer, and thus emitted ".cfi_def_cfa fp, 0",
692 // don't emit an sp-based .cfi_def_cfa_offset
693 if (!hasFP(MF)) {
694 // Emit ".cfi_def_cfa_offset StackSize"
695 unsigned CFIIndex = MF.addFrameInst(MCCFIInstruction::cfiDefCfaOffset(
696 nullptr, getStackSizeWithRVVPadding(MF)));
697 BuildMI(MBB, MBBI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION))
698 .addCFIIndex(CFIIndex)
699 .setMIFlag(MachineInstr::FrameSetup);
700 }
701 }
702
703 if (RVVStackSize) {
704 adjustStackForRVV(MF, MBB, MBBI, DL, -RVVStackSize,
705 MachineInstr::FrameSetup);
706 if (!hasFP(MF)) {
707 // Emit .cfi_def_cfa_expression "sp + StackSize + RVVStackSize * vlenb".
708 unsigned CFIIndex = MF.addFrameInst(createDefCFAExpression(
709 *RI, SPReg, getStackSizeWithRVVPadding(MF), RVVStackSize / 8));
710 BuildMI(MBB, MBBI, DL, TII->get(TargetOpcode::CFI_INSTRUCTION))
711 .addCFIIndex(CFIIndex)
712 .setMIFlag(MachineInstr::FrameSetup);
713 }
714
715 std::advance(MBBI, getRVVCalleeSavedInfo(MF, CSI).size());
716 emitCalleeSavedRVVPrologCFI(MBB, MBBI, hasFP(MF));
717 }
718
719 if (hasFP(MF)) {
720 // Realign Stack
721 const RISCVRegisterInfo *RI = STI.getRegisterInfo();
722 if (RI->hasStackRealignment(MF)) {
723 Align MaxAlignment = MFI.getMaxAlign();
724
725 const RISCVInstrInfo *TII = STI.getInstrInfo();
726 if (isInt<12>(-(int)MaxAlignment.value())) {
727 BuildMI(MBB, MBBI, DL, TII->get(RISCV::ANDI), SPReg)
728 .addReg(SPReg)
729 .addImm(-(int)MaxAlignment.value())
730 .setMIFlag(MachineInstr::FrameSetup);
731 } else {
732 unsigned ShiftAmount = Log2(MaxAlignment);
733 Register VR =
734 MF.getRegInfo().createVirtualRegister(&RISCV::GPRRegClass);
735 BuildMI(MBB, MBBI, DL, TII->get(RISCV::SRLI), VR)
736 .addReg(SPReg)
737 .addImm(ShiftAmount)
738 .setMIFlag(MachineInstr::FrameSetup);
739 BuildMI(MBB, MBBI, DL, TII->get(RISCV::SLLI), SPReg)
740 .addReg(VR)
741 .addImm(ShiftAmount)
742 .setMIFlag(MachineInstr::FrameSetup);
743 }
744 // FP will be used to restore the frame in the epilogue, so we need
745 // another base register BP to record SP after re-alignment. SP will
746 // track the current stack after allocating variable sized objects.
747 if (hasBP(MF)) {
748 // move BP, SP
749 BuildMI(MBB, MBBI, DL, TII->get(RISCV::ADDI), BPReg)
750 .addReg(SPReg)
751 .addImm(0)
752 .setMIFlag(MachineInstr::FrameSetup);
753 }
754 }
755 }
756 }
757
emitEpilogue(MachineFunction & MF,MachineBasicBlock & MBB) const758 void RISCVFrameLowering::emitEpilogue(MachineFunction &MF,
759 MachineBasicBlock &MBB) const {
760 const RISCVRegisterInfo *RI = STI.getRegisterInfo();
761 MachineFrameInfo &MFI = MF.getFrameInfo();
762 auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>();
763 Register FPReg = getFPReg(STI);
764 Register SPReg = getSPReg(STI);
765
766 // All calls are tail calls in GHC calling conv, and functions have no
767 // prologue/epilogue.
768 if (MF.getFunction().getCallingConv() == CallingConv::GHC)
769 return;
770
771 // Get the insert location for the epilogue. If there were no terminators in
772 // the block, get the last instruction.
773 MachineBasicBlock::iterator MBBI = MBB.end();
774 DebugLoc DL;
775 if (!MBB.empty()) {
776 MBBI = MBB.getLastNonDebugInstr();
777 if (MBBI != MBB.end())
778 DL = MBBI->getDebugLoc();
779
780 MBBI = MBB.getFirstTerminator();
781
782 // If callee-saved registers are saved via libcall, place stack adjustment
783 // before this call.
784 while (MBBI != MBB.begin() &&
785 std::prev(MBBI)->getFlag(MachineInstr::FrameDestroy))
786 --MBBI;
787 }
788
789 const auto &CSI = getUnmanagedCSI(MF, MFI.getCalleeSavedInfo());
790
791 // Skip to before the restores of scalar callee-saved registers
792 // FIXME: assumes exactly one instruction is used to restore each
793 // callee-saved register.
794 auto LastFrameDestroy = MBBI;
795 if (!CSI.empty())
796 LastFrameDestroy = std::prev(MBBI, CSI.size());
797
798 uint64_t RealStackSize = getStackSizeWithRVVPadding(MF);
799 uint64_t StackSize = RealStackSize - RVFI->getReservedSpillsSize();
800 uint64_t FPOffset = RealStackSize - RVFI->getVarArgsSaveSize();
801 uint64_t RVVStackSize = RVFI->getRVVStackSize();
802
803 // Restore the stack pointer using the value of the frame pointer. Only
804 // necessary if the stack pointer was modified, meaning the stack size is
805 // unknown.
806 //
807 // In order to make sure the stack point is right through the EH region,
808 // we also need to restore stack pointer from the frame pointer if we
809 // don't preserve stack space within prologue/epilogue for outgoing variables,
810 // normally it's just checking the variable sized object is present or not
811 // is enough, but we also don't preserve that at prologue/epilogue when
812 // have vector objects in stack.
813 if (RI->hasStackRealignment(MF) || MFI.hasVarSizedObjects() ||
814 !hasReservedCallFrame(MF)) {
815 assert(hasFP(MF) && "frame pointer should not have been eliminated");
816 RI->adjustReg(MBB, LastFrameDestroy, DL, SPReg, FPReg,
817 StackOffset::getFixed(-FPOffset),
818 MachineInstr::FrameDestroy, getStackAlign());
819 } else {
820 if (RVVStackSize)
821 adjustStackForRVV(MF, MBB, LastFrameDestroy, DL, RVVStackSize,
822 MachineInstr::FrameDestroy);
823 }
824
825 uint64_t FirstSPAdjustAmount = getFirstSPAdjustAmount(MF);
826 if (FirstSPAdjustAmount) {
827 uint64_t SecondSPAdjustAmount =
828 getStackSizeWithRVVPadding(MF) - FirstSPAdjustAmount;
829 assert(SecondSPAdjustAmount > 0 &&
830 "SecondSPAdjustAmount should be greater than zero");
831
832 RI->adjustReg(MBB, LastFrameDestroy, DL, SPReg, SPReg,
833 StackOffset::getFixed(SecondSPAdjustAmount),
834 MachineInstr::FrameDestroy, getStackAlign());
835 }
836
837 if (FirstSPAdjustAmount)
838 StackSize = FirstSPAdjustAmount;
839
840 if (RVFI->isPushable(MF) && MBBI != MBB.end() &&
841 MBBI->getOpcode() == RISCV::CM_POP) {
842 // Use available stack adjustment in pop instruction to deallocate stack
843 // space. Align the stack size down to a multiple of 16. This is needed for
844 // RVE.
845 // FIXME: Can we increase the stack size to a multiple of 16 instead?
846 uint64_t Spimm = std::min(alignDown(StackSize, 16), (uint64_t)48);
847 MBBI->getOperand(1).setImm(Spimm);
848 StackSize -= Spimm;
849 }
850
851 // Deallocate stack
852 if (StackSize != 0) {
853 RI->adjustReg(MBB, MBBI, DL, SPReg, SPReg, StackOffset::getFixed(StackSize),
854 MachineInstr::FrameDestroy, getStackAlign());
855 }
856
857 // Emit epilogue for shadow call stack.
858 emitSCSEpilogue(MF, MBB, MBBI, DL);
859 }
860
861 StackOffset
getFrameIndexReference(const MachineFunction & MF,int FI,Register & FrameReg) const862 RISCVFrameLowering::getFrameIndexReference(const MachineFunction &MF, int FI,
863 Register &FrameReg) const {
864 const MachineFrameInfo &MFI = MF.getFrameInfo();
865 const TargetRegisterInfo *RI = MF.getSubtarget().getRegisterInfo();
866 const auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>();
867
868 // Callee-saved registers should be referenced relative to the stack
869 // pointer (positive offset), otherwise use the frame pointer (negative
870 // offset).
871 const auto &CSI = getUnmanagedCSI(MF, MFI.getCalleeSavedInfo());
872 int MinCSFI = 0;
873 int MaxCSFI = -1;
874 StackOffset Offset;
875 auto StackID = MFI.getStackID(FI);
876
877 assert((StackID == TargetStackID::Default ||
878 StackID == TargetStackID::ScalableVector) &&
879 "Unexpected stack ID for the frame object.");
880 if (StackID == TargetStackID::Default) {
881 assert(getOffsetOfLocalArea() == 0 && "LocalAreaOffset is not 0!");
882 Offset = StackOffset::getFixed(MFI.getObjectOffset(FI) +
883 MFI.getOffsetAdjustment());
884 } else if (StackID == TargetStackID::ScalableVector) {
885 Offset = StackOffset::getScalable(MFI.getObjectOffset(FI));
886 }
887
888 uint64_t FirstSPAdjustAmount = getFirstSPAdjustAmount(MF);
889
890 if (CSI.size()) {
891 MinCSFI = CSI[0].getFrameIdx();
892 MaxCSFI = CSI[CSI.size() - 1].getFrameIdx();
893 }
894
895 if (FI >= MinCSFI && FI <= MaxCSFI) {
896 FrameReg = RISCV::X2;
897
898 if (FirstSPAdjustAmount)
899 Offset += StackOffset::getFixed(FirstSPAdjustAmount);
900 else
901 Offset += StackOffset::getFixed(getStackSizeWithRVVPadding(MF));
902 return Offset;
903 }
904
905 if (RI->hasStackRealignment(MF) && !MFI.isFixedObjectIndex(FI)) {
906 // If the stack was realigned, the frame pointer is set in order to allow
907 // SP to be restored, so we need another base register to record the stack
908 // after realignment.
909 // |--------------------------| -- <-- FP
910 // | callee-allocated save | | <----|
911 // | area for register varargs| | |
912 // |--------------------------| | |
913 // | callee-saved registers | | |
914 // |--------------------------| -- |
915 // | realignment (the size of | | |
916 // | this area is not counted | | |
917 // | in MFI.getStackSize()) | | |
918 // |--------------------------| -- |-- MFI.getStackSize()
919 // | RVV alignment padding | | |
920 // | (not counted in | | |
921 // | MFI.getStackSize() but | | |
922 // | counted in | | |
923 // | RVFI.getRVVStackSize()) | | |
924 // |--------------------------| -- |
925 // | RVV objects | | |
926 // | (not counted in | | |
927 // | MFI.getStackSize()) | | |
928 // |--------------------------| -- |
929 // | padding before RVV | | |
930 // | (not counted in | | |
931 // | MFI.getStackSize() or in | | |
932 // | RVFI.getRVVStackSize()) | | |
933 // |--------------------------| -- |
934 // | scalar local variables | | <----'
935 // |--------------------------| -- <-- BP (if var sized objects present)
936 // | VarSize objects | |
937 // |--------------------------| -- <-- SP
938 if (hasBP(MF)) {
939 FrameReg = RISCVABI::getBPReg();
940 } else {
941 // VarSize objects must be empty in this case!
942 assert(!MFI.hasVarSizedObjects());
943 FrameReg = RISCV::X2;
944 }
945 } else {
946 FrameReg = RI->getFrameRegister(MF);
947 }
948
949 if (FrameReg == getFPReg(STI)) {
950 Offset += StackOffset::getFixed(RVFI->getVarArgsSaveSize());
951 // When using FP to access scalable vector objects, we need to minus
952 // the frame size.
953 //
954 // |--------------------------| -- <-- FP
955 // | callee-allocated save | |
956 // | area for register varargs| |
957 // |--------------------------| |
958 // | callee-saved registers | |
959 // |--------------------------| | MFI.getStackSize()
960 // | scalar local variables | |
961 // |--------------------------| -- (Offset of RVV objects is from here.)
962 // | RVV objects |
963 // |--------------------------|
964 // | VarSize objects |
965 // |--------------------------| <-- SP
966 if (MFI.getStackID(FI) == TargetStackID::ScalableVector) {
967 assert(!RI->hasStackRealignment(MF) &&
968 "Can't index across variable sized realign");
969 // We don't expect any extra RVV alignment padding, as the stack size
970 // and RVV object sections should be correct aligned in their own
971 // right.
972 assert(MFI.getStackSize() == getStackSizeWithRVVPadding(MF) &&
973 "Inconsistent stack layout");
974 Offset -= StackOffset::getFixed(MFI.getStackSize());
975 }
976 return Offset;
977 }
978
979 // This case handles indexing off both SP and BP.
980 // If indexing off SP, there must not be any var sized objects
981 assert(FrameReg == RISCVABI::getBPReg() || !MFI.hasVarSizedObjects());
982
983 // When using SP to access frame objects, we need to add RVV stack size.
984 //
985 // |--------------------------| -- <-- FP
986 // | callee-allocated save | | <----|
987 // | area for register varargs| | |
988 // |--------------------------| | |
989 // | callee-saved registers | | |
990 // |--------------------------| -- |
991 // | RVV alignment padding | | |
992 // | (not counted in | | |
993 // | MFI.getStackSize() but | | |
994 // | counted in | | |
995 // | RVFI.getRVVStackSize()) | | |
996 // |--------------------------| -- |
997 // | RVV objects | | |-- MFI.getStackSize()
998 // | (not counted in | | |
999 // | MFI.getStackSize()) | | |
1000 // |--------------------------| -- |
1001 // | padding before RVV | | |
1002 // | (not counted in | | |
1003 // | MFI.getStackSize()) | | |
1004 // |--------------------------| -- |
1005 // | scalar local variables | | <----'
1006 // |--------------------------| -- <-- BP (if var sized objects present)
1007 // | VarSize objects | |
1008 // |--------------------------| -- <-- SP
1009 //
1010 // The total amount of padding surrounding RVV objects is described by
1011 // RVV->getRVVPadding() and it can be zero. It allows us to align the RVV
1012 // objects to the required alignment.
1013 if (MFI.getStackID(FI) == TargetStackID::Default) {
1014 if (MFI.isFixedObjectIndex(FI)) {
1015 assert(!RI->hasStackRealignment(MF) &&
1016 "Can't index across variable sized realign");
1017 Offset += StackOffset::get(getStackSizeWithRVVPadding(MF),
1018 RVFI->getRVVStackSize());
1019 } else {
1020 Offset += StackOffset::getFixed(MFI.getStackSize());
1021 }
1022 } else if (MFI.getStackID(FI) == TargetStackID::ScalableVector) {
1023 // Ensure the base of the RVV stack is correctly aligned: add on the
1024 // alignment padding.
1025 int ScalarLocalVarSize = MFI.getStackSize() -
1026 RVFI->getCalleeSavedStackSize() -
1027 RVFI->getRVPushStackSize() -
1028 RVFI->getVarArgsSaveSize() + RVFI->getRVVPadding();
1029 Offset += StackOffset::get(ScalarLocalVarSize, RVFI->getRVVStackSize());
1030 }
1031 return Offset;
1032 }
1033
determineCalleeSaves(MachineFunction & MF,BitVector & SavedRegs,RegScavenger * RS) const1034 void RISCVFrameLowering::determineCalleeSaves(MachineFunction &MF,
1035 BitVector &SavedRegs,
1036 RegScavenger *RS) const {
1037 TargetFrameLowering::determineCalleeSaves(MF, SavedRegs, RS);
1038 // Unconditionally spill RA and FP only if the function uses a frame
1039 // pointer.
1040 if (hasFP(MF)) {
1041 SavedRegs.set(RISCV::X1);
1042 SavedRegs.set(RISCV::X8);
1043 }
1044 // Mark BP as used if function has dedicated base pointer.
1045 if (hasBP(MF))
1046 SavedRegs.set(RISCVABI::getBPReg());
1047
1048 // When using cm.push/pop we must save X27 if we save X26.
1049 auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>();
1050 if (RVFI->isPushable(MF) && SavedRegs.test(RISCV::X26))
1051 SavedRegs.set(RISCV::X27);
1052 }
1053
1054 std::pair<int64_t, Align>
assignRVVStackObjectOffsets(MachineFunction & MF) const1055 RISCVFrameLowering::assignRVVStackObjectOffsets(MachineFunction &MF) const {
1056 MachineFrameInfo &MFI = MF.getFrameInfo();
1057 // Create a buffer of RVV objects to allocate.
1058 SmallVector<int, 8> ObjectsToAllocate;
1059 auto pushRVVObjects = [&](int FIBegin, int FIEnd) {
1060 for (int I = FIBegin, E = FIEnd; I != E; ++I) {
1061 unsigned StackID = MFI.getStackID(I);
1062 if (StackID != TargetStackID::ScalableVector)
1063 continue;
1064 if (MFI.isDeadObjectIndex(I))
1065 continue;
1066
1067 ObjectsToAllocate.push_back(I);
1068 }
1069 };
1070 // First push RVV Callee Saved object, then push RVV stack object
1071 std::vector<CalleeSavedInfo> &CSI = MF.getFrameInfo().getCalleeSavedInfo();
1072 const auto &RVVCSI = getRVVCalleeSavedInfo(MF, CSI);
1073 if (!RVVCSI.empty())
1074 pushRVVObjects(RVVCSI[0].getFrameIdx(),
1075 RVVCSI[RVVCSI.size() - 1].getFrameIdx() + 1);
1076 pushRVVObjects(0, MFI.getObjectIndexEnd() - RVVCSI.size());
1077
1078 // The minimum alignment is 16 bytes.
1079 Align RVVStackAlign(16);
1080 const auto &ST = MF.getSubtarget<RISCVSubtarget>();
1081
1082 if (!ST.hasVInstructions()) {
1083 assert(ObjectsToAllocate.empty() &&
1084 "Can't allocate scalable-vector objects without V instructions");
1085 return std::make_pair(0, RVVStackAlign);
1086 }
1087
1088 // Allocate all RVV locals and spills
1089 int64_t Offset = 0;
1090 for (int FI : ObjectsToAllocate) {
1091 // ObjectSize in bytes.
1092 int64_t ObjectSize = MFI.getObjectSize(FI);
1093 auto ObjectAlign = std::max(Align(8), MFI.getObjectAlign(FI));
1094 // If the data type is the fractional vector type, reserve one vector
1095 // register for it.
1096 if (ObjectSize < 8)
1097 ObjectSize = 8;
1098 Offset = alignTo(Offset + ObjectSize, ObjectAlign);
1099 MFI.setObjectOffset(FI, -Offset);
1100 // Update the maximum alignment of the RVV stack section
1101 RVVStackAlign = std::max(RVVStackAlign, ObjectAlign);
1102 }
1103
1104 // Ensure the alignment of the RVV stack. Since we want the most-aligned
1105 // object right at the bottom (i.e., any padding at the top of the frame),
1106 // readjust all RVV objects down by the alignment padding.
1107 uint64_t StackSize = Offset;
1108 if (auto AlignmentPadding = offsetToAlignment(StackSize, RVVStackAlign)) {
1109 StackSize += AlignmentPadding;
1110 for (int FI : ObjectsToAllocate)
1111 MFI.setObjectOffset(FI, MFI.getObjectOffset(FI) - AlignmentPadding);
1112 }
1113
1114 return std::make_pair(StackSize, RVVStackAlign);
1115 }
1116
getScavSlotsNumForRVV(MachineFunction & MF)1117 static unsigned getScavSlotsNumForRVV(MachineFunction &MF) {
1118 // For RVV spill, scalable stack offsets computing requires up to two scratch
1119 // registers
1120 static constexpr unsigned ScavSlotsNumRVVSpillScalableObject = 2;
1121
1122 // For RVV spill, non-scalable stack offsets computing requires up to one
1123 // scratch register.
1124 static constexpr unsigned ScavSlotsNumRVVSpillNonScalableObject = 1;
1125
1126 // ADDI instruction's destination register can be used for computing
1127 // offsets. So Scalable stack offsets require up to one scratch register.
1128 static constexpr unsigned ScavSlotsADDIScalableObject = 1;
1129
1130 static constexpr unsigned MaxScavSlotsNumKnown =
1131 std::max({ScavSlotsADDIScalableObject, ScavSlotsNumRVVSpillScalableObject,
1132 ScavSlotsNumRVVSpillNonScalableObject});
1133
1134 unsigned MaxScavSlotsNum = 0;
1135 if (!MF.getSubtarget<RISCVSubtarget>().hasVInstructions())
1136 return false;
1137 for (const MachineBasicBlock &MBB : MF)
1138 for (const MachineInstr &MI : MBB) {
1139 bool IsRVVSpill = RISCV::isRVVSpill(MI);
1140 for (auto &MO : MI.operands()) {
1141 if (!MO.isFI())
1142 continue;
1143 bool IsScalableVectorID = MF.getFrameInfo().getStackID(MO.getIndex()) ==
1144 TargetStackID::ScalableVector;
1145 if (IsRVVSpill) {
1146 MaxScavSlotsNum = std::max(
1147 MaxScavSlotsNum, IsScalableVectorID
1148 ? ScavSlotsNumRVVSpillScalableObject
1149 : ScavSlotsNumRVVSpillNonScalableObject);
1150 } else if (MI.getOpcode() == RISCV::ADDI && IsScalableVectorID) {
1151 MaxScavSlotsNum =
1152 std::max(MaxScavSlotsNum, ScavSlotsADDIScalableObject);
1153 }
1154 }
1155 if (MaxScavSlotsNum == MaxScavSlotsNumKnown)
1156 return MaxScavSlotsNumKnown;
1157 }
1158 return MaxScavSlotsNum;
1159 }
1160
hasRVVFrameObject(const MachineFunction & MF)1161 static bool hasRVVFrameObject(const MachineFunction &MF) {
1162 // Originally, the function will scan all the stack objects to check whether
1163 // if there is any scalable vector object on the stack or not. However, it
1164 // causes errors in the register allocator. In issue 53016, it returns false
1165 // before RA because there is no RVV stack objects. After RA, it returns true
1166 // because there are spilling slots for RVV values during RA. It will not
1167 // reserve BP during register allocation and generate BP access in the PEI
1168 // pass due to the inconsistent behavior of the function.
1169 //
1170 // The function is changed to use hasVInstructions() as the return value. It
1171 // is not precise, but it can make the register allocation correct.
1172 //
1173 // FIXME: Find a better way to make the decision or revisit the solution in
1174 // D103622.
1175 //
1176 // Refer to https://github.com/llvm/llvm-project/issues/53016.
1177 return MF.getSubtarget<RISCVSubtarget>().hasVInstructions();
1178 }
1179
estimateFunctionSizeInBytes(const MachineFunction & MF,const RISCVInstrInfo & TII)1180 static unsigned estimateFunctionSizeInBytes(const MachineFunction &MF,
1181 const RISCVInstrInfo &TII) {
1182 unsigned FnSize = 0;
1183 for (auto &MBB : MF) {
1184 for (auto &MI : MBB) {
1185 // Far branches over 20-bit offset will be relaxed in branch relaxation
1186 // pass. In the worst case, conditional branches will be relaxed into
1187 // the following instruction sequence. Unconditional branches are
1188 // relaxed in the same way, with the exception that there is no first
1189 // branch instruction.
1190 //
1191 // foo
1192 // bne t5, t6, .rev_cond # `TII->getInstSizeInBytes(MI)` bytes
1193 // sd s11, 0(sp) # 4 bytes, or 2 bytes in RVC
1194 // jump .restore, s11 # 8 bytes
1195 // .rev_cond
1196 // bar
1197 // j .dest_bb # 4 bytes, or 2 bytes in RVC
1198 // .restore:
1199 // ld s11, 0(sp) # 4 bytes, or 2 bytes in RVC
1200 // .dest:
1201 // baz
1202 if (MI.isConditionalBranch())
1203 FnSize += TII.getInstSizeInBytes(MI);
1204 if (MI.isConditionalBranch() || MI.isUnconditionalBranch()) {
1205 if (MF.getSubtarget<RISCVSubtarget>().hasStdExtCOrZca())
1206 FnSize += 2 + 8 + 2 + 2;
1207 else
1208 FnSize += 4 + 8 + 4 + 4;
1209 continue;
1210 }
1211
1212 FnSize += TII.getInstSizeInBytes(MI);
1213 }
1214 }
1215 return FnSize;
1216 }
1217
processFunctionBeforeFrameFinalized(MachineFunction & MF,RegScavenger * RS) const1218 void RISCVFrameLowering::processFunctionBeforeFrameFinalized(
1219 MachineFunction &MF, RegScavenger *RS) const {
1220 const RISCVRegisterInfo *RegInfo =
1221 MF.getSubtarget<RISCVSubtarget>().getRegisterInfo();
1222 const RISCVInstrInfo *TII = MF.getSubtarget<RISCVSubtarget>().getInstrInfo();
1223 MachineFrameInfo &MFI = MF.getFrameInfo();
1224 const TargetRegisterClass *RC = &RISCV::GPRRegClass;
1225 auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>();
1226
1227 int64_t RVVStackSize;
1228 Align RVVStackAlign;
1229 std::tie(RVVStackSize, RVVStackAlign) = assignRVVStackObjectOffsets(MF);
1230
1231 RVFI->setRVVStackSize(RVVStackSize);
1232 RVFI->setRVVStackAlign(RVVStackAlign);
1233
1234 if (hasRVVFrameObject(MF)) {
1235 // Ensure the entire stack is aligned to at least the RVV requirement: some
1236 // scalable-vector object alignments are not considered by the
1237 // target-independent code.
1238 MFI.ensureMaxAlignment(RVVStackAlign);
1239 }
1240
1241 unsigned ScavSlotsNum = 0;
1242
1243 // estimateStackSize has been observed to under-estimate the final stack
1244 // size, so give ourselves wiggle-room by checking for stack size
1245 // representable an 11-bit signed field rather than 12-bits.
1246 if (!isInt<11>(MFI.estimateStackSize(MF)))
1247 ScavSlotsNum = 1;
1248
1249 // Far branches over 20-bit offset require a spill slot for scratch register.
1250 bool IsLargeFunction = !isInt<20>(estimateFunctionSizeInBytes(MF, *TII));
1251 if (IsLargeFunction)
1252 ScavSlotsNum = std::max(ScavSlotsNum, 1u);
1253
1254 // RVV loads & stores have no capacity to hold the immediate address offsets
1255 // so we must always reserve an emergency spill slot if the MachineFunction
1256 // contains any RVV spills.
1257 ScavSlotsNum = std::max(ScavSlotsNum, getScavSlotsNumForRVV(MF));
1258
1259 for (unsigned I = 0; I < ScavSlotsNum; I++) {
1260 int FI = MFI.CreateStackObject(RegInfo->getSpillSize(*RC),
1261 RegInfo->getSpillAlign(*RC), false);
1262 RS->addScavengingFrameIndex(FI);
1263
1264 if (IsLargeFunction && RVFI->getBranchRelaxationScratchFrameIndex() == -1)
1265 RVFI->setBranchRelaxationScratchFrameIndex(FI);
1266 }
1267
1268 unsigned Size = RVFI->getReservedSpillsSize();
1269 for (const auto &Info : MFI.getCalleeSavedInfo()) {
1270 int FrameIdx = Info.getFrameIdx();
1271 if (FrameIdx < 0 || MFI.getStackID(FrameIdx) != TargetStackID::Default)
1272 continue;
1273
1274 Size += MFI.getObjectSize(FrameIdx);
1275 }
1276 RVFI->setCalleeSavedStackSize(Size);
1277 }
1278
1279 // Not preserve stack space within prologue for outgoing variables when the
1280 // function contains variable size objects or there are vector objects accessed
1281 // by the frame pointer.
1282 // Let eliminateCallFramePseudoInstr preserve stack space for it.
hasReservedCallFrame(const MachineFunction & MF) const1283 bool RISCVFrameLowering::hasReservedCallFrame(const MachineFunction &MF) const {
1284 return !MF.getFrameInfo().hasVarSizedObjects() &&
1285 !(hasFP(MF) && hasRVVFrameObject(MF));
1286 }
1287
1288 // Eliminate ADJCALLSTACKDOWN, ADJCALLSTACKUP pseudo instructions.
eliminateCallFramePseudoInstr(MachineFunction & MF,MachineBasicBlock & MBB,MachineBasicBlock::iterator MI) const1289 MachineBasicBlock::iterator RISCVFrameLowering::eliminateCallFramePseudoInstr(
1290 MachineFunction &MF, MachineBasicBlock &MBB,
1291 MachineBasicBlock::iterator MI) const {
1292 Register SPReg = RISCV::X2;
1293 DebugLoc DL = MI->getDebugLoc();
1294
1295 if (!hasReservedCallFrame(MF)) {
1296 // If space has not been reserved for a call frame, ADJCALLSTACKDOWN and
1297 // ADJCALLSTACKUP must be converted to instructions manipulating the stack
1298 // pointer. This is necessary when there is a variable length stack
1299 // allocation (e.g. alloca), which means it's not possible to allocate
1300 // space for outgoing arguments from within the function prologue.
1301 int64_t Amount = MI->getOperand(0).getImm();
1302
1303 if (Amount != 0) {
1304 // Ensure the stack remains aligned after adjustment.
1305 Amount = alignSPAdjust(Amount);
1306
1307 if (MI->getOpcode() == RISCV::ADJCALLSTACKDOWN)
1308 Amount = -Amount;
1309
1310 const RISCVRegisterInfo &RI = *STI.getRegisterInfo();
1311 RI.adjustReg(MBB, MI, DL, SPReg, SPReg, StackOffset::getFixed(Amount),
1312 MachineInstr::NoFlags, getStackAlign());
1313 }
1314 }
1315
1316 return MBB.erase(MI);
1317 }
1318
1319 // We would like to split the SP adjustment to reduce prologue/epilogue
1320 // as following instructions. In this way, the offset of the callee saved
1321 // register could fit in a single store. Supposed that the first sp adjust
1322 // amount is 2032.
1323 // add sp,sp,-2032
1324 // sw ra,2028(sp)
1325 // sw s0,2024(sp)
1326 // sw s1,2020(sp)
1327 // sw s3,2012(sp)
1328 // sw s4,2008(sp)
1329 // add sp,sp,-64
1330 uint64_t
getFirstSPAdjustAmount(const MachineFunction & MF) const1331 RISCVFrameLowering::getFirstSPAdjustAmount(const MachineFunction &MF) const {
1332 const auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>();
1333 const MachineFrameInfo &MFI = MF.getFrameInfo();
1334 const std::vector<CalleeSavedInfo> &CSI = MFI.getCalleeSavedInfo();
1335 uint64_t StackSize = getStackSizeWithRVVPadding(MF);
1336
1337 // Disable SplitSPAdjust if save-restore libcall is used. The callee-saved
1338 // registers will be pushed by the save-restore libcalls, so we don't have to
1339 // split the SP adjustment in this case.
1340 if (RVFI->getReservedSpillsSize())
1341 return 0;
1342
1343 // Return the FirstSPAdjustAmount if the StackSize can not fit in a signed
1344 // 12-bit and there exists a callee-saved register needing to be pushed.
1345 if (!isInt<12>(StackSize) && (CSI.size() > 0)) {
1346 // FirstSPAdjustAmount is chosen at most as (2048 - StackAlign) because
1347 // 2048 will cause sp = sp + 2048 in the epilogue to be split into multiple
1348 // instructions. Offsets smaller than 2048 can fit in a single load/store
1349 // instruction, and we have to stick with the stack alignment. 2048 has
1350 // 16-byte alignment. The stack alignment for RV32 and RV64 is 16 and for
1351 // RV32E it is 4. So (2048 - StackAlign) will satisfy the stack alignment.
1352 const uint64_t StackAlign = getStackAlign().value();
1353
1354 // Amount of (2048 - StackAlign) will prevent callee saved and restored
1355 // instructions be compressed, so try to adjust the amount to the largest
1356 // offset that stack compression instructions accept when target supports
1357 // compression instructions.
1358 if (STI.hasStdExtCOrZca()) {
1359 // The compression extensions may support the following instructions:
1360 // riscv32: c.lwsp rd, offset[7:2] => 2^(6 + 2)
1361 // c.swsp rs2, offset[7:2] => 2^(6 + 2)
1362 // c.flwsp rd, offset[7:2] => 2^(6 + 2)
1363 // c.fswsp rs2, offset[7:2] => 2^(6 + 2)
1364 // riscv64: c.ldsp rd, offset[8:3] => 2^(6 + 3)
1365 // c.sdsp rs2, offset[8:3] => 2^(6 + 3)
1366 // c.fldsp rd, offset[8:3] => 2^(6 + 3)
1367 // c.fsdsp rs2, offset[8:3] => 2^(6 + 3)
1368 const uint64_t RVCompressLen = STI.getXLen() * 8;
1369 // Compared with amount (2048 - StackAlign), StackSize needs to
1370 // satisfy the following conditions to avoid using more instructions
1371 // to adjust the sp after adjusting the amount, such as
1372 // StackSize meets the condition (StackSize <= 2048 + RVCompressLen),
1373 // case1: Amount is 2048 - StackAlign: use addi + addi to adjust sp.
1374 // case2: Amount is RVCompressLen: use addi + addi to adjust sp.
1375 auto CanCompress = [&](uint64_t CompressLen) -> bool {
1376 if (StackSize <= 2047 + CompressLen ||
1377 (StackSize > 2048 * 2 - StackAlign &&
1378 StackSize <= 2047 * 2 + CompressLen) ||
1379 StackSize > 2048 * 3 - StackAlign)
1380 return true;
1381
1382 return false;
1383 };
1384 // In the epilogue, addi sp, sp, 496 is used to recover the sp and it
1385 // can be compressed(C.ADDI16SP, offset can be [-512, 496]), but
1386 // addi sp, sp, 512 can not be compressed. So try to use 496 first.
1387 const uint64_t ADDI16SPCompressLen = 496;
1388 if (STI.is64Bit() && CanCompress(ADDI16SPCompressLen))
1389 return ADDI16SPCompressLen;
1390 if (CanCompress(RVCompressLen))
1391 return RVCompressLen;
1392 }
1393 return 2048 - StackAlign;
1394 }
1395 return 0;
1396 }
1397
assignCalleeSavedSpillSlots(MachineFunction & MF,const TargetRegisterInfo * TRI,std::vector<CalleeSavedInfo> & CSI,unsigned & MinCSFrameIndex,unsigned & MaxCSFrameIndex) const1398 bool RISCVFrameLowering::assignCalleeSavedSpillSlots(
1399 MachineFunction &MF, const TargetRegisterInfo *TRI,
1400 std::vector<CalleeSavedInfo> &CSI, unsigned &MinCSFrameIndex,
1401 unsigned &MaxCSFrameIndex) const {
1402 // Early exit if no callee saved registers are modified!
1403 if (CSI.empty())
1404 return true;
1405
1406 auto *RVFI = MF.getInfo<RISCVMachineFunctionInfo>();
1407
1408 if (RVFI->isPushable(MF)) {
1409 // Determine how many GPRs we need to push and save it to RVFI.
1410 Register MaxReg = getMaxPushPopReg(MF, CSI);
1411 if (MaxReg != RISCV::NoRegister) {
1412 auto [RegEnc, PushedRegNum] = getPushPopEncodingAndNum(MaxReg);
1413 RVFI->setRVPushRegs(PushedRegNum);
1414 RVFI->setRVPushStackSize(alignTo((STI.getXLen() / 8) * PushedRegNum, 16));
1415
1416 // Use encoded number to represent registers to spill.
1417 RVFI->setRVPushRlist(RegEnc);
1418 }
1419 }
1420
1421 MachineFrameInfo &MFI = MF.getFrameInfo();
1422 const TargetRegisterInfo *RegInfo = MF.getSubtarget().getRegisterInfo();
1423
1424 for (auto &CS : CSI) {
1425 unsigned Reg = CS.getReg();
1426 const TargetRegisterClass *RC = RegInfo->getMinimalPhysRegClass(Reg);
1427 unsigned Size = RegInfo->getSpillSize(*RC);
1428
1429 // This might need a fixed stack slot.
1430 if (RVFI->useSaveRestoreLibCalls(MF) || RVFI->isPushable(MF)) {
1431 const auto *FII = llvm::find_if(
1432 FixedCSRFIMap, [&](auto P) { return P.first == CS.getReg(); });
1433 if (FII != std::end(FixedCSRFIMap)) {
1434 int64_t Offset;
1435 if (RVFI->isPushable(MF))
1436 Offset = -((FII->second + RVFI->getRVPushRegs() + 1) * (int64_t)Size);
1437 else
1438 Offset = FII->second * (int64_t)Size;
1439
1440 int FrameIdx = MFI.CreateFixedSpillStackObject(Size, Offset);
1441 assert(FrameIdx < 0);
1442 CS.setFrameIdx(FrameIdx);
1443 continue;
1444 }
1445 }
1446
1447 // Not a fixed slot.
1448 Align Alignment = RegInfo->getSpillAlign(*RC);
1449 // We may not be able to satisfy the desired alignment specification of
1450 // the TargetRegisterClass if the stack alignment is smaller. Use the
1451 // min.
1452 Alignment = std::min(Alignment, getStackAlign());
1453 int FrameIdx = MFI.CreateStackObject(Size, Alignment, true);
1454 if ((unsigned)FrameIdx < MinCSFrameIndex)
1455 MinCSFrameIndex = FrameIdx;
1456 if ((unsigned)FrameIdx > MaxCSFrameIndex)
1457 MaxCSFrameIndex = FrameIdx;
1458 CS.setFrameIdx(FrameIdx);
1459 }
1460
1461 // Allocate a fixed object that covers the full push or libcall size.
1462 if (RVFI->isPushable(MF)) {
1463 if (int64_t PushSize = RVFI->getRVPushStackSize())
1464 MFI.CreateFixedSpillStackObject(PushSize, -PushSize);
1465 } else if (int LibCallRegs = getLibCallID(MF, CSI) + 1) {
1466 int64_t LibCallFrameSize =
1467 alignTo((STI.getXLen() / 8) * LibCallRegs, getStackAlign());
1468 MFI.CreateFixedSpillStackObject(LibCallFrameSize, -LibCallFrameSize);
1469 }
1470
1471 return true;
1472 }
1473
spillCalleeSavedRegisters(MachineBasicBlock & MBB,MachineBasicBlock::iterator MI,ArrayRef<CalleeSavedInfo> CSI,const TargetRegisterInfo * TRI) const1474 bool RISCVFrameLowering::spillCalleeSavedRegisters(
1475 MachineBasicBlock &MBB, MachineBasicBlock::iterator MI,
1476 ArrayRef<CalleeSavedInfo> CSI, const TargetRegisterInfo *TRI) const {
1477 if (CSI.empty())
1478 return true;
1479
1480 MachineFunction *MF = MBB.getParent();
1481 const TargetInstrInfo &TII = *MF->getSubtarget().getInstrInfo();
1482 DebugLoc DL;
1483 if (MI != MBB.end() && !MI->isDebugInstr())
1484 DL = MI->getDebugLoc();
1485
1486 // Emit CM.PUSH with base SPimm & evaluate Push stack
1487 RISCVMachineFunctionInfo *RVFI = MF->getInfo<RISCVMachineFunctionInfo>();
1488 if (RVFI->isPushable(*MF)) {
1489 unsigned PushedRegNum = RVFI->getRVPushRegs();
1490 if (PushedRegNum > 0) {
1491 // Use encoded number to represent registers to spill.
1492 int RegEnc = RVFI->getRVPushRlist();
1493 MachineInstrBuilder PushBuilder =
1494 BuildMI(MBB, MI, DL, TII.get(RISCV::CM_PUSH))
1495 .setMIFlag(MachineInstr::FrameSetup);
1496 PushBuilder.addImm((int64_t)RegEnc);
1497 PushBuilder.addImm(0);
1498
1499 for (unsigned i = 0; i < PushedRegNum; i++)
1500 PushBuilder.addUse(FixedCSRFIMap[i].first, RegState::Implicit);
1501 }
1502 } else if (const char *SpillLibCall = getSpillLibCallName(*MF, CSI)) {
1503 // Add spill libcall via non-callee-saved register t0.
1504 BuildMI(MBB, MI, DL, TII.get(RISCV::PseudoCALLReg), RISCV::X5)
1505 .addExternalSymbol(SpillLibCall, RISCVII::MO_CALL)
1506 .setMIFlag(MachineInstr::FrameSetup);
1507
1508 // Add registers spilled in libcall as liveins.
1509 for (auto &CS : CSI)
1510 MBB.addLiveIn(CS.getReg());
1511 }
1512
1513 // Manually spill values not spilled by libcall & Push/Pop.
1514 const auto &UnmanagedCSI = getUnmanagedCSI(*MF, CSI);
1515 const auto &RVVCSI = getRVVCalleeSavedInfo(*MF, CSI);
1516
1517 auto storeRegToStackSlot = [&](decltype(UnmanagedCSI) CSInfo) {
1518 for (auto &CS : CSInfo) {
1519 // Insert the spill to the stack frame.
1520 Register Reg = CS.getReg();
1521 const TargetRegisterClass *RC = TRI->getMinimalPhysRegClass(Reg);
1522 TII.storeRegToStackSlot(MBB, MI, Reg, !MBB.isLiveIn(Reg),
1523 CS.getFrameIdx(), RC, TRI, Register());
1524 }
1525 };
1526 storeRegToStackSlot(UnmanagedCSI);
1527 storeRegToStackSlot(RVVCSI);
1528
1529 return true;
1530 }
1531
emitCalleeSavedRVVPrologCFI(MachineBasicBlock & MBB,MachineBasicBlock::iterator MI,bool HasFP) const1532 void RISCVFrameLowering::emitCalleeSavedRVVPrologCFI(
1533 MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, bool HasFP) const {
1534 MachineFunction *MF = MBB.getParent();
1535 const MachineFrameInfo &MFI = MF->getFrameInfo();
1536 RISCVMachineFunctionInfo *RVFI = MF->getInfo<RISCVMachineFunctionInfo>();
1537 const TargetInstrInfo &TII = *STI.getInstrInfo();
1538 DebugLoc DL = MBB.findDebugLoc(MI);
1539
1540 const auto &RVVCSI = getRVVCalleeSavedInfo(*MF, MFI.getCalleeSavedInfo());
1541 if (RVVCSI.empty())
1542 return;
1543
1544 uint64_t FixedSize = getStackSizeWithRVVPadding(*MF);
1545 if (!HasFP) {
1546 uint64_t ScalarLocalVarSize =
1547 MFI.getStackSize() - RVFI->getCalleeSavedStackSize() -
1548 RVFI->getRVPushStackSize() - RVFI->getVarArgsSaveSize() +
1549 RVFI->getRVVPadding();
1550 FixedSize -= ScalarLocalVarSize;
1551 }
1552
1553 for (auto &CS : RVVCSI) {
1554 // Insert the spill to the stack frame.
1555 int FI = CS.getFrameIdx();
1556 if (FI >= 0 && MFI.getStackID(FI) == TargetStackID::ScalableVector) {
1557 unsigned CFIIndex = MF->addFrameInst(
1558 createDefCFAOffset(*STI.getRegisterInfo(), CS.getReg(), -FixedSize,
1559 MFI.getObjectOffset(FI) / 8));
1560 BuildMI(MBB, MI, DL, TII.get(TargetOpcode::CFI_INSTRUCTION))
1561 .addCFIIndex(CFIIndex)
1562 .setMIFlag(MachineInstr::FrameSetup);
1563 }
1564 }
1565 }
1566
restoreCalleeSavedRegisters(MachineBasicBlock & MBB,MachineBasicBlock::iterator MI,MutableArrayRef<CalleeSavedInfo> CSI,const TargetRegisterInfo * TRI) const1567 bool RISCVFrameLowering::restoreCalleeSavedRegisters(
1568 MachineBasicBlock &MBB, MachineBasicBlock::iterator MI,
1569 MutableArrayRef<CalleeSavedInfo> CSI, const TargetRegisterInfo *TRI) const {
1570 if (CSI.empty())
1571 return true;
1572
1573 MachineFunction *MF = MBB.getParent();
1574 const TargetInstrInfo &TII = *MF->getSubtarget().getInstrInfo();
1575 DebugLoc DL;
1576 if (MI != MBB.end() && !MI->isDebugInstr())
1577 DL = MI->getDebugLoc();
1578
1579 // Manually restore values not restored by libcall & Push/Pop.
1580 // Reverse the restore order in epilog. In addition, the return
1581 // address will be restored first in the epilogue. It increases
1582 // the opportunity to avoid the load-to-use data hazard between
1583 // loading RA and return by RA. loadRegFromStackSlot can insert
1584 // multiple instructions.
1585 const auto &UnmanagedCSI = getUnmanagedCSI(*MF, CSI);
1586 const auto &RVVCSI = getRVVCalleeSavedInfo(*MF, CSI);
1587
1588 auto loadRegFromStackSlot = [&](decltype(UnmanagedCSI) CSInfo) {
1589 for (auto &CS : CSInfo) {
1590 Register Reg = CS.getReg();
1591 const TargetRegisterClass *RC = TRI->getMinimalPhysRegClass(Reg);
1592 TII.loadRegFromStackSlot(MBB, MI, Reg, CS.getFrameIdx(), RC, TRI,
1593 Register());
1594 assert(MI != MBB.begin() &&
1595 "loadRegFromStackSlot didn't insert any code!");
1596 }
1597 };
1598 loadRegFromStackSlot(RVVCSI);
1599 loadRegFromStackSlot(UnmanagedCSI);
1600
1601 RISCVMachineFunctionInfo *RVFI = MF->getInfo<RISCVMachineFunctionInfo>();
1602 if (RVFI->isPushable(*MF)) {
1603 int RegEnc = RVFI->getRVPushRlist();
1604 if (RegEnc != llvm::RISCVZC::RLISTENCODE::INVALID_RLIST) {
1605 MachineInstrBuilder PopBuilder =
1606 BuildMI(MBB, MI, DL, TII.get(RISCV::CM_POP))
1607 .setMIFlag(MachineInstr::FrameDestroy);
1608 // Use encoded number to represent registers to restore.
1609 PopBuilder.addImm(RegEnc);
1610 PopBuilder.addImm(0);
1611
1612 for (unsigned i = 0; i < RVFI->getRVPushRegs(); i++)
1613 PopBuilder.addDef(FixedCSRFIMap[i].first, RegState::ImplicitDefine);
1614 }
1615 } else {
1616 const char *RestoreLibCall = getRestoreLibCallName(*MF, CSI);
1617 if (RestoreLibCall) {
1618 // Add restore libcall via tail call.
1619 MachineBasicBlock::iterator NewMI =
1620 BuildMI(MBB, MI, DL, TII.get(RISCV::PseudoTAIL))
1621 .addExternalSymbol(RestoreLibCall, RISCVII::MO_CALL)
1622 .setMIFlag(MachineInstr::FrameDestroy);
1623
1624 // Remove trailing returns, since the terminator is now a tail call to the
1625 // restore function.
1626 if (MI != MBB.end() && MI->getOpcode() == RISCV::PseudoRET) {
1627 NewMI->copyImplicitOps(*MF, *MI);
1628 MI->eraseFromParent();
1629 }
1630 }
1631 }
1632 return true;
1633 }
1634
enableShrinkWrapping(const MachineFunction & MF) const1635 bool RISCVFrameLowering::enableShrinkWrapping(const MachineFunction &MF) const {
1636 // Keep the conventional code flow when not optimizing.
1637 if (MF.getFunction().hasOptNone())
1638 return false;
1639
1640 return true;
1641 }
1642
canUseAsPrologue(const MachineBasicBlock & MBB) const1643 bool RISCVFrameLowering::canUseAsPrologue(const MachineBasicBlock &MBB) const {
1644 MachineBasicBlock *TmpMBB = const_cast<MachineBasicBlock *>(&MBB);
1645 const MachineFunction *MF = MBB.getParent();
1646 const auto *RVFI = MF->getInfo<RISCVMachineFunctionInfo>();
1647
1648 if (!RVFI->useSaveRestoreLibCalls(*MF))
1649 return true;
1650
1651 // Inserting a call to a __riscv_save libcall requires the use of the register
1652 // t0 (X5) to hold the return address. Therefore if this register is already
1653 // used we can't insert the call.
1654
1655 RegScavenger RS;
1656 RS.enterBasicBlock(*TmpMBB);
1657 return !RS.isRegUsed(RISCV::X5);
1658 }
1659
canUseAsEpilogue(const MachineBasicBlock & MBB) const1660 bool RISCVFrameLowering::canUseAsEpilogue(const MachineBasicBlock &MBB) const {
1661 const MachineFunction *MF = MBB.getParent();
1662 MachineBasicBlock *TmpMBB = const_cast<MachineBasicBlock *>(&MBB);
1663 const auto *RVFI = MF->getInfo<RISCVMachineFunctionInfo>();
1664
1665 if (!RVFI->useSaveRestoreLibCalls(*MF))
1666 return true;
1667
1668 // Using the __riscv_restore libcalls to restore CSRs requires a tail call.
1669 // This means if we still need to continue executing code within this function
1670 // the restore cannot take place in this basic block.
1671
1672 if (MBB.succ_size() > 1)
1673 return false;
1674
1675 MachineBasicBlock *SuccMBB =
1676 MBB.succ_empty() ? TmpMBB->getFallThrough() : *MBB.succ_begin();
1677
1678 // Doing a tail call should be safe if there are no successors, because either
1679 // we have a returning block or the end of the block is unreachable, so the
1680 // restore will be eliminated regardless.
1681 if (!SuccMBB)
1682 return true;
1683
1684 // The successor can only contain a return, since we would effectively be
1685 // replacing the successor with our own tail return at the end of our block.
1686 return SuccMBB->isReturnBlock() && SuccMBB->size() == 1;
1687 }
1688
isSupportedStackID(TargetStackID::Value ID) const1689 bool RISCVFrameLowering::isSupportedStackID(TargetStackID::Value ID) const {
1690 switch (ID) {
1691 case TargetStackID::Default:
1692 case TargetStackID::ScalableVector:
1693 return true;
1694 case TargetStackID::NoAlloc:
1695 case TargetStackID::SGPRSpill:
1696 case TargetStackID::WasmLocal:
1697 return false;
1698 }
1699 llvm_unreachable("Invalid TargetStackID::Value");
1700 }
1701
getStackIDForScalableVectors() const1702 TargetStackID::Value RISCVFrameLowering::getStackIDForScalableVectors() const {
1703 return TargetStackID::ScalableVector;
1704 }
1705