//===- ARMLegalizerInfo.cpp --------------------------------------*- C++ -*-==//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
/// \file
/// This file implements the targeting of the MachineLegalizer class for ARM.
/// \todo This should be generated by TableGen.
//===----------------------------------------------------------------------===//

#include "ARMLegalizerInfo.h"
#include "ARMCallLowering.h"
#include "ARMSubtarget.h"
#include "llvm/CodeGen/GlobalISel/LegalizerHelper.h"
#include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h"
#include "llvm/CodeGen/LowLevelTypeUtils.h"
#include "llvm/CodeGen/MachineRegisterInfo.h"
#include "llvm/CodeGen/TargetOpcodes.h"
#include "llvm/CodeGen/ValueTypes.h"
#include "llvm/IR/DerivedTypes.h"
#include "llvm/IR/Type.h"

using namespace llvm;
using namespace LegalizeActions;

/// FIXME: The following static functions are SizeChangeStrategy functions
/// that are meant to temporarily mimic the behaviour of the old legalization
/// based on doubling/halving non-legal types as closely as possible. This is
/// not entirely possible as only legalizing the types that are exactly a power
/// of 2 times the size of the legal types would require specifying all those
/// sizes explicitly.
/// In practice, not specifying those isn't a problem, and the below functions
/// should disappear quickly as we add support for legalizing non-power-of-2
/// sized types further.
/// Append every (size, action) entry of \p v to \p result.
///
/// After copying entry \c i, an extra {v[i].first + 1, Unsupported} entry is
/// appended when all three conditions of the \c if below hold: the index
/// guard \c i + 1 < v[i].first, a following entry exists, and that following
/// entry does not already start at size v[i].first + 1.
///
/// \param result vector that receives the entries (appended in place).
/// \param v      source (size, action) entries.
static void addAndInterleaveWithUnsupported(
    LegacyLegalizerInfo::SizeAndActionsVec &result,
    const LegacyLegalizerInfo::SizeAndActionsVec &v) {
  for (unsigned i = 0; i < v.size(); ++i) {
    result.push_back(v[i]);
    if (i + 1 < v[i].first && i + 1 < v.size() &&
        v[i + 1].first != v[i].first + 1)
      result.push_back({v[i].first + 1, LegacyLegalizeActions::Unsupported});
  }
}

/// Size-change strategy that widens 8-bit and 16-bit scalars.
///
/// The returned vector starts with a fixed prefix (1: Unsupported,
/// 8: WidenScalar, 9: Unsupported, 16: WidenScalar, 17: Unsupported), is
/// followed by the entries of \p v interleaved with Unsupported entries (see
/// addAndInterleaveWithUnsupported), and ends with an Unsupported entry one
/// past the largest size present.
///
/// \param v explicitly specified (size, action) entries; asserted to be
///          non-empty and to start at a size greater than 17.
/// \returns the combined (size, action) vector.
static LegacyLegalizerInfo::SizeAndActionsVec
widen_8_16(const LegacyLegalizerInfo::SizeAndActionsVec &v) {
  assert(v.size() >= 1);
  assert(v[0].first > 17);
  LegacyLegalizerInfo::SizeAndActionsVec result = {
      {1, LegacyLegalizeActions::Unsupported},
      {8, LegacyLegalizeActions::WidenScalar},
      {9, LegacyLegalizeActions::Unsupported},
      {16, LegacyLegalizeActions::WidenScalar},
      {17, LegacyLegalizeActions::Unsupported}};
  addAndInterleaveWithUnsupported(result, v);
  // Everything above the largest explicitly listed size is unsupported.
  auto Largest = result.back().first;
  result.push_back({Largest + 1, LegacyLegalizeActions::Unsupported});
  return result;
}

/// Return true if \p ST targets any of the AEABI flavours queried below
/// (AEABI, GNU AEABI or Musl AEABI).
static bool AEABI(const ARMSubtarget &ST) {
  return ST.isTargetAEABI() || ST.isTargetGNUAEABI() || ST.isTargetMuslAEABI();
}

/// Set up the GlobalISel legalization rules for the ARM subtarget \p ST.
///
/// For Thumb1-only subtargets no rules are registered; the tables are
/// computed and verified empty. Otherwise rules are registered for integer,
/// pointer, memory and floating-point generic opcodes, with the choice between
/// legal / libcall / custom / lower depending on subtarget features queried
/// from \p ST (NEON, hardware divide, VFP2/VFP4, soft-float, V5T ops, AEABI).
ARMLegalizerInfo::ARMLegalizerInfo(const ARMSubtarget &ST) {
  using namespace TargetOpcode;

  // Low-level types used throughout the rules below.
  const LLT p0 = LLT::pointer(0, 32);

  const LLT s1 = LLT::scalar(1);
  const LLT s8 = LLT::scalar(8);
  const LLT s16 = LLT::scalar(16);
  const LLT s32 = LLT::scalar(32);
  const LLT s64 = LLT::scalar(64);

  auto &LegacyInfo = getLegacyLegalizerInfo();
  if (ST.isThumb1Only()) {
    // Thumb1 is not supported yet.
    LegacyInfo.computeTables();
    verify(*ST.getInstrInfo());
    return;
  }

  // Integer extensions.
  getActionDefinitionsBuilder({G_SEXT, G_ZEXT, G_ANYEXT})
      .legalForCartesianProduct({s8, s16, s32}, {s1, s8, s16});

  getActionDefinitionsBuilder(G_SEXT_INREG).lower();

  // 32-bit integer arithmetic and logic.
  getActionDefinitionsBuilder({G_MUL, G_AND, G_OR, G_XOR})
      .legalFor({s32})
      .clampScalar(0, s32, s32);

  // 64-bit add/sub is additionally marked legal when NEON is available.
  if (ST.hasNEON())
    getActionDefinitionsBuilder({G_ADD, G_SUB})
        .legalFor({s32, s64})
        .minScalar(0, s32);
  else
    getActionDefinitionsBuilder({G_ADD, G_SUB})
        .legalFor({s32})
        .minScalar(0, s32);

  // Shifts: both the value (type index 0) and the amount (type index 1) are
  // 32 bits wide.
  getActionDefinitionsBuilder({G_ASHR, G_LSHR, G_SHL})
    .legalFor({{s32, s32}})
    .minScalar(0, s32)
    .clampScalar(1, s32, s32);

  // Division is legal only when the current instruction set mode (ARM or
  // Thumb) has a divide instruction; otherwise it becomes a libcall.
  bool HasHWDivide = (!ST.isThumb() && ST.hasDivideInARMMode()) ||
                     (ST.isThumb() && ST.hasDivideInThumbMode());
  if (HasHWDivide)
    getActionDefinitionsBuilder({G_SDIV, G_UDIV})
        .legalFor({s32})
        .clampScalar(0, s32, s32);
  else
    getActionDefinitionsBuilder({G_SDIV, G_UDIV})
        .libcallFor({s32})
        .clampScalar(0, s32, s32);

  // Remainder still goes through the legacy legalizer tables: sizes other
  // than s32 follow the widen_8_16 strategy, and the s32 action is Lower with
  // hardware divide, Custom on AEABI targets (handled in legalizeCustom) and
  // Libcall otherwise.
  for (unsigned Op : {G_SREM, G_UREM}) {
    LegacyInfo.setLegalizeScalarToDifferentSizeStrategy(Op, 0, widen_8_16);
    if (HasHWDivide)
      LegacyInfo.setAction({Op, s32}, LegacyLegalizeActions::Lower);
    else if (AEABI(ST))
      LegacyInfo.setAction({Op, s32}, LegacyLegalizeActions::Custom);
    else
      LegacyInfo.setAction({Op, s32}, LegacyLegalizeActions::Libcall);
  }

  // Pointer <-> integer conversions (pointers are 32 bits, see p0).
  getActionDefinitionsBuilder(G_INTTOPTR)
      .legalFor({{p0, s32}})
      .minScalar(1, s32);
  getActionDefinitionsBuilder(G_PTRTOINT)
      .legalFor({{s32, p0}})
      .minScalar(0, s32);

  getActionDefinitionsBuilder(G_CONSTANT)
      .legalFor({s32, p0})
      .clampScalar(0, s32, s32);

  // Integer compare produces an s1 from s32 or pointer operands.
  getActionDefinitionsBuilder(G_ICMP)
      .legalForCartesianProduct({s1}, {s32, p0})
      .minScalar(1, s32);

  getActionDefinitionsBuilder(G_SELECT)
      .legalForCartesianProduct({s32, p0}, {s1})
      .minScalar(0, s32);

  // We're keeping these builders around because we'll want to add support for
  // floating point to them.
  auto &LoadStoreBuilder = getActionDefinitionsBuilder({G_LOAD, G_STORE})
                               .legalForTypesWithMemDesc({{s8, p0, s8, 8},
                                                          {s16, p0, s16, 8},
                                                          {s32, p0, s32, 8},
                                                          {p0, p0, p0, 8}})
                               .unsupportedIfMemSizeNotPow2();

  getActionDefinitionsBuilder(G_FRAME_INDEX).legalFor({p0});
  getActionDefinitionsBuilder(G_GLOBAL_VALUE).legalFor({p0});

  auto &PhiBuilder =
      getActionDefinitionsBuilder(G_PHI)
          .legalFor({s32, p0})
          .minScalar(0, s32);

  getActionDefinitionsBuilder(G_PTR_ADD)
      .legalFor({{p0, s32}})
      .minScalar(1, s32);

  getActionDefinitionsBuilder(G_BRCOND).legalFor({s1});

  if (!ST.useSoftFloat() && ST.hasVFP2Base()) {
    // Hardware floating point: basic FP operations on s32/s64 are legal.
    getActionDefinitionsBuilder(
        {G_FADD, G_FSUB, G_FMUL, G_FDIV, G_FCONSTANT, G_FNEG})
        .legalFor({s32, s64});

    // 64-bit loads/stores and phis also become legal.
    LoadStoreBuilder
        .legalForTypesWithMemDesc({{s64, p0, s64, 32}})
        .maxScalar(0, s32);
    PhiBuilder.legalFor({s64});

    getActionDefinitionsBuilder(G_FCMP).legalForCartesianProduct({s1},
                                                                 {s32, s64});

    getActionDefinitionsBuilder(G_MERGE_VALUES).legalFor({{s64, s32}});
    getActionDefinitionsBuilder(G_UNMERGE_VALUES).legalFor({{s32, s64}});

    getActionDefinitionsBuilder(G_FPEXT).legalFor({{s64, s32}});
    getActionDefinitionsBuilder(G_FPTRUNC).legalFor({{s32, s64}});

    getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI})
        .legalForCartesianProduct({s32}, {s32, s64});
    getActionDefinitionsBuilder({G_SITOFP, G_UITOFP})
        .legalForCartesianProduct({s32, s64}, {s32});
  } else {
    // Soft float (or no VFP2): FP arithmetic and conversions become libcalls,
    // while G_FCONSTANT and G_FCMP are handled in legalizeCustom.
    getActionDefinitionsBuilder({G_FADD, G_FSUB, G_FMUL, G_FDIV})
        .libcallFor({s32, s64});

    LoadStoreBuilder.maxScalar(0, s32);

    for (auto Ty : {s32, s64})
      LegacyInfo.setAction({G_FNEG, Ty}, LegacyLegalizeActions::Lower);

    getActionDefinitionsBuilder(G_FCONSTANT).customFor({s32, s64});

    getActionDefinitionsBuilder(G_FCMP).customForCartesianProduct({s1},
                                                                  {s32, s64});

    // Populate the predicate -> libcall tables consulted by legalizeCustom.
    if (AEABI(ST))
      setFCmpLibcallsAEABI();
    else
      setFCmpLibcallsGNU();

    getActionDefinitionsBuilder(G_FPEXT).libcallFor({{s64, s32}});
    getActionDefinitionsBuilder(G_FPTRUNC).libcallFor({{s32, s64}});

    getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI})
        .libcallForCartesianProduct({s32}, {s32, s64});
    getActionDefinitionsBuilder({G_SITOFP, G_UITOFP})
        .libcallForCartesianProduct({s32, s64}, {s32});
  }

  // Just expand whatever loads and stores are left.
  LoadStoreBuilder.lower();

  // Fused multiply-add is legal only with VFP4 hardware floating point.
  if (!ST.useSoftFloat() && ST.hasVFP4Base())
    getActionDefinitionsBuilder(G_FMA).legalFor({s32, s64});
  else
    getActionDefinitionsBuilder(G_FMA).libcallFor({s32, s64});

  getActionDefinitionsBuilder({G_FREM, G_FPOW}).libcallFor({s32, s64});

  // Count-leading-zeros. With V5T ops G_CTLZ is legal and the ZERO_UNDEF
  // variant is lowered; without them the ZERO_UNDEF variant is a libcall and
  // G_CTLZ is lowered.
  // NOTE(review): the type lists below are written {s32, s32} (s32 listed
  // twice) rather than as a {{s32, s32}} pair like the shift rules above --
  // confirm whether a type pair was intended.
  if (ST.hasV5TOps()) {
    getActionDefinitionsBuilder(G_CTLZ)
        .legalFor({s32, s32})
        .clampScalar(1, s32, s32)
        .clampScalar(0, s32, s32);
    getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF)
        .lowerFor({s32, s32})
        .clampScalar(1, s32, s32)
        .clampScalar(0, s32, s32);
  } else {
    getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF)
        .libcallFor({s32, s32})
        .clampScalar(1, s32, s32)
        .clampScalar(0, s32, s32);
    getActionDefinitionsBuilder(G_CTLZ)
        .lowerFor({s32, s32})
        .clampScalar(1, s32, s32)
        .clampScalar(0, s32, s32);
  }

  LegacyInfo.computeTables();
  verify(*ST.getInstrInfo());
}

/// Fill FCmp32Libcalls / FCmp64Libcalls for AEABI targets.
///
/// Each table is indexed by the FCmp predicate and holds one or two
/// {libcall, predicate} entries. As consumed by legalizeCustom, an entry whose
/// predicate is BAD_ICMP_PREDICATE has its libcall result truncated directly
/// to the final value, any other predicate is used to compare the libcall
/// result against zero, and two entries have their results OR-ed together.
void ARMLegalizerInfo::setFCmpLibcallsAEABI() {
  // FCMP_TRUE and FCMP_FALSE don't need libcalls, they should be
  // default-initialized.
  FCmp32Libcalls.resize(CmpInst::LAST_FCMP_PREDICATE + 1);
  FCmp32Libcalls[CmpInst::FCMP_OEQ] = {
      {RTLIB::OEQ_F32, CmpInst::BAD_ICMP_PREDICATE}};
  FCmp32Libcalls[CmpInst::FCMP_OGE] = {
      {RTLIB::OGE_F32, CmpInst::BAD_ICMP_PREDICATE}};
  FCmp32Libcalls[CmpInst::FCMP_OGT] = {
      {RTLIB::OGT_F32, CmpInst::BAD_ICMP_PREDICATE}};
  FCmp32Libcalls[CmpInst::FCMP_OLE] = {
      {RTLIB::OLE_F32, CmpInst::BAD_ICMP_PREDICATE}};
  FCmp32Libcalls[CmpInst::FCMP_OLT] = {
      {RTLIB::OLT_F32, CmpInst::BAD_ICMP_PREDICATE}};
  // The entries below use the libcall for the opposite condition and test its
  // result for equality with zero.
  FCmp32Libcalls[CmpInst::FCMP_ORD] = {{RTLIB::UO_F32, CmpInst::ICMP_EQ}};
  FCmp32Libcalls[CmpInst::FCMP_UGE] = {{RTLIB::OLT_F32, CmpInst::ICMP_EQ}};
  FCmp32Libcalls[CmpInst::FCMP_UGT] = {{RTLIB::OLE_F32, CmpInst::ICMP_EQ}};
  FCmp32Libcalls[CmpInst::FCMP_ULE] = {{RTLIB::OGT_F32, CmpInst::ICMP_EQ}};
  FCmp32Libcalls[CmpInst::FCMP_ULT] = {{RTLIB::OGE_F32, CmpInst::ICMP_EQ}};
  FCmp32Libcalls[CmpInst::FCMP_UNE] = {{RTLIB::UNE_F32, CmpInst::ICMP_EQ}};
  FCmp32Libcalls[CmpInst::FCMP_UNO] = {
      {RTLIB::UO_F32, CmpInst::BAD_ICMP_PREDICATE}};
  // Two-libcall predicates: the individual results are OR-ed.
  FCmp32Libcalls[CmpInst::FCMP_ONE] = {
      {RTLIB::OGT_F32, CmpInst::BAD_ICMP_PREDICATE},
      {RTLIB::OLT_F32, CmpInst::BAD_ICMP_PREDICATE}};
  FCmp32Libcalls[CmpInst::FCMP_UEQ] = {
      {RTLIB::OEQ_F32, CmpInst::BAD_ICMP_PREDICATE},
      {RTLIB::UO_F32, CmpInst::BAD_ICMP_PREDICATE}};

  // Same layout for 64-bit operands.
  FCmp64Libcalls.resize(CmpInst::LAST_FCMP_PREDICATE + 1);
  FCmp64Libcalls[CmpInst::FCMP_OEQ] = {
      {RTLIB::OEQ_F64, CmpInst::BAD_ICMP_PREDICATE}};
  FCmp64Libcalls[CmpInst::FCMP_OGE] = {
      {RTLIB::OGE_F64, CmpInst::BAD_ICMP_PREDICATE}};
  FCmp64Libcalls[CmpInst::FCMP_OGT] = {
      {RTLIB::OGT_F64, CmpInst::BAD_ICMP_PREDICATE}};
  FCmp64Libcalls[CmpInst::FCMP_OLE] = {
      {RTLIB::OLE_F64, CmpInst::BAD_ICMP_PREDICATE}};
  FCmp64Libcalls[CmpInst::FCMP_OLT] = {
      {RTLIB::OLT_F64, CmpInst::BAD_ICMP_PREDICATE}};
  FCmp64Libcalls[CmpInst::FCMP_ORD] = {{RTLIB::UO_F64, CmpInst::ICMP_EQ}};
  FCmp64Libcalls[CmpInst::FCMP_UGE] = {{RTLIB::OLT_F64, CmpInst::ICMP_EQ}};
  FCmp64Libcalls[CmpInst::FCMP_UGT] = {{RTLIB::OLE_F64, CmpInst::ICMP_EQ}};
  FCmp64Libcalls[CmpInst::FCMP_ULE] = {{RTLIB::OGT_F64, CmpInst::ICMP_EQ}};
  FCmp64Libcalls[CmpInst::FCMP_ULT] = {{RTLIB::OGE_F64, CmpInst::ICMP_EQ}};
  FCmp64Libcalls[CmpInst::FCMP_UNE] = {{RTLIB::UNE_F64, CmpInst::ICMP_EQ}};
  FCmp64Libcalls[CmpInst::FCMP_UNO] = {
      {RTLIB::UO_F64, CmpInst::BAD_ICMP_PREDICATE}};
  FCmp64Libcalls[CmpInst::FCMP_ONE] = {
      {RTLIB::OGT_F64, CmpInst::BAD_ICMP_PREDICATE},
      {RTLIB::OLT_F64, CmpInst::BAD_ICMP_PREDICATE}};
  FCmp64Libcalls[CmpInst::FCMP_UEQ] = {
      {RTLIB::OEQ_F64, CmpInst::BAD_ICMP_PREDICATE},
      {RTLIB::UO_F64, CmpInst::BAD_ICMP_PREDICATE}};
}

/// Fill FCmp32Libcalls / FCmp64Libcalls for non-AEABI targets.
///
/// Same table layout as setFCmpLibcallsAEABI, but every entry carries an
/// integer predicate, so legalizeCustom always compares the libcall result
/// against zero with that predicate instead of truncating it.
void ARMLegalizerInfo::setFCmpLibcallsGNU() {
  // FCMP_TRUE and FCMP_FALSE don't need libcalls, they should be
  // default-initialized.
  FCmp32Libcalls.resize(CmpInst::LAST_FCMP_PREDICATE + 1);
  FCmp32Libcalls[CmpInst::FCMP_OEQ] = {{RTLIB::OEQ_F32, CmpInst::ICMP_EQ}};
  FCmp32Libcalls[CmpInst::FCMP_OGE] = {{RTLIB::OGE_F32, CmpInst::ICMP_SGE}};
  FCmp32Libcalls[CmpInst::FCMP_OGT] = {{RTLIB::OGT_F32, CmpInst::ICMP_SGT}};
  FCmp32Libcalls[CmpInst::FCMP_OLE] = {{RTLIB::OLE_F32, CmpInst::ICMP_SLE}};
  FCmp32Libcalls[CmpInst::FCMP_OLT] = {{RTLIB::OLT_F32, CmpInst::ICMP_SLT}};
  FCmp32Libcalls[CmpInst::FCMP_ORD] = {{RTLIB::UO_F32, CmpInst::ICMP_EQ}};
  FCmp32Libcalls[CmpInst::FCMP_UGE] = {{RTLIB::OLT_F32, CmpInst::ICMP_SGE}};
  FCmp32Libcalls[CmpInst::FCMP_UGT] = {{RTLIB::OLE_F32, CmpInst::ICMP_SGT}};
  FCmp32Libcalls[CmpInst::FCMP_ULE] = {{RTLIB::OGT_F32, CmpInst::ICMP_SLE}};
  FCmp32Libcalls[CmpInst::FCMP_ULT] = {{RTLIB::OGE_F32, CmpInst::ICMP_SLT}};
  FCmp32Libcalls[CmpInst::FCMP_UNE] = {{RTLIB::UNE_F32, CmpInst::ICMP_NE}};
  FCmp32Libcalls[CmpInst::FCMP_UNO] = {{RTLIB::UO_F32, CmpInst::ICMP_NE}};
  // Two-libcall predicates: the individual results are OR-ed.
  FCmp32Libcalls[CmpInst::FCMP_ONE] = {{RTLIB::OGT_F32, CmpInst::ICMP_SGT},
                                       {RTLIB::OLT_F32, CmpInst::ICMP_SLT}};
  FCmp32Libcalls[CmpInst::FCMP_UEQ] = {{RTLIB::OEQ_F32, CmpInst::ICMP_EQ},
                                       {RTLIB::UO_F32, CmpInst::ICMP_NE}};

  // Same layout for 64-bit operands.
  FCmp64Libcalls.resize(CmpInst::LAST_FCMP_PREDICATE + 1);
  FCmp64Libcalls[CmpInst::FCMP_OEQ] = {{RTLIB::OEQ_F64, CmpInst::ICMP_EQ}};
  FCmp64Libcalls[CmpInst::FCMP_OGE] = {{RTLIB::OGE_F64, CmpInst::ICMP_SGE}};
  FCmp64Libcalls[CmpInst::FCMP_OGT] = {{RTLIB::OGT_F64, CmpInst::ICMP_SGT}};
  FCmp64Libcalls[CmpInst::FCMP_OLE] = {{RTLIB::OLE_F64, CmpInst::ICMP_SLE}};
  FCmp64Libcalls[CmpInst::FCMP_OLT] = {{RTLIB::OLT_F64, CmpInst::ICMP_SLT}};
  FCmp64Libcalls[CmpInst::FCMP_ORD] = {{RTLIB::UO_F64, CmpInst::ICMP_EQ}};
  FCmp64Libcalls[CmpInst::FCMP_UGE] = {{RTLIB::OLT_F64, CmpInst::ICMP_SGE}};
  FCmp64Libcalls[CmpInst::FCMP_UGT] = {{RTLIB::OLE_F64, CmpInst::ICMP_SGT}};
  FCmp64Libcalls[CmpInst::FCMP_ULE] = {{RTLIB::OGT_F64, CmpInst::ICMP_SLE}};
  FCmp64Libcalls[CmpInst::FCMP_ULT] = {{RTLIB::OGE_F64, CmpInst::ICMP_SLT}};
  FCmp64Libcalls[CmpInst::FCMP_UNE] = {{RTLIB::UNE_F64, CmpInst::ICMP_NE}};
  FCmp64Libcalls[CmpInst::FCMP_UNO] = {{RTLIB::UO_F64, CmpInst::ICMP_NE}};
  FCmp64Libcalls[CmpInst::FCMP_ONE] = {{RTLIB::OGT_F64, CmpInst::ICMP_SGT},
                                       {RTLIB::OLT_F64, CmpInst::ICMP_SLT}};
  FCmp64Libcalls[CmpInst::FCMP_UEQ] = {{RTLIB::OEQ_F64, CmpInst::ICMP_EQ},
                                       {RTLIB::UO_F64, CmpInst::ICMP_NE}};
}

/// Look up the libcalls needed to implement a floating-point comparison.
///
/// \param Predicate the FCmp predicate; asserted to be an FP predicate.
/// \param Size      operand size in bits; only 32 and 64 are handled, any
///                  other value reaches llvm_unreachable.
/// \returns the table entry for \p Predicate from FCmp32Libcalls or
///          FCmp64Libcalls.
ARMLegalizerInfo::FCmpLibcallsList
ARMLegalizerInfo::getFCmpLibcalls(CmpInst::Predicate Predicate,
                                  unsigned Size) const {
  assert(CmpInst::isFPPredicate(Predicate) && "Unsupported FCmp predicate");
  if (Size == 32)
    return FCmp32Libcalls[Predicate];
  if (Size == 64)
    return FCmp64Libcalls[Predicate];
  llvm_unreachable("Unsupported size for FCmp predicate");
}

/// Custom legalization for G_SREM / G_UREM, G_FCMP and G_FCONSTANT.
///
/// \param Helper      legalizer helper; its MIRBuilder is used to emit the
///                    replacement instructions.
/// \param MI          the instruction to legalize; erased on success.
/// \param LocObserver forwarded to createLibcall.
/// \returns true if \p MI was replaced and erased; false for any other
///          opcode, for a remainder whose result is not 32 bits wide, or when
///          creating a libcall does not report Legalized.
bool ARMLegalizerInfo::legalizeCustom(LegalizerHelper &Helper, MachineInstr &MI,
                                      LostDebugLocObserver &LocObserver) const {
  using namespace TargetOpcode;

  MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
  MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
  LLVMContext &Ctx = MIRBuilder.getMF().getFunction().getContext();

  switch (MI.getOpcode()) {
  default:
    return false;
  case G_SREM:
  case G_UREM: {
    Register OriginalResult = MI.getOperand(0).getReg();
    auto Size = MRI.getType(OriginalResult).getSizeInBits();
    if (Size != 32)
      return false;

    auto Libcall =
        MI.getOpcode() == G_SREM ? RTLIB::SDIVREM_I32 : RTLIB::UDIVREM_I32;

    // Our divmod libcalls return a struct containing the quotient and the
    // remainder. Create a new, unused register for the quotient and use the
    // destination of the original instruction for the remainder.
    Type *ArgTy = Type::getInt32Ty(Ctx);
    StructType *RetTy = StructType::get(Ctx, {ArgTy, ArgTy}, /* Packed */ true);
    Register RetRegs[] = {MRI.createGenericVirtualRegister(LLT::scalar(32)),
                          OriginalResult};
    auto Status = createLibcall(MIRBuilder, Libcall, {RetRegs, RetTy, 0},
                                {{MI.getOperand(1).getReg(), ArgTy, 0},
                                 {MI.getOperand(2).getReg(), ArgTy, 0}},
                                LocObserver, &MI);
    if (Status != LegalizerHelper::Legalized)
      return false;
    break;
  }
  case G_FCMP: {
    assert(MRI.getType(MI.getOperand(2).getReg()) ==
               MRI.getType(MI.getOperand(3).getReg()) &&
           "Mismatched operands for G_FCMP");
    auto OpSize = MRI.getType(MI.getOperand(2).getReg()).getSizeInBits();

    auto OriginalResult = MI.getOperand(0).getReg();
    auto Predicate =
        static_cast<CmpInst::Predicate>(MI.getOperand(1).getPredicate());
    auto Libcalls = getFCmpLibcalls(Predicate, OpSize);

    // No libcalls registered: only valid for the always-true / always-false
    // predicates, which fold to a constant result.
    if (Libcalls.empty()) {
      assert((Predicate == CmpInst::FCMP_TRUE ||
              Predicate == CmpInst::FCMP_FALSE) &&
             "Predicate needs libcalls, but none specified");
      MIRBuilder.buildConstant(OriginalResult,
                               Predicate == CmpInst::FCMP_TRUE ? 1 : 0);
      MI.eraseFromParent();
      return true;
    }

    assert((OpSize == 32 || OpSize == 64) && "Unsupported operand size");
    auto *ArgTy = OpSize == 32 ? Type::getFloatTy(Ctx) : Type::getDoubleTy(Ctx);
    auto *RetTy = Type::getInt32Ty(Ctx);

    SmallVector<Register, 2> Results;
    for (auto Libcall : Libcalls) {
      auto LibcallResult = MRI.createGenericVirtualRegister(LLT::scalar(32));
      auto Status = createLibcall(MIRBuilder, Libcall.LibcallID,
                                  {LibcallResult, RetTy, 0},
                                  {{MI.getOperand(2).getReg(), ArgTy, 0},
                                   {MI.getOperand(3).getReg(), ArgTy, 0}},
                                  LocObserver, &MI);

      if (Status != LegalizerHelper::Legalized)
        return false;

      // With a single libcall the processed value is written straight into
      // the original destination; with two, each gets a fresh register of the
      // destination's type so the values can be combined afterwards.
      auto ProcessedResult =
          Libcalls.size() == 1
              ? OriginalResult
              : MRI.createGenericVirtualRegister(MRI.getType(OriginalResult));

      // We have a result, but we need to transform it into a proper 1-bit 0 or
      // 1, taking into account the different peculiarities of the values
      // returned by the comparison functions.
      CmpInst::Predicate ResultPred = Libcall.Predicate;
      if (ResultPred == CmpInst::BAD_ICMP_PREDICATE) {
        // We have a nice 0 or 1, and we just need to truncate it back to 1 bit
        // to keep the types consistent.
        MIRBuilder.buildTrunc(ProcessedResult, LibcallResult);
      } else {
        // We need to compare against 0.
        assert(CmpInst::isIntPredicate(ResultPred) && "Unsupported predicate");
        auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
        MIRBuilder.buildICmp(ResultPred, ProcessedResult, LibcallResult, Zero);
      }
      Results.push_back(ProcessedResult);
    }

    // Two partial results are OR-ed into the original destination.
    if (Results.size() != 1) {
      assert(Results.size() == 2 && "Unexpected number of results");
      MIRBuilder.buildOr(OriginalResult, Results[0], Results[1]);
    }
    break;
  }
  case G_FCONSTANT: {
    // Convert to integer constants, while preserving the binary representation.
    auto AsInteger =
        MI.getOperand(1).getFPImm()->getValueAPF().bitcastToAPInt();
    MIRBuilder.buildConstant(MI.getOperand(0),
                             *ConstantInt::get(Ctx, AsInteger));
    break;
  }
  }

  // Every case that breaks out of the switch has emitted a replacement for MI.
  MI.eraseFromParent();
  return true;
}