10b57cec5SDimitry Andric //===-- HexagonISelDAGToDAG.cpp - A dag to dag inst selector for Hexagon --===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric //
90b57cec5SDimitry Andric // This file defines an instruction selector for the Hexagon target.
100b57cec5SDimitry Andric //
110b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
120b57cec5SDimitry Andric
130b57cec5SDimitry Andric #include "HexagonISelDAGToDAG.h"
14480093f4SDimitry Andric #include "Hexagon.h"
150b57cec5SDimitry Andric #include "HexagonISelLowering.h"
160b57cec5SDimitry Andric #include "HexagonMachineFunctionInfo.h"
170b57cec5SDimitry Andric #include "HexagonTargetMachine.h"
180b57cec5SDimitry Andric #include "llvm/CodeGen/FunctionLoweringInfo.h"
190b57cec5SDimitry Andric #include "llvm/CodeGen/MachineInstrBuilder.h"
200b57cec5SDimitry Andric #include "llvm/CodeGen/SelectionDAGISel.h"
210b57cec5SDimitry Andric #include "llvm/IR/Intrinsics.h"
22480093f4SDimitry Andric #include "llvm/IR/IntrinsicsHexagon.h"
230b57cec5SDimitry Andric #include "llvm/Support/CommandLine.h"
240b57cec5SDimitry Andric #include "llvm/Support/Debug.h"
250b57cec5SDimitry Andric using namespace llvm;
260b57cec5SDimitry Andric
270b57cec5SDimitry Andric #define DEBUG_TYPE "hexagon-isel"
28bdd1243dSDimitry Andric #define PASS_NAME "Hexagon DAG->DAG Pattern Instruction Selection"
290b57cec5SDimitry Andric
300b57cec5SDimitry Andric static
310b57cec5SDimitry Andric cl::opt<bool>
320b57cec5SDimitry Andric EnableAddressRebalancing("isel-rebalance-addr", cl::Hidden, cl::init(true),
330b57cec5SDimitry Andric cl::desc("Rebalance address calculation trees to improve "
340b57cec5SDimitry Andric "instruction selection"));
350b57cec5SDimitry Andric
360b57cec5SDimitry Andric // Rebalance only if this allows e.g. combining a GA with an offset or
370b57cec5SDimitry Andric // factoring out a shift.
380b57cec5SDimitry Andric static
390b57cec5SDimitry Andric cl::opt<bool>
400b57cec5SDimitry Andric RebalanceOnlyForOptimizations("rebalance-only-opt", cl::Hidden, cl::init(false),
410b57cec5SDimitry Andric cl::desc("Rebalance address tree only if this allows optimizations"));
420b57cec5SDimitry Andric
430b57cec5SDimitry Andric static
440b57cec5SDimitry Andric cl::opt<bool>
450b57cec5SDimitry Andric RebalanceOnlyImbalancedTrees("rebalance-only-imbal", cl::Hidden,
460b57cec5SDimitry Andric cl::init(false), cl::desc("Rebalance address tree only if it is imbalanced"));
470b57cec5SDimitry Andric
480b57cec5SDimitry Andric static cl::opt<bool> CheckSingleUse("hexagon-isel-su", cl::Hidden,
490b57cec5SDimitry Andric cl::init(true), cl::desc("Enable checking of SDNode's single-use status"));
500b57cec5SDimitry Andric
510b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
520b57cec5SDimitry Andric // Instruction Selector Implementation
530b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
540b57cec5SDimitry Andric
550b57cec5SDimitry Andric #define GET_DAGISEL_BODY HexagonDAGToDAGISel
560b57cec5SDimitry Andric #include "HexagonGenDAGISel.inc"
570b57cec5SDimitry Andric
58fe6060f1SDimitry Andric namespace llvm {
590b57cec5SDimitry Andric /// createHexagonISelDag - This pass converts a legalized DAG into a
600b57cec5SDimitry Andric /// Hexagon-specific DAG, ready for instruction scheduling.
createHexagonISelDag(HexagonTargetMachine & TM,CodeGenOptLevel OptLevel)610b57cec5SDimitry Andric FunctionPass *createHexagonISelDag(HexagonTargetMachine &TM,
625f757f3fSDimitry Andric CodeGenOptLevel OptLevel) {
63*0fca6ea1SDimitry Andric return new HexagonDAGToDAGISelLegacy(TM, OptLevel);
640b57cec5SDimitry Andric }
650b57cec5SDimitry Andric }
660b57cec5SDimitry Andric
HexagonDAGToDAGISelLegacy(HexagonTargetMachine & tm,CodeGenOptLevel OptLevel)67*0fca6ea1SDimitry Andric HexagonDAGToDAGISelLegacy::HexagonDAGToDAGISelLegacy(HexagonTargetMachine &tm,
68*0fca6ea1SDimitry Andric CodeGenOptLevel OptLevel)
69*0fca6ea1SDimitry Andric : SelectionDAGISelLegacy(
70*0fca6ea1SDimitry Andric ID, std::make_unique<HexagonDAGToDAGISel>(tm, OptLevel)) {}
71bdd1243dSDimitry Andric
72*0fca6ea1SDimitry Andric char HexagonDAGToDAGISelLegacy::ID = 0;
73*0fca6ea1SDimitry Andric
INITIALIZE_PASS(HexagonDAGToDAGISelLegacy,DEBUG_TYPE,PASS_NAME,false,false)74*0fca6ea1SDimitry Andric INITIALIZE_PASS(HexagonDAGToDAGISelLegacy, DEBUG_TYPE, PASS_NAME, false, false)
75bdd1243dSDimitry Andric
760b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectIndexedLoad(LoadSDNode *LD, const SDLoc &dl) {
770b57cec5SDimitry Andric SDValue Chain = LD->getChain();
780b57cec5SDimitry Andric SDValue Base = LD->getBasePtr();
790b57cec5SDimitry Andric SDValue Offset = LD->getOffset();
800b57cec5SDimitry Andric int32_t Inc = cast<ConstantSDNode>(Offset.getNode())->getSExtValue();
810b57cec5SDimitry Andric EVT LoadedVT = LD->getMemoryVT();
820b57cec5SDimitry Andric unsigned Opcode = 0;
830b57cec5SDimitry Andric
840b57cec5SDimitry Andric // Check for zero extended loads. Treat any-extend loads as zero extended
850b57cec5SDimitry Andric // loads.
860b57cec5SDimitry Andric ISD::LoadExtType ExtType = LD->getExtensionType();
870b57cec5SDimitry Andric bool IsZeroExt = (ExtType == ISD::ZEXTLOAD || ExtType == ISD::EXTLOAD);
880b57cec5SDimitry Andric bool IsValidInc = HII->isValidAutoIncImm(LoadedVT, Inc);
890b57cec5SDimitry Andric
900b57cec5SDimitry Andric assert(LoadedVT.isSimple());
910b57cec5SDimitry Andric switch (LoadedVT.getSimpleVT().SimpleTy) {
920b57cec5SDimitry Andric case MVT::i8:
930b57cec5SDimitry Andric if (IsZeroExt)
940b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::L2_loadrub_pi : Hexagon::L2_loadrub_io;
950b57cec5SDimitry Andric else
960b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::L2_loadrb_pi : Hexagon::L2_loadrb_io;
970b57cec5SDimitry Andric break;
980b57cec5SDimitry Andric case MVT::i16:
990b57cec5SDimitry Andric if (IsZeroExt)
1000b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::L2_loadruh_pi : Hexagon::L2_loadruh_io;
1010b57cec5SDimitry Andric else
1020b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::L2_loadrh_pi : Hexagon::L2_loadrh_io;
1030b57cec5SDimitry Andric break;
1040b57cec5SDimitry Andric case MVT::i32:
1050b57cec5SDimitry Andric case MVT::f32:
1060b57cec5SDimitry Andric case MVT::v2i16:
1070b57cec5SDimitry Andric case MVT::v4i8:
1080b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::L2_loadri_pi : Hexagon::L2_loadri_io;
1090b57cec5SDimitry Andric break;
1100b57cec5SDimitry Andric case MVT::i64:
1110b57cec5SDimitry Andric case MVT::f64:
1120b57cec5SDimitry Andric case MVT::v2i32:
1130b57cec5SDimitry Andric case MVT::v4i16:
1140b57cec5SDimitry Andric case MVT::v8i8:
1150b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::L2_loadrd_pi : Hexagon::L2_loadrd_io;
1160b57cec5SDimitry Andric break;
1170b57cec5SDimitry Andric case MVT::v64i8:
1180b57cec5SDimitry Andric case MVT::v32i16:
1190b57cec5SDimitry Andric case MVT::v16i32:
1200b57cec5SDimitry Andric case MVT::v8i64:
1210b57cec5SDimitry Andric case MVT::v128i8:
1220b57cec5SDimitry Andric case MVT::v64i16:
1230b57cec5SDimitry Andric case MVT::v32i32:
1240b57cec5SDimitry Andric case MVT::v16i64:
1250b57cec5SDimitry Andric if (isAlignedMemNode(LD)) {
1260b57cec5SDimitry Andric if (LD->isNonTemporal())
1270b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::V6_vL32b_nt_pi : Hexagon::V6_vL32b_nt_ai;
1280b57cec5SDimitry Andric else
1290b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::V6_vL32b_pi : Hexagon::V6_vL32b_ai;
1300b57cec5SDimitry Andric } else {
1310b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::V6_vL32Ub_pi : Hexagon::V6_vL32Ub_ai;
1320b57cec5SDimitry Andric }
1330b57cec5SDimitry Andric break;
1340b57cec5SDimitry Andric default:
1350b57cec5SDimitry Andric llvm_unreachable("Unexpected memory type in indexed load");
1360b57cec5SDimitry Andric }
1370b57cec5SDimitry Andric
1380b57cec5SDimitry Andric SDValue IncV = CurDAG->getTargetConstant(Inc, dl, MVT::i32);
1390b57cec5SDimitry Andric MachineMemOperand *MemOp = LD->getMemOperand();
1400b57cec5SDimitry Andric
1410b57cec5SDimitry Andric auto getExt64 = [this,ExtType] (MachineSDNode *N, const SDLoc &dl)
1420b57cec5SDimitry Andric -> MachineSDNode* {
1430b57cec5SDimitry Andric if (ExtType == ISD::ZEXTLOAD || ExtType == ISD::EXTLOAD) {
1440b57cec5SDimitry Andric SDValue Zero = CurDAG->getTargetConstant(0, dl, MVT::i32);
1450b57cec5SDimitry Andric return CurDAG->getMachineNode(Hexagon::A4_combineir, dl, MVT::i64,
1460b57cec5SDimitry Andric Zero, SDValue(N, 0));
1470b57cec5SDimitry Andric }
1480b57cec5SDimitry Andric if (ExtType == ISD::SEXTLOAD)
1490b57cec5SDimitry Andric return CurDAG->getMachineNode(Hexagon::A2_sxtw, dl, MVT::i64,
1500b57cec5SDimitry Andric SDValue(N, 0));
1510b57cec5SDimitry Andric return N;
1520b57cec5SDimitry Andric };
1530b57cec5SDimitry Andric
1540b57cec5SDimitry Andric // Loaded value Next address Chain
1550b57cec5SDimitry Andric SDValue From[3] = { SDValue(LD,0), SDValue(LD,1), SDValue(LD,2) };
1560b57cec5SDimitry Andric SDValue To[3];
1570b57cec5SDimitry Andric
1580b57cec5SDimitry Andric EVT ValueVT = LD->getValueType(0);
1590b57cec5SDimitry Andric if (ValueVT == MVT::i64 && ExtType != ISD::NON_EXTLOAD) {
1600b57cec5SDimitry Andric // A load extending to i64 will actually produce i32, which will then
1610b57cec5SDimitry Andric // need to be extended to i64.
1620b57cec5SDimitry Andric assert(LoadedVT.getSizeInBits() <= 32);
1630b57cec5SDimitry Andric ValueVT = MVT::i32;
1640b57cec5SDimitry Andric }
1650b57cec5SDimitry Andric
1660b57cec5SDimitry Andric if (IsValidInc) {
1670b57cec5SDimitry Andric MachineSDNode *L = CurDAG->getMachineNode(Opcode, dl, ValueVT,
1680b57cec5SDimitry Andric MVT::i32, MVT::Other, Base,
1690b57cec5SDimitry Andric IncV, Chain);
1700b57cec5SDimitry Andric CurDAG->setNodeMemRefs(L, {MemOp});
1710b57cec5SDimitry Andric To[1] = SDValue(L, 1); // Next address.
1720b57cec5SDimitry Andric To[2] = SDValue(L, 2); // Chain.
1730b57cec5SDimitry Andric // Handle special case for extension to i64.
1740b57cec5SDimitry Andric if (LD->getValueType(0) == MVT::i64)
1750b57cec5SDimitry Andric L = getExt64(L, dl);
1760b57cec5SDimitry Andric To[0] = SDValue(L, 0); // Loaded (extended) value.
1770b57cec5SDimitry Andric } else {
1780b57cec5SDimitry Andric SDValue Zero = CurDAG->getTargetConstant(0, dl, MVT::i32);
1790b57cec5SDimitry Andric MachineSDNode *L = CurDAG->getMachineNode(Opcode, dl, ValueVT, MVT::Other,
1800b57cec5SDimitry Andric Base, Zero, Chain);
1810b57cec5SDimitry Andric CurDAG->setNodeMemRefs(L, {MemOp});
1820b57cec5SDimitry Andric To[2] = SDValue(L, 1); // Chain.
1830b57cec5SDimitry Andric MachineSDNode *A = CurDAG->getMachineNode(Hexagon::A2_addi, dl, MVT::i32,
1840b57cec5SDimitry Andric Base, IncV);
1850b57cec5SDimitry Andric To[1] = SDValue(A, 0); // Next address.
1860b57cec5SDimitry Andric // Handle special case for extension to i64.
1870b57cec5SDimitry Andric if (LD->getValueType(0) == MVT::i64)
1880b57cec5SDimitry Andric L = getExt64(L, dl);
1890b57cec5SDimitry Andric To[0] = SDValue(L, 0); // Loaded (extended) value.
1900b57cec5SDimitry Andric }
1910b57cec5SDimitry Andric ReplaceUses(From, To, 3);
1920b57cec5SDimitry Andric CurDAG->RemoveDeadNode(LD);
1930b57cec5SDimitry Andric }
1940b57cec5SDimitry Andric
LoadInstrForLoadIntrinsic(SDNode * IntN)1950b57cec5SDimitry Andric MachineSDNode *HexagonDAGToDAGISel::LoadInstrForLoadIntrinsic(SDNode *IntN) {
1960b57cec5SDimitry Andric if (IntN->getOpcode() != ISD::INTRINSIC_W_CHAIN)
1970b57cec5SDimitry Andric return nullptr;
1980b57cec5SDimitry Andric
1990b57cec5SDimitry Andric SDLoc dl(IntN);
200647cbc5dSDimitry Andric unsigned IntNo = IntN->getConstantOperandVal(1);
2010b57cec5SDimitry Andric
2020b57cec5SDimitry Andric static std::map<unsigned,unsigned> LoadPciMap = {
2030b57cec5SDimitry Andric { Intrinsic::hexagon_circ_ldb, Hexagon::L2_loadrb_pci },
2040b57cec5SDimitry Andric { Intrinsic::hexagon_circ_ldub, Hexagon::L2_loadrub_pci },
2050b57cec5SDimitry Andric { Intrinsic::hexagon_circ_ldh, Hexagon::L2_loadrh_pci },
2060b57cec5SDimitry Andric { Intrinsic::hexagon_circ_lduh, Hexagon::L2_loadruh_pci },
2070b57cec5SDimitry Andric { Intrinsic::hexagon_circ_ldw, Hexagon::L2_loadri_pci },
2080b57cec5SDimitry Andric { Intrinsic::hexagon_circ_ldd, Hexagon::L2_loadrd_pci },
2090b57cec5SDimitry Andric };
2100b57cec5SDimitry Andric auto FLC = LoadPciMap.find(IntNo);
2110b57cec5SDimitry Andric if (FLC != LoadPciMap.end()) {
2120b57cec5SDimitry Andric EVT ValTy = (IntNo == Intrinsic::hexagon_circ_ldd) ? MVT::i64 : MVT::i32;
2130b57cec5SDimitry Andric EVT RTys[] = { ValTy, MVT::i32, MVT::Other };
2140b57cec5SDimitry Andric // Operands: { Base, Increment, Modifier, Chain }
2150b57cec5SDimitry Andric auto Inc = cast<ConstantSDNode>(IntN->getOperand(5));
2160b57cec5SDimitry Andric SDValue I = CurDAG->getTargetConstant(Inc->getSExtValue(), dl, MVT::i32);
2170b57cec5SDimitry Andric MachineSDNode *Res = CurDAG->getMachineNode(FLC->second, dl, RTys,
2180b57cec5SDimitry Andric { IntN->getOperand(2), I, IntN->getOperand(4),
2190b57cec5SDimitry Andric IntN->getOperand(0) });
2200b57cec5SDimitry Andric return Res;
2210b57cec5SDimitry Andric }
2220b57cec5SDimitry Andric
2230b57cec5SDimitry Andric return nullptr;
2240b57cec5SDimitry Andric }
2250b57cec5SDimitry Andric
StoreInstrForLoadIntrinsic(MachineSDNode * LoadN,SDNode * IntN)2260b57cec5SDimitry Andric SDNode *HexagonDAGToDAGISel::StoreInstrForLoadIntrinsic(MachineSDNode *LoadN,
2270b57cec5SDimitry Andric SDNode *IntN) {
2280b57cec5SDimitry Andric // The "LoadN" is just a machine load instruction. The intrinsic also
2290b57cec5SDimitry Andric // involves storing it. Generate an appropriate store to the location
2300b57cec5SDimitry Andric // given in the intrinsic's operand(3).
2310b57cec5SDimitry Andric uint64_t F = HII->get(LoadN->getMachineOpcode()).TSFlags;
2320b57cec5SDimitry Andric unsigned SizeBits = (F >> HexagonII::MemAccessSizePos) &
2330b57cec5SDimitry Andric HexagonII::MemAccesSizeMask;
2340b57cec5SDimitry Andric unsigned Size = 1U << (SizeBits-1);
2350b57cec5SDimitry Andric
2360b57cec5SDimitry Andric SDLoc dl(IntN);
2370b57cec5SDimitry Andric MachinePointerInfo PI;
2380b57cec5SDimitry Andric SDValue TS;
2390b57cec5SDimitry Andric SDValue Loc = IntN->getOperand(3);
2400b57cec5SDimitry Andric
2410b57cec5SDimitry Andric if (Size >= 4)
2420b57cec5SDimitry Andric TS = CurDAG->getStore(SDValue(LoadN, 2), dl, SDValue(LoadN, 0), Loc, PI,
243e8d8bef9SDimitry Andric Align(Size));
2440b57cec5SDimitry Andric else
2450b57cec5SDimitry Andric TS = CurDAG->getTruncStore(SDValue(LoadN, 2), dl, SDValue(LoadN, 0), Loc,
246e8d8bef9SDimitry Andric PI, MVT::getIntegerVT(Size * 8), Align(Size));
2470b57cec5SDimitry Andric
2480b57cec5SDimitry Andric SDNode *StoreN;
2490b57cec5SDimitry Andric {
2500b57cec5SDimitry Andric HandleSDNode Handle(TS);
2510b57cec5SDimitry Andric SelectStore(TS.getNode());
2520b57cec5SDimitry Andric StoreN = Handle.getValue().getNode();
2530b57cec5SDimitry Andric }
2540b57cec5SDimitry Andric
2550b57cec5SDimitry Andric // Load's results are { Loaded value, Updated pointer, Chain }
2560b57cec5SDimitry Andric ReplaceUses(SDValue(IntN, 0), SDValue(LoadN, 1));
2570b57cec5SDimitry Andric ReplaceUses(SDValue(IntN, 1), SDValue(StoreN, 0));
2580b57cec5SDimitry Andric return StoreN;
2590b57cec5SDimitry Andric }
2600b57cec5SDimitry Andric
tryLoadOfLoadIntrinsic(LoadSDNode * N)2610b57cec5SDimitry Andric bool HexagonDAGToDAGISel::tryLoadOfLoadIntrinsic(LoadSDNode *N) {
2620b57cec5SDimitry Andric // The intrinsics for load circ/brev perform two operations:
2630b57cec5SDimitry Andric // 1. Load a value V from the specified location, using the addressing
2640b57cec5SDimitry Andric // mode corresponding to the intrinsic.
2650b57cec5SDimitry Andric // 2. Store V into a specified location. This location is typically a
2660b57cec5SDimitry Andric // local, temporary object.
2670b57cec5SDimitry Andric // In many cases, the program using these intrinsics will immediately
2680b57cec5SDimitry Andric // load V again from the local object. In those cases, when certain
2690b57cec5SDimitry Andric // conditions are met, the last load can be removed.
2700b57cec5SDimitry Andric // This function identifies and optimizes this pattern. If the pattern
2710b57cec5SDimitry Andric // cannot be optimized, it returns nullptr, which will cause the load
2720b57cec5SDimitry Andric // to be selected separately from the intrinsic (which will be handled
2730b57cec5SDimitry Andric // in SelectIntrinsicWChain).
2740b57cec5SDimitry Andric
2750b57cec5SDimitry Andric SDValue Ch = N->getOperand(0);
2760b57cec5SDimitry Andric SDValue Loc = N->getOperand(1);
2770b57cec5SDimitry Andric
2780b57cec5SDimitry Andric // Assume that the load and the intrinsic are connected directly with a
2790b57cec5SDimitry Andric // chain:
2800b57cec5SDimitry Andric // t1: i32,ch = int.load ..., ..., ..., Loc, ... // <-- C
2810b57cec5SDimitry Andric // t2: i32,ch = load t1:1, Loc, ...
2820b57cec5SDimitry Andric SDNode *C = Ch.getNode();
2830b57cec5SDimitry Andric
2840b57cec5SDimitry Andric if (C->getOpcode() != ISD::INTRINSIC_W_CHAIN)
2850b57cec5SDimitry Andric return false;
2860b57cec5SDimitry Andric
2870b57cec5SDimitry Andric // The second load can only be eliminated if its extension type matches
2880b57cec5SDimitry Andric // that of the load instruction corresponding to the intrinsic. The user
2890b57cec5SDimitry Andric // can provide an address of an unsigned variable to store the result of
2900b57cec5SDimitry Andric // a sign-extending intrinsic into (or the other way around).
2910b57cec5SDimitry Andric ISD::LoadExtType IntExt;
292647cbc5dSDimitry Andric switch (C->getConstantOperandVal(1)) {
2930b57cec5SDimitry Andric case Intrinsic::hexagon_circ_ldub:
2940b57cec5SDimitry Andric case Intrinsic::hexagon_circ_lduh:
2950b57cec5SDimitry Andric IntExt = ISD::ZEXTLOAD;
2960b57cec5SDimitry Andric break;
2970b57cec5SDimitry Andric case Intrinsic::hexagon_circ_ldw:
2980b57cec5SDimitry Andric case Intrinsic::hexagon_circ_ldd:
2990b57cec5SDimitry Andric IntExt = ISD::NON_EXTLOAD;
3000b57cec5SDimitry Andric break;
3010b57cec5SDimitry Andric default:
3020b57cec5SDimitry Andric IntExt = ISD::SEXTLOAD;
3030b57cec5SDimitry Andric break;
3040b57cec5SDimitry Andric }
3050b57cec5SDimitry Andric if (N->getExtensionType() != IntExt)
3060b57cec5SDimitry Andric return false;
3070b57cec5SDimitry Andric
3080b57cec5SDimitry Andric // Make sure the target location for the loaded value in the load intrinsic
3090b57cec5SDimitry Andric // is the location from which LD (or N) is loading.
3100b57cec5SDimitry Andric if (C->getNumOperands() < 4 || Loc.getNode() != C->getOperand(3).getNode())
3110b57cec5SDimitry Andric return false;
3120b57cec5SDimitry Andric
3130b57cec5SDimitry Andric if (MachineSDNode *L = LoadInstrForLoadIntrinsic(C)) {
3140b57cec5SDimitry Andric SDNode *S = StoreInstrForLoadIntrinsic(L, C);
3150b57cec5SDimitry Andric SDValue F[] = { SDValue(N,0), SDValue(N,1), SDValue(C,0), SDValue(C,1) };
3160b57cec5SDimitry Andric SDValue T[] = { SDValue(L,0), SDValue(S,0), SDValue(L,1), SDValue(S,0) };
317bdd1243dSDimitry Andric ReplaceUses(F, T, std::size(T));
3180b57cec5SDimitry Andric // This transformation will leave the intrinsic dead. If it remains in
3190b57cec5SDimitry Andric // the DAG, the selection code will see it again, but without the load,
3200b57cec5SDimitry Andric // and it will generate a store that is normally required for it.
3210b57cec5SDimitry Andric CurDAG->RemoveDeadNode(C);
3220b57cec5SDimitry Andric return true;
3230b57cec5SDimitry Andric }
3240b57cec5SDimitry Andric return false;
3250b57cec5SDimitry Andric }
3260b57cec5SDimitry Andric
3270b57cec5SDimitry Andric // Convert the bit-reverse load intrinsic to appropriate target instruction.
SelectBrevLdIntrinsic(SDNode * IntN)3280b57cec5SDimitry Andric bool HexagonDAGToDAGISel::SelectBrevLdIntrinsic(SDNode *IntN) {
3290b57cec5SDimitry Andric if (IntN->getOpcode() != ISD::INTRINSIC_W_CHAIN)
3300b57cec5SDimitry Andric return false;
3310b57cec5SDimitry Andric
3320b57cec5SDimitry Andric const SDLoc &dl(IntN);
333647cbc5dSDimitry Andric unsigned IntNo = IntN->getConstantOperandVal(1);
3340b57cec5SDimitry Andric
3350b57cec5SDimitry Andric static const std::map<unsigned, unsigned> LoadBrevMap = {
3360b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadrb_pbr, Hexagon::L2_loadrb_pbr },
3370b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadrub_pbr, Hexagon::L2_loadrub_pbr },
3380b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadrh_pbr, Hexagon::L2_loadrh_pbr },
3390b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadruh_pbr, Hexagon::L2_loadruh_pbr },
3400b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadri_pbr, Hexagon::L2_loadri_pbr },
3410b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadrd_pbr, Hexagon::L2_loadrd_pbr }
3420b57cec5SDimitry Andric };
3430b57cec5SDimitry Andric auto FLI = LoadBrevMap.find(IntNo);
3440b57cec5SDimitry Andric if (FLI != LoadBrevMap.end()) {
3450b57cec5SDimitry Andric EVT ValTy =
3460b57cec5SDimitry Andric (IntNo == Intrinsic::hexagon_L2_loadrd_pbr) ? MVT::i64 : MVT::i32;
3470b57cec5SDimitry Andric EVT RTys[] = { ValTy, MVT::i32, MVT::Other };
3480b57cec5SDimitry Andric // Operands of Intrinsic: {chain, enum ID of intrinsic, baseptr,
3490b57cec5SDimitry Andric // modifier}.
3500b57cec5SDimitry Andric // Operands of target instruction: { Base, Modifier, Chain }.
3510b57cec5SDimitry Andric MachineSDNode *Res = CurDAG->getMachineNode(
3520b57cec5SDimitry Andric FLI->second, dl, RTys,
3530b57cec5SDimitry Andric {IntN->getOperand(2), IntN->getOperand(3), IntN->getOperand(0)});
3540b57cec5SDimitry Andric
3550b57cec5SDimitry Andric MachineMemOperand *MemOp = cast<MemIntrinsicSDNode>(IntN)->getMemOperand();
3560b57cec5SDimitry Andric CurDAG->setNodeMemRefs(Res, {MemOp});
3570b57cec5SDimitry Andric
3580b57cec5SDimitry Andric ReplaceUses(SDValue(IntN, 0), SDValue(Res, 0));
3590b57cec5SDimitry Andric ReplaceUses(SDValue(IntN, 1), SDValue(Res, 1));
3600b57cec5SDimitry Andric ReplaceUses(SDValue(IntN, 2), SDValue(Res, 2));
3610b57cec5SDimitry Andric CurDAG->RemoveDeadNode(IntN);
3620b57cec5SDimitry Andric return true;
3630b57cec5SDimitry Andric }
3640b57cec5SDimitry Andric return false;
3650b57cec5SDimitry Andric }
3660b57cec5SDimitry Andric
367bdd1243dSDimitry Andric /// Generate a machine instruction node for the new circular buffer intrinsics.
3680b57cec5SDimitry Andric /// The new versions use a CSx register instead of the K field.
SelectNewCircIntrinsic(SDNode * IntN)3690b57cec5SDimitry Andric bool HexagonDAGToDAGISel::SelectNewCircIntrinsic(SDNode *IntN) {
3700b57cec5SDimitry Andric if (IntN->getOpcode() != ISD::INTRINSIC_W_CHAIN)
3710b57cec5SDimitry Andric return false;
3720b57cec5SDimitry Andric
3730b57cec5SDimitry Andric SDLoc DL(IntN);
374647cbc5dSDimitry Andric unsigned IntNo = IntN->getConstantOperandVal(1);
3750b57cec5SDimitry Andric SmallVector<SDValue, 7> Ops;
3760b57cec5SDimitry Andric
3770b57cec5SDimitry Andric static std::map<unsigned,unsigned> LoadNPcMap = {
3780b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadrub_pci, Hexagon::PS_loadrub_pci },
3790b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadrb_pci, Hexagon::PS_loadrb_pci },
3800b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadruh_pci, Hexagon::PS_loadruh_pci },
3810b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadrh_pci, Hexagon::PS_loadrh_pci },
3820b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadri_pci, Hexagon::PS_loadri_pci },
3830b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadrd_pci, Hexagon::PS_loadrd_pci },
3840b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadrub_pcr, Hexagon::PS_loadrub_pcr },
3850b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadrb_pcr, Hexagon::PS_loadrb_pcr },
3860b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadruh_pcr, Hexagon::PS_loadruh_pcr },
3870b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadrh_pcr, Hexagon::PS_loadrh_pcr },
3880b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadri_pcr, Hexagon::PS_loadri_pcr },
3890b57cec5SDimitry Andric { Intrinsic::hexagon_L2_loadrd_pcr, Hexagon::PS_loadrd_pcr }
3900b57cec5SDimitry Andric };
3910b57cec5SDimitry Andric auto FLI = LoadNPcMap.find (IntNo);
3920b57cec5SDimitry Andric if (FLI != LoadNPcMap.end()) {
3930b57cec5SDimitry Andric EVT ValTy = MVT::i32;
3940b57cec5SDimitry Andric if (IntNo == Intrinsic::hexagon_L2_loadrd_pci ||
3950b57cec5SDimitry Andric IntNo == Intrinsic::hexagon_L2_loadrd_pcr)
3960b57cec5SDimitry Andric ValTy = MVT::i64;
3970b57cec5SDimitry Andric EVT RTys[] = { ValTy, MVT::i32, MVT::Other };
3980b57cec5SDimitry Andric // Handle load.*_pci case which has 6 operands.
3990b57cec5SDimitry Andric if (IntN->getNumOperands() == 6) {
4000b57cec5SDimitry Andric auto Inc = cast<ConstantSDNode>(IntN->getOperand(3));
4010b57cec5SDimitry Andric SDValue I = CurDAG->getTargetConstant(Inc->getSExtValue(), DL, MVT::i32);
4020b57cec5SDimitry Andric // Operands: { Base, Increment, Modifier, Start, Chain }.
4030b57cec5SDimitry Andric Ops = { IntN->getOperand(2), I, IntN->getOperand(4), IntN->getOperand(5),
4040b57cec5SDimitry Andric IntN->getOperand(0) };
4050b57cec5SDimitry Andric } else
4060b57cec5SDimitry Andric // Handle load.*_pcr case which has 5 operands.
4070b57cec5SDimitry Andric // Operands: { Base, Modifier, Start, Chain }.
4080b57cec5SDimitry Andric Ops = { IntN->getOperand(2), IntN->getOperand(3), IntN->getOperand(4),
4090b57cec5SDimitry Andric IntN->getOperand(0) };
4100b57cec5SDimitry Andric MachineSDNode *Res = CurDAG->getMachineNode(FLI->second, DL, RTys, Ops);
4110b57cec5SDimitry Andric ReplaceUses(SDValue(IntN, 0), SDValue(Res, 0));
4120b57cec5SDimitry Andric ReplaceUses(SDValue(IntN, 1), SDValue(Res, 1));
4130b57cec5SDimitry Andric ReplaceUses(SDValue(IntN, 2), SDValue(Res, 2));
4140b57cec5SDimitry Andric CurDAG->RemoveDeadNode(IntN);
4150b57cec5SDimitry Andric return true;
4160b57cec5SDimitry Andric }
4170b57cec5SDimitry Andric
4180b57cec5SDimitry Andric static std::map<unsigned,unsigned> StoreNPcMap = {
4190b57cec5SDimitry Andric { Intrinsic::hexagon_S2_storerb_pci, Hexagon::PS_storerb_pci },
4200b57cec5SDimitry Andric { Intrinsic::hexagon_S2_storerh_pci, Hexagon::PS_storerh_pci },
4210b57cec5SDimitry Andric { Intrinsic::hexagon_S2_storerf_pci, Hexagon::PS_storerf_pci },
4220b57cec5SDimitry Andric { Intrinsic::hexagon_S2_storeri_pci, Hexagon::PS_storeri_pci },
4230b57cec5SDimitry Andric { Intrinsic::hexagon_S2_storerd_pci, Hexagon::PS_storerd_pci },
4240b57cec5SDimitry Andric { Intrinsic::hexagon_S2_storerb_pcr, Hexagon::PS_storerb_pcr },
4250b57cec5SDimitry Andric { Intrinsic::hexagon_S2_storerh_pcr, Hexagon::PS_storerh_pcr },
4260b57cec5SDimitry Andric { Intrinsic::hexagon_S2_storerf_pcr, Hexagon::PS_storerf_pcr },
4270b57cec5SDimitry Andric { Intrinsic::hexagon_S2_storeri_pcr, Hexagon::PS_storeri_pcr },
4280b57cec5SDimitry Andric { Intrinsic::hexagon_S2_storerd_pcr, Hexagon::PS_storerd_pcr }
4290b57cec5SDimitry Andric };
4300b57cec5SDimitry Andric auto FSI = StoreNPcMap.find (IntNo);
4310b57cec5SDimitry Andric if (FSI != StoreNPcMap.end()) {
4320b57cec5SDimitry Andric EVT RTys[] = { MVT::i32, MVT::Other };
4330b57cec5SDimitry Andric // Handle store.*_pci case which has 7 operands.
4340b57cec5SDimitry Andric if (IntN->getNumOperands() == 7) {
4350b57cec5SDimitry Andric auto Inc = cast<ConstantSDNode>(IntN->getOperand(3));
4360b57cec5SDimitry Andric SDValue I = CurDAG->getTargetConstant(Inc->getSExtValue(), DL, MVT::i32);
4370b57cec5SDimitry Andric // Operands: { Base, Increment, Modifier, Value, Start, Chain }.
4380b57cec5SDimitry Andric Ops = { IntN->getOperand(2), I, IntN->getOperand(4), IntN->getOperand(5),
4390b57cec5SDimitry Andric IntN->getOperand(6), IntN->getOperand(0) };
4400b57cec5SDimitry Andric } else
4410b57cec5SDimitry Andric // Handle store.*_pcr case which has 6 operands.
4420b57cec5SDimitry Andric // Operands: { Base, Modifier, Value, Start, Chain }.
4430b57cec5SDimitry Andric Ops = { IntN->getOperand(2), IntN->getOperand(3), IntN->getOperand(4),
4440b57cec5SDimitry Andric IntN->getOperand(5), IntN->getOperand(0) };
4450b57cec5SDimitry Andric MachineSDNode *Res = CurDAG->getMachineNode(FSI->second, DL, RTys, Ops);
4460b57cec5SDimitry Andric ReplaceUses(SDValue(IntN, 0), SDValue(Res, 0));
4470b57cec5SDimitry Andric ReplaceUses(SDValue(IntN, 1), SDValue(Res, 1));
4480b57cec5SDimitry Andric CurDAG->RemoveDeadNode(IntN);
4490b57cec5SDimitry Andric return true;
4500b57cec5SDimitry Andric }
4510b57cec5SDimitry Andric
4520b57cec5SDimitry Andric return false;
4530b57cec5SDimitry Andric }
4540b57cec5SDimitry Andric
SelectLoad(SDNode * N)4550b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectLoad(SDNode *N) {
4560b57cec5SDimitry Andric SDLoc dl(N);
4570b57cec5SDimitry Andric LoadSDNode *LD = cast<LoadSDNode>(N);
4580b57cec5SDimitry Andric
4590b57cec5SDimitry Andric // Handle indexed loads.
4600b57cec5SDimitry Andric ISD::MemIndexedMode AM = LD->getAddressingMode();
4610b57cec5SDimitry Andric if (AM != ISD::UNINDEXED) {
4620b57cec5SDimitry Andric SelectIndexedLoad(LD, dl);
4630b57cec5SDimitry Andric return;
4640b57cec5SDimitry Andric }
4650b57cec5SDimitry Andric
4660b57cec5SDimitry Andric // Handle patterns using circ/brev load intrinsics.
4670b57cec5SDimitry Andric if (tryLoadOfLoadIntrinsic(LD))
4680b57cec5SDimitry Andric return;
4690b57cec5SDimitry Andric
4700b57cec5SDimitry Andric SelectCode(LD);
4710b57cec5SDimitry Andric }
4720b57cec5SDimitry Andric
SelectIndexedStore(StoreSDNode * ST,const SDLoc & dl)4730b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectIndexedStore(StoreSDNode *ST, const SDLoc &dl) {
4740b57cec5SDimitry Andric SDValue Chain = ST->getChain();
4750b57cec5SDimitry Andric SDValue Base = ST->getBasePtr();
4760b57cec5SDimitry Andric SDValue Offset = ST->getOffset();
4770b57cec5SDimitry Andric SDValue Value = ST->getValue();
4780b57cec5SDimitry Andric // Get the constant value.
4790b57cec5SDimitry Andric int32_t Inc = cast<ConstantSDNode>(Offset.getNode())->getSExtValue();
4800b57cec5SDimitry Andric EVT StoredVT = ST->getMemoryVT();
4810b57cec5SDimitry Andric EVT ValueVT = Value.getValueType();
4820b57cec5SDimitry Andric
4830b57cec5SDimitry Andric bool IsValidInc = HII->isValidAutoIncImm(StoredVT, Inc);
4840b57cec5SDimitry Andric unsigned Opcode = 0;
4850b57cec5SDimitry Andric
4860b57cec5SDimitry Andric assert(StoredVT.isSimple());
4870b57cec5SDimitry Andric switch (StoredVT.getSimpleVT().SimpleTy) {
4880b57cec5SDimitry Andric case MVT::i8:
4890b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::S2_storerb_pi : Hexagon::S2_storerb_io;
4900b57cec5SDimitry Andric break;
4910b57cec5SDimitry Andric case MVT::i16:
4920b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::S2_storerh_pi : Hexagon::S2_storerh_io;
4930b57cec5SDimitry Andric break;
4940b57cec5SDimitry Andric case MVT::i32:
4950b57cec5SDimitry Andric case MVT::f32:
4960b57cec5SDimitry Andric case MVT::v2i16:
4970b57cec5SDimitry Andric case MVT::v4i8:
4980b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::S2_storeri_pi : Hexagon::S2_storeri_io;
4990b57cec5SDimitry Andric break;
5000b57cec5SDimitry Andric case MVT::i64:
5010b57cec5SDimitry Andric case MVT::f64:
5020b57cec5SDimitry Andric case MVT::v2i32:
5030b57cec5SDimitry Andric case MVT::v4i16:
5040b57cec5SDimitry Andric case MVT::v8i8:
5050b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::S2_storerd_pi : Hexagon::S2_storerd_io;
5060b57cec5SDimitry Andric break;
5070b57cec5SDimitry Andric case MVT::v64i8:
5080b57cec5SDimitry Andric case MVT::v32i16:
5090b57cec5SDimitry Andric case MVT::v16i32:
5100b57cec5SDimitry Andric case MVT::v8i64:
5110b57cec5SDimitry Andric case MVT::v128i8:
5120b57cec5SDimitry Andric case MVT::v64i16:
5130b57cec5SDimitry Andric case MVT::v32i32:
5140b57cec5SDimitry Andric case MVT::v16i64:
5150b57cec5SDimitry Andric if (isAlignedMemNode(ST)) {
5160b57cec5SDimitry Andric if (ST->isNonTemporal())
5170b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::V6_vS32b_nt_pi : Hexagon::V6_vS32b_nt_ai;
5180b57cec5SDimitry Andric else
5190b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::V6_vS32b_pi : Hexagon::V6_vS32b_ai;
5200b57cec5SDimitry Andric } else {
5210b57cec5SDimitry Andric Opcode = IsValidInc ? Hexagon::V6_vS32Ub_pi : Hexagon::V6_vS32Ub_ai;
5220b57cec5SDimitry Andric }
5230b57cec5SDimitry Andric break;
5240b57cec5SDimitry Andric default:
5250b57cec5SDimitry Andric llvm_unreachable("Unexpected memory type in indexed store");
5260b57cec5SDimitry Andric }
5270b57cec5SDimitry Andric
5280b57cec5SDimitry Andric if (ST->isTruncatingStore() && ValueVT.getSizeInBits() == 64) {
5290b57cec5SDimitry Andric assert(StoredVT.getSizeInBits() < 64 && "Not a truncating store");
5300b57cec5SDimitry Andric Value = CurDAG->getTargetExtractSubreg(Hexagon::isub_lo,
5310b57cec5SDimitry Andric dl, MVT::i32, Value);
5320b57cec5SDimitry Andric }
5330b57cec5SDimitry Andric
5340b57cec5SDimitry Andric SDValue IncV = CurDAG->getTargetConstant(Inc, dl, MVT::i32);
5350b57cec5SDimitry Andric MachineMemOperand *MemOp = ST->getMemOperand();
5360b57cec5SDimitry Andric
5370b57cec5SDimitry Andric // Next address Chain
5380b57cec5SDimitry Andric SDValue From[2] = { SDValue(ST,0), SDValue(ST,1) };
5390b57cec5SDimitry Andric SDValue To[2];
5400b57cec5SDimitry Andric
5410b57cec5SDimitry Andric if (IsValidInc) {
5420b57cec5SDimitry Andric // Build post increment store.
5430b57cec5SDimitry Andric SDValue Ops[] = { Base, IncV, Value, Chain };
5440b57cec5SDimitry Andric MachineSDNode *S = CurDAG->getMachineNode(Opcode, dl, MVT::i32, MVT::Other,
5450b57cec5SDimitry Andric Ops);
5460b57cec5SDimitry Andric CurDAG->setNodeMemRefs(S, {MemOp});
5470b57cec5SDimitry Andric To[0] = SDValue(S, 0);
5480b57cec5SDimitry Andric To[1] = SDValue(S, 1);
5490b57cec5SDimitry Andric } else {
5500b57cec5SDimitry Andric SDValue Zero = CurDAG->getTargetConstant(0, dl, MVT::i32);
5510b57cec5SDimitry Andric SDValue Ops[] = { Base, Zero, Value, Chain };
5520b57cec5SDimitry Andric MachineSDNode *S = CurDAG->getMachineNode(Opcode, dl, MVT::Other, Ops);
5530b57cec5SDimitry Andric CurDAG->setNodeMemRefs(S, {MemOp});
5540b57cec5SDimitry Andric To[1] = SDValue(S, 0);
5550b57cec5SDimitry Andric MachineSDNode *A = CurDAG->getMachineNode(Hexagon::A2_addi, dl, MVT::i32,
5560b57cec5SDimitry Andric Base, IncV);
5570b57cec5SDimitry Andric To[0] = SDValue(A, 0);
5580b57cec5SDimitry Andric }
5590b57cec5SDimitry Andric
5600b57cec5SDimitry Andric ReplaceUses(From, To, 2);
5610b57cec5SDimitry Andric CurDAG->RemoveDeadNode(ST);
5620b57cec5SDimitry Andric }
5630b57cec5SDimitry Andric
SelectStore(SDNode * N)5640b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectStore(SDNode *N) {
5650b57cec5SDimitry Andric SDLoc dl(N);
5660b57cec5SDimitry Andric StoreSDNode *ST = cast<StoreSDNode>(N);
5670b57cec5SDimitry Andric
5680b57cec5SDimitry Andric // Handle indexed stores.
5690b57cec5SDimitry Andric ISD::MemIndexedMode AM = ST->getAddressingMode();
5700b57cec5SDimitry Andric if (AM != ISD::UNINDEXED) {
5710b57cec5SDimitry Andric SelectIndexedStore(ST, dl);
5720b57cec5SDimitry Andric return;
5730b57cec5SDimitry Andric }
5740b57cec5SDimitry Andric
5750b57cec5SDimitry Andric SelectCode(ST);
5760b57cec5SDimitry Andric }
5770b57cec5SDimitry Andric
SelectSHL(SDNode * N)5780b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectSHL(SDNode *N) {
5790b57cec5SDimitry Andric SDLoc dl(N);
5800b57cec5SDimitry Andric SDValue Shl_0 = N->getOperand(0);
5810b57cec5SDimitry Andric SDValue Shl_1 = N->getOperand(1);
5820b57cec5SDimitry Andric
5830b57cec5SDimitry Andric auto Default = [this,N] () -> void { SelectCode(N); };
5840b57cec5SDimitry Andric
5850b57cec5SDimitry Andric if (N->getValueType(0) != MVT::i32 || Shl_1.getOpcode() != ISD::Constant)
5860b57cec5SDimitry Andric return Default();
5870b57cec5SDimitry Andric
5880b57cec5SDimitry Andric // RHS is const.
5890b57cec5SDimitry Andric int32_t ShlConst = cast<ConstantSDNode>(Shl_1)->getSExtValue();
5900b57cec5SDimitry Andric
5910b57cec5SDimitry Andric if (Shl_0.getOpcode() == ISD::MUL) {
5920b57cec5SDimitry Andric SDValue Mul_0 = Shl_0.getOperand(0); // Val
5930b57cec5SDimitry Andric SDValue Mul_1 = Shl_0.getOperand(1); // Const
5940b57cec5SDimitry Andric // RHS of mul is const.
5950b57cec5SDimitry Andric if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Mul_1)) {
5960b57cec5SDimitry Andric int32_t ValConst = C->getSExtValue() << ShlConst;
5970b57cec5SDimitry Andric if (isInt<9>(ValConst)) {
5980b57cec5SDimitry Andric SDValue Val = CurDAG->getTargetConstant(ValConst, dl, MVT::i32);
5990b57cec5SDimitry Andric SDNode *Result = CurDAG->getMachineNode(Hexagon::M2_mpysmi, dl,
6000b57cec5SDimitry Andric MVT::i32, Mul_0, Val);
6010b57cec5SDimitry Andric ReplaceNode(N, Result);
6020b57cec5SDimitry Andric return;
6030b57cec5SDimitry Andric }
6040b57cec5SDimitry Andric }
6050b57cec5SDimitry Andric return Default();
6060b57cec5SDimitry Andric }
6070b57cec5SDimitry Andric
6080b57cec5SDimitry Andric if (Shl_0.getOpcode() == ISD::SUB) {
6090b57cec5SDimitry Andric SDValue Sub_0 = Shl_0.getOperand(0); // Const 0
6100b57cec5SDimitry Andric SDValue Sub_1 = Shl_0.getOperand(1); // Val
6110b57cec5SDimitry Andric if (ConstantSDNode *C1 = dyn_cast<ConstantSDNode>(Sub_0)) {
6120b57cec5SDimitry Andric if (C1->getSExtValue() != 0 || Sub_1.getOpcode() != ISD::SHL)
6130b57cec5SDimitry Andric return Default();
6140b57cec5SDimitry Andric SDValue Shl2_0 = Sub_1.getOperand(0); // Val
6150b57cec5SDimitry Andric SDValue Shl2_1 = Sub_1.getOperand(1); // Const
6160b57cec5SDimitry Andric if (ConstantSDNode *C2 = dyn_cast<ConstantSDNode>(Shl2_1)) {
6170b57cec5SDimitry Andric int32_t ValConst = 1 << (ShlConst + C2->getSExtValue());
6180b57cec5SDimitry Andric if (isInt<9>(-ValConst)) {
6190b57cec5SDimitry Andric SDValue Val = CurDAG->getTargetConstant(-ValConst, dl, MVT::i32);
6200b57cec5SDimitry Andric SDNode *Result = CurDAG->getMachineNode(Hexagon::M2_mpysmi, dl,
6210b57cec5SDimitry Andric MVT::i32, Shl2_0, Val);
6220b57cec5SDimitry Andric ReplaceNode(N, Result);
6230b57cec5SDimitry Andric return;
6240b57cec5SDimitry Andric }
6250b57cec5SDimitry Andric }
6260b57cec5SDimitry Andric }
6270b57cec5SDimitry Andric }
6280b57cec5SDimitry Andric
6290b57cec5SDimitry Andric return Default();
6300b57cec5SDimitry Andric }
6310b57cec5SDimitry Andric
6320b57cec5SDimitry Andric //
6330b57cec5SDimitry Andric // Handling intrinsics for circular load and bitreverse load.
6340b57cec5SDimitry Andric //
SelectIntrinsicWChain(SDNode * N)6350b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectIntrinsicWChain(SDNode *N) {
6360b57cec5SDimitry Andric if (MachineSDNode *L = LoadInstrForLoadIntrinsic(N)) {
6370b57cec5SDimitry Andric StoreInstrForLoadIntrinsic(L, N);
6380b57cec5SDimitry Andric CurDAG->RemoveDeadNode(N);
6390b57cec5SDimitry Andric return;
6400b57cec5SDimitry Andric }
6410b57cec5SDimitry Andric
6420b57cec5SDimitry Andric // Handle bit-reverse load intrinsics.
6430b57cec5SDimitry Andric if (SelectBrevLdIntrinsic(N))
6440b57cec5SDimitry Andric return;
6450b57cec5SDimitry Andric
6460b57cec5SDimitry Andric if (SelectNewCircIntrinsic(N))
6470b57cec5SDimitry Andric return;
6480b57cec5SDimitry Andric
649647cbc5dSDimitry Andric unsigned IntNo = N->getConstantOperandVal(1);
6500b57cec5SDimitry Andric if (IntNo == Intrinsic::hexagon_V6_vgathermw ||
6510b57cec5SDimitry Andric IntNo == Intrinsic::hexagon_V6_vgathermw_128B ||
6520b57cec5SDimitry Andric IntNo == Intrinsic::hexagon_V6_vgathermh ||
6530b57cec5SDimitry Andric IntNo == Intrinsic::hexagon_V6_vgathermh_128B ||
6540b57cec5SDimitry Andric IntNo == Intrinsic::hexagon_V6_vgathermhw ||
6550b57cec5SDimitry Andric IntNo == Intrinsic::hexagon_V6_vgathermhw_128B) {
6560b57cec5SDimitry Andric SelectV65Gather(N);
6570b57cec5SDimitry Andric return;
6580b57cec5SDimitry Andric }
6590b57cec5SDimitry Andric if (IntNo == Intrinsic::hexagon_V6_vgathermwq ||
6600b57cec5SDimitry Andric IntNo == Intrinsic::hexagon_V6_vgathermwq_128B ||
6610b57cec5SDimitry Andric IntNo == Intrinsic::hexagon_V6_vgathermhq ||
6620b57cec5SDimitry Andric IntNo == Intrinsic::hexagon_V6_vgathermhq_128B ||
6630b57cec5SDimitry Andric IntNo == Intrinsic::hexagon_V6_vgathermhwq ||
6640b57cec5SDimitry Andric IntNo == Intrinsic::hexagon_V6_vgathermhwq_128B) {
6650b57cec5SDimitry Andric SelectV65GatherPred(N);
6660b57cec5SDimitry Andric return;
6670b57cec5SDimitry Andric }
6680b57cec5SDimitry Andric
6690b57cec5SDimitry Andric SelectCode(N);
6700b57cec5SDimitry Andric }
6710b57cec5SDimitry Andric
SelectIntrinsicWOChain(SDNode * N)6720b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectIntrinsicWOChain(SDNode *N) {
673647cbc5dSDimitry Andric unsigned IID = N->getConstantOperandVal(0);
6740b57cec5SDimitry Andric unsigned Bits;
6750b57cec5SDimitry Andric switch (IID) {
6760b57cec5SDimitry Andric case Intrinsic::hexagon_S2_vsplatrb:
6770b57cec5SDimitry Andric Bits = 8;
6780b57cec5SDimitry Andric break;
6790b57cec5SDimitry Andric case Intrinsic::hexagon_S2_vsplatrh:
6800b57cec5SDimitry Andric Bits = 16;
6810b57cec5SDimitry Andric break;
6820b57cec5SDimitry Andric case Intrinsic::hexagon_V6_vaddcarry:
6830b57cec5SDimitry Andric case Intrinsic::hexagon_V6_vaddcarry_128B:
6840b57cec5SDimitry Andric case Intrinsic::hexagon_V6_vsubcarry:
6850b57cec5SDimitry Andric case Intrinsic::hexagon_V6_vsubcarry_128B:
6860b57cec5SDimitry Andric SelectHVXDualOutput(N);
6870b57cec5SDimitry Andric return;
6880b57cec5SDimitry Andric default:
6890b57cec5SDimitry Andric SelectCode(N);
6900b57cec5SDimitry Andric return;
6910b57cec5SDimitry Andric }
6920b57cec5SDimitry Andric
6930b57cec5SDimitry Andric SDValue V = N->getOperand(1);
6940b57cec5SDimitry Andric SDValue U;
695bdd1243dSDimitry Andric // Splat intrinsics.
6960b57cec5SDimitry Andric if (keepsLowBits(V, Bits, U)) {
6970b57cec5SDimitry Andric SDValue R = CurDAG->getNode(N->getOpcode(), SDLoc(N), N->getValueType(0),
6980b57cec5SDimitry Andric N->getOperand(0), U);
6990b57cec5SDimitry Andric ReplaceNode(N, R.getNode());
7000b57cec5SDimitry Andric SelectCode(R.getNode());
7010b57cec5SDimitry Andric return;
7020b57cec5SDimitry Andric }
7030b57cec5SDimitry Andric SelectCode(N);
7040b57cec5SDimitry Andric }
7050b57cec5SDimitry Andric
SelectExtractSubvector(SDNode * N)706bdd1243dSDimitry Andric void HexagonDAGToDAGISel::SelectExtractSubvector(SDNode *N) {
707bdd1243dSDimitry Andric SDValue Inp = N->getOperand(0);
708bdd1243dSDimitry Andric MVT ResTy = N->getValueType(0).getSimpleVT();
7097a6dacacSDimitry Andric unsigned Idx = N->getConstantOperandVal(1);
710bdd1243dSDimitry Andric
711bdd1243dSDimitry Andric [[maybe_unused]] MVT InpTy = Inp.getValueType().getSimpleVT();
712bdd1243dSDimitry Andric [[maybe_unused]] unsigned ResLen = ResTy.getVectorNumElements();
713bdd1243dSDimitry Andric assert(InpTy.getVectorElementType() == ResTy.getVectorElementType());
714bdd1243dSDimitry Andric assert(2 * ResLen == InpTy.getVectorNumElements());
715bdd1243dSDimitry Andric assert(ResTy.getSizeInBits() == 32);
716bdd1243dSDimitry Andric assert(Idx == 0 || Idx == ResLen);
717bdd1243dSDimitry Andric
718bdd1243dSDimitry Andric unsigned SubReg = Idx == 0 ? Hexagon::isub_lo : Hexagon::isub_hi;
719bdd1243dSDimitry Andric SDValue Ext = CurDAG->getTargetExtractSubreg(SubReg, SDLoc(N), ResTy, Inp);
720bdd1243dSDimitry Andric
721bdd1243dSDimitry Andric ReplaceNode(N, Ext.getNode());
722bdd1243dSDimitry Andric }
723bdd1243dSDimitry Andric
7240b57cec5SDimitry Andric //
7250b57cec5SDimitry Andric // Map floating point constant values.
7260b57cec5SDimitry Andric //
SelectConstantFP(SDNode * N)7270b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectConstantFP(SDNode *N) {
7280b57cec5SDimitry Andric SDLoc dl(N);
7298bcb0991SDimitry Andric auto *CN = cast<ConstantFPSDNode>(N);
7300b57cec5SDimitry Andric APInt A = CN->getValueAPF().bitcastToAPInt();
7310b57cec5SDimitry Andric if (N->getValueType(0) == MVT::f32) {
7320b57cec5SDimitry Andric SDValue V = CurDAG->getTargetConstant(A.getZExtValue(), dl, MVT::i32);
7330b57cec5SDimitry Andric ReplaceNode(N, CurDAG->getMachineNode(Hexagon::A2_tfrsi, dl, MVT::f32, V));
7340b57cec5SDimitry Andric return;
7350b57cec5SDimitry Andric }
7360b57cec5SDimitry Andric if (N->getValueType(0) == MVT::f64) {
7370b57cec5SDimitry Andric SDValue V = CurDAG->getTargetConstant(A.getZExtValue(), dl, MVT::i64);
7380b57cec5SDimitry Andric ReplaceNode(N, CurDAG->getMachineNode(Hexagon::CONST64, dl, MVT::f64, V));
7390b57cec5SDimitry Andric return;
7400b57cec5SDimitry Andric }
7410b57cec5SDimitry Andric
7420b57cec5SDimitry Andric SelectCode(N);
7430b57cec5SDimitry Andric }
7440b57cec5SDimitry Andric
7450b57cec5SDimitry Andric //
7460b57cec5SDimitry Andric // Map boolean values.
7470b57cec5SDimitry Andric //
SelectConstant(SDNode * N)7480b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectConstant(SDNode *N) {
7490b57cec5SDimitry Andric if (N->getValueType(0) == MVT::i1) {
7501db9f3b2SDimitry Andric assert(!(N->getAsZExtVal() >> 1));
7510b57cec5SDimitry Andric unsigned Opc = (cast<ConstantSDNode>(N)->getSExtValue() != 0)
7520b57cec5SDimitry Andric ? Hexagon::PS_true
7530b57cec5SDimitry Andric : Hexagon::PS_false;
7540b57cec5SDimitry Andric ReplaceNode(N, CurDAG->getMachineNode(Opc, SDLoc(N), MVT::i1));
7550b57cec5SDimitry Andric return;
7560b57cec5SDimitry Andric }
7570b57cec5SDimitry Andric
7580b57cec5SDimitry Andric SelectCode(N);
7590b57cec5SDimitry Andric }
7600b57cec5SDimitry Andric
SelectFrameIndex(SDNode * N)7610b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectFrameIndex(SDNode *N) {
7620b57cec5SDimitry Andric MachineFrameInfo &MFI = MF->getFrameInfo();
7630b57cec5SDimitry Andric const HexagonFrameLowering *HFI = HST->getFrameLowering();
7640b57cec5SDimitry Andric int FX = cast<FrameIndexSDNode>(N)->getIndex();
7655ffd83dbSDimitry Andric Align StkA = HFI->getStackAlign();
7665ffd83dbSDimitry Andric Align MaxA = MFI.getMaxAlign();
7670b57cec5SDimitry Andric SDValue FI = CurDAG->getTargetFrameIndex(FX, MVT::i32);
7680b57cec5SDimitry Andric SDLoc DL(N);
7690b57cec5SDimitry Andric SDValue Zero = CurDAG->getTargetConstant(0, DL, MVT::i32);
7700b57cec5SDimitry Andric SDNode *R = nullptr;
7710b57cec5SDimitry Andric
7720b57cec5SDimitry Andric // Use PS_fi when:
7730b57cec5SDimitry Andric // - the object is fixed, or
7740b57cec5SDimitry Andric // - there are no objects with higher-than-default alignment, or
7750b57cec5SDimitry Andric // - there are no dynamically allocated objects.
7760b57cec5SDimitry Andric // Otherwise, use PS_fia.
7770b57cec5SDimitry Andric if (FX < 0 || MaxA <= StkA || !MFI.hasVarSizedObjects()) {
7780b57cec5SDimitry Andric R = CurDAG->getMachineNode(Hexagon::PS_fi, DL, MVT::i32, FI, Zero);
7790b57cec5SDimitry Andric } else {
7800b57cec5SDimitry Andric auto &HMFI = *MF->getInfo<HexagonMachineFunctionInfo>();
781bdd1243dSDimitry Andric Register AR = HMFI.getStackAlignBaseReg();
7820b57cec5SDimitry Andric SDValue CH = CurDAG->getEntryNode();
7830b57cec5SDimitry Andric SDValue Ops[] = { CurDAG->getCopyFromReg(CH, DL, AR, MVT::i32), FI, Zero };
7840b57cec5SDimitry Andric R = CurDAG->getMachineNode(Hexagon::PS_fia, DL, MVT::i32, Ops);
7850b57cec5SDimitry Andric }
7860b57cec5SDimitry Andric
7870b57cec5SDimitry Andric ReplaceNode(N, R);
7880b57cec5SDimitry Andric }
7890b57cec5SDimitry Andric
SelectAddSubCarry(SDNode * N)7900b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectAddSubCarry(SDNode *N) {
7910b57cec5SDimitry Andric unsigned OpcCarry = N->getOpcode() == HexagonISD::ADDC ? Hexagon::A4_addp_c
7920b57cec5SDimitry Andric : Hexagon::A4_subp_c;
7930b57cec5SDimitry Andric SDNode *C = CurDAG->getMachineNode(OpcCarry, SDLoc(N), N->getVTList(),
7940b57cec5SDimitry Andric { N->getOperand(0), N->getOperand(1),
7950b57cec5SDimitry Andric N->getOperand(2) });
7960b57cec5SDimitry Andric ReplaceNode(N, C);
7970b57cec5SDimitry Andric }
7980b57cec5SDimitry Andric
SelectVAlign(SDNode * N)7990b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectVAlign(SDNode *N) {
8000b57cec5SDimitry Andric MVT ResTy = N->getValueType(0).getSimpleVT();
8010b57cec5SDimitry Andric if (HST->isHVXVectorType(ResTy, true))
8020b57cec5SDimitry Andric return SelectHvxVAlign(N);
8030b57cec5SDimitry Andric
8040b57cec5SDimitry Andric const SDLoc &dl(N);
8050b57cec5SDimitry Andric unsigned VecLen = ResTy.getSizeInBits();
8060b57cec5SDimitry Andric if (VecLen == 32) {
8070b57cec5SDimitry Andric SDValue Ops[] = {
8080b57cec5SDimitry Andric CurDAG->getTargetConstant(Hexagon::DoubleRegsRegClassID, dl, MVT::i32),
8090b57cec5SDimitry Andric N->getOperand(0),
8100b57cec5SDimitry Andric CurDAG->getTargetConstant(Hexagon::isub_hi, dl, MVT::i32),
8110b57cec5SDimitry Andric N->getOperand(1),
8120b57cec5SDimitry Andric CurDAG->getTargetConstant(Hexagon::isub_lo, dl, MVT::i32)
8130b57cec5SDimitry Andric };
8140b57cec5SDimitry Andric SDNode *R = CurDAG->getMachineNode(TargetOpcode::REG_SEQUENCE, dl,
8150b57cec5SDimitry Andric MVT::i64, Ops);
8160b57cec5SDimitry Andric
8170b57cec5SDimitry Andric // Shift right by "(Addr & 0x3) * 8" bytes.
8185ffd83dbSDimitry Andric SDNode *C;
8190b57cec5SDimitry Andric SDValue M0 = CurDAG->getTargetConstant(0x18, dl, MVT::i32);
8200b57cec5SDimitry Andric SDValue M1 = CurDAG->getTargetConstant(0x03, dl, MVT::i32);
8215ffd83dbSDimitry Andric if (HST->useCompound()) {
8225ffd83dbSDimitry Andric C = CurDAG->getMachineNode(Hexagon::S4_andi_asl_ri, dl, MVT::i32,
8230b57cec5SDimitry Andric M0, N->getOperand(2), M1);
8245ffd83dbSDimitry Andric } else {
8255ffd83dbSDimitry Andric SDNode *T = CurDAG->getMachineNode(Hexagon::S2_asl_i_r, dl, MVT::i32,
8265ffd83dbSDimitry Andric N->getOperand(2), M1);
8275ffd83dbSDimitry Andric C = CurDAG->getMachineNode(Hexagon::A2_andir, dl, MVT::i32,
8285ffd83dbSDimitry Andric SDValue(T, 0), M0);
8295ffd83dbSDimitry Andric }
8300b57cec5SDimitry Andric SDNode *S = CurDAG->getMachineNode(Hexagon::S2_lsr_r_p, dl, MVT::i64,
8310b57cec5SDimitry Andric SDValue(R, 0), SDValue(C, 0));
8320b57cec5SDimitry Andric SDValue E = CurDAG->getTargetExtractSubreg(Hexagon::isub_lo, dl, ResTy,
8330b57cec5SDimitry Andric SDValue(S, 0));
8340b57cec5SDimitry Andric ReplaceNode(N, E.getNode());
8350b57cec5SDimitry Andric } else {
8360b57cec5SDimitry Andric assert(VecLen == 64);
8370b57cec5SDimitry Andric SDNode *Pu = CurDAG->getMachineNode(Hexagon::C2_tfrrp, dl, MVT::v8i1,
8380b57cec5SDimitry Andric N->getOperand(2));
8390b57cec5SDimitry Andric SDNode *VA = CurDAG->getMachineNode(Hexagon::S2_valignrb, dl, ResTy,
8400b57cec5SDimitry Andric N->getOperand(0), N->getOperand(1),
8410b57cec5SDimitry Andric SDValue(Pu,0));
8420b57cec5SDimitry Andric ReplaceNode(N, VA);
8430b57cec5SDimitry Andric }
8440b57cec5SDimitry Andric }
8450b57cec5SDimitry Andric
SelectVAlignAddr(SDNode * N)8460b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectVAlignAddr(SDNode *N) {
8470b57cec5SDimitry Andric const SDLoc &dl(N);
8480b57cec5SDimitry Andric SDValue A = N->getOperand(1);
8490b57cec5SDimitry Andric int Mask = -cast<ConstantSDNode>(A.getNode())->getSExtValue();
8500b57cec5SDimitry Andric assert(isPowerOf2_32(-Mask));
8510b57cec5SDimitry Andric
8520b57cec5SDimitry Andric SDValue M = CurDAG->getTargetConstant(Mask, dl, MVT::i32);
8530b57cec5SDimitry Andric SDNode *AA = CurDAG->getMachineNode(Hexagon::A2_andir, dl, MVT::i32,
8540b57cec5SDimitry Andric N->getOperand(0), M);
8550b57cec5SDimitry Andric ReplaceNode(N, AA);
8560b57cec5SDimitry Andric }
8570b57cec5SDimitry Andric
8580b57cec5SDimitry Andric // Handle these nodes here to avoid having to write patterns for all
8590b57cec5SDimitry Andric // combinations of input/output types. In all cases, the resulting
8600b57cec5SDimitry Andric // instruction is the same.
SelectTypecast(SDNode * N)8610b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectTypecast(SDNode *N) {
8620b57cec5SDimitry Andric SDValue Op = N->getOperand(0);
8630b57cec5SDimitry Andric MVT OpTy = Op.getValueType().getSimpleVT();
8640b57cec5SDimitry Andric SDNode *T = CurDAG->MorphNodeTo(N, N->getOpcode(),
8650b57cec5SDimitry Andric CurDAG->getVTList(OpTy), {Op});
8660b57cec5SDimitry Andric ReplaceNode(T, Op.getNode());
8670b57cec5SDimitry Andric }
8680b57cec5SDimitry Andric
SelectP2D(SDNode * N)8690b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectP2D(SDNode *N) {
8700b57cec5SDimitry Andric MVT ResTy = N->getValueType(0).getSimpleVT();
8710b57cec5SDimitry Andric SDNode *T = CurDAG->getMachineNode(Hexagon::C2_mask, SDLoc(N), ResTy,
8720b57cec5SDimitry Andric N->getOperand(0));
8730b57cec5SDimitry Andric ReplaceNode(N, T);
8740b57cec5SDimitry Andric }
8750b57cec5SDimitry Andric
SelectD2P(SDNode * N)8760b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectD2P(SDNode *N) {
8770b57cec5SDimitry Andric const SDLoc &dl(N);
8780b57cec5SDimitry Andric MVT ResTy = N->getValueType(0).getSimpleVT();
8790b57cec5SDimitry Andric SDValue Zero = CurDAG->getTargetConstant(0, dl, MVT::i32);
8800b57cec5SDimitry Andric SDNode *T = CurDAG->getMachineNode(Hexagon::A4_vcmpbgtui, dl, ResTy,
8810b57cec5SDimitry Andric N->getOperand(0), Zero);
8820b57cec5SDimitry Andric ReplaceNode(N, T);
8830b57cec5SDimitry Andric }
8840b57cec5SDimitry Andric
SelectV2Q(SDNode * N)8850b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectV2Q(SDNode *N) {
8860b57cec5SDimitry Andric const SDLoc &dl(N);
8870b57cec5SDimitry Andric MVT ResTy = N->getValueType(0).getSimpleVT();
8880b57cec5SDimitry Andric // The argument to V2Q should be a single vector.
8890b57cec5SDimitry Andric MVT OpTy = N->getOperand(0).getValueType().getSimpleVT(); (void)OpTy;
8900b57cec5SDimitry Andric assert(HST->getVectorLength() * 8 == OpTy.getSizeInBits());
8910b57cec5SDimitry Andric
8920b57cec5SDimitry Andric SDValue C = CurDAG->getTargetConstant(-1, dl, MVT::i32);
8930b57cec5SDimitry Andric SDNode *R = CurDAG->getMachineNode(Hexagon::A2_tfrsi, dl, MVT::i32, C);
8940b57cec5SDimitry Andric SDNode *T = CurDAG->getMachineNode(Hexagon::V6_vandvrt, dl, ResTy,
8950b57cec5SDimitry Andric N->getOperand(0), SDValue(R,0));
8960b57cec5SDimitry Andric ReplaceNode(N, T);
8970b57cec5SDimitry Andric }
8980b57cec5SDimitry Andric
SelectQ2V(SDNode * N)8990b57cec5SDimitry Andric void HexagonDAGToDAGISel::SelectQ2V(SDNode *N) {
9000b57cec5SDimitry Andric const SDLoc &dl(N);
9010b57cec5SDimitry Andric MVT ResTy = N->getValueType(0).getSimpleVT();
9020b57cec5SDimitry Andric // The result of V2Q should be a single vector.
9030b57cec5SDimitry Andric assert(HST->getVectorLength() * 8 == ResTy.getSizeInBits());
9040b57cec5SDimitry Andric
9050b57cec5SDimitry Andric SDValue C = CurDAG->getTargetConstant(-1, dl, MVT::i32);
9060b57cec5SDimitry Andric SDNode *R = CurDAG->getMachineNode(Hexagon::A2_tfrsi, dl, MVT::i32, C);
9070b57cec5SDimitry Andric SDNode *T = CurDAG->getMachineNode(Hexagon::V6_vandqrt, dl, ResTy,
9080b57cec5SDimitry Andric N->getOperand(0), SDValue(R,0));
9090b57cec5SDimitry Andric ReplaceNode(N, T);
9100b57cec5SDimitry Andric }
9110b57cec5SDimitry Andric
FDiv(SDNode * N)912*0fca6ea1SDimitry Andric void HexagonDAGToDAGISel::FDiv(SDNode *N) {
913*0fca6ea1SDimitry Andric const SDLoc &dl(N);
914*0fca6ea1SDimitry Andric ArrayRef<EVT> ResultType(N->value_begin(), N->value_end());
915*0fca6ea1SDimitry Andric SmallVector<SDValue, 2> Ops;
916*0fca6ea1SDimitry Andric Ops = {N->getOperand(0), N->getOperand(1)};
917*0fca6ea1SDimitry Andric SDVTList VTs;
918*0fca6ea1SDimitry Andric VTs = CurDAG->getVTList(MVT::f32, MVT::f32);
919*0fca6ea1SDimitry Andric SDNode *ResScale = CurDAG->getMachineNode(Hexagon::F2_sfrecipa, dl, VTs, Ops);
920*0fca6ea1SDimitry Andric SDNode *D = CurDAG->getMachineNode(Hexagon::F2_sffixupd, dl, MVT::f32, Ops);
921*0fca6ea1SDimitry Andric
922*0fca6ea1SDimitry Andric SDValue C = CurDAG->getTargetConstant(0x3f800000, dl, MVT::i32);
923*0fca6ea1SDimitry Andric SDNode *constNode =
924*0fca6ea1SDimitry Andric CurDAG->getMachineNode(Hexagon::A2_tfrsi, dl, MVT::f32, C);
925*0fca6ea1SDimitry Andric
926*0fca6ea1SDimitry Andric SDNode *n = CurDAG->getMachineNode(Hexagon::F2_sffixupn, dl, MVT::f32, Ops);
927*0fca6ea1SDimitry Andric SDNode *Err = CurDAG->getMachineNode(Hexagon::F2_sffms_lib, dl, MVT::f32,
928*0fca6ea1SDimitry Andric SDValue(constNode, 0), SDValue(D, 0),
929*0fca6ea1SDimitry Andric SDValue(ResScale, 0));
930*0fca6ea1SDimitry Andric SDNode *NewRec = CurDAG->getMachineNode(Hexagon::F2_sffma_lib, dl, MVT::f32,
931*0fca6ea1SDimitry Andric SDValue(ResScale, 0), SDValue(Err, 0),
932*0fca6ea1SDimitry Andric SDValue(ResScale, 0));
933*0fca6ea1SDimitry Andric SDNode *newErr = CurDAG->getMachineNode(Hexagon::F2_sffms_lib, dl, MVT::f32,
934*0fca6ea1SDimitry Andric SDValue(constNode, 0), SDValue(D, 0),
935*0fca6ea1SDimitry Andric SDValue(NewRec, 0));
936*0fca6ea1SDimitry Andric SDNode *q = CurDAG->getMachineNode(
937*0fca6ea1SDimitry Andric Hexagon::A2_andir, dl, MVT::f32, SDValue(n, 0),
938*0fca6ea1SDimitry Andric CurDAG->getTargetConstant(0x80000000, dl, MVT::i32));
939*0fca6ea1SDimitry Andric SDNode *NewQ =
940*0fca6ea1SDimitry Andric CurDAG->getMachineNode(Hexagon::F2_sffma_lib, dl, MVT::f32, SDValue(q, 0),
941*0fca6ea1SDimitry Andric SDValue(n, 0), SDValue(NewRec, 0));
942*0fca6ea1SDimitry Andric SDNode *NNewRec = CurDAG->getMachineNode(
943*0fca6ea1SDimitry Andric Hexagon::F2_sffma_lib, dl, MVT::f32, SDValue(NewRec, 0),
944*0fca6ea1SDimitry Andric SDValue(newErr, 0), SDValue(NewRec, 0));
945*0fca6ea1SDimitry Andric SDNode *qErr =
946*0fca6ea1SDimitry Andric CurDAG->getMachineNode(Hexagon::F2_sffms_lib, dl, MVT::f32, SDValue(n, 0),
947*0fca6ea1SDimitry Andric SDValue(D, 0), SDValue(NewQ, 0));
948*0fca6ea1SDimitry Andric SDNode *NNewQ = CurDAG->getMachineNode(Hexagon::F2_sffma_lib, dl, MVT::f32,
949*0fca6ea1SDimitry Andric SDValue(NewQ, 0), SDValue(qErr, 0),
950*0fca6ea1SDimitry Andric SDValue(NNewRec, 0));
951*0fca6ea1SDimitry Andric
952*0fca6ea1SDimitry Andric SDNode *NqErr =
953*0fca6ea1SDimitry Andric CurDAG->getMachineNode(Hexagon::F2_sffms_lib, dl, MVT::f32, SDValue(n, 0),
954*0fca6ea1SDimitry Andric SDValue(NNewQ, 0), SDValue(D, 0));
955*0fca6ea1SDimitry Andric std::array<SDValue, 4> temp1 = {SDValue(NNewQ, 0), SDValue(NqErr, 0),
956*0fca6ea1SDimitry Andric SDValue(NNewRec, 0), SDValue(ResScale, 1)};
957*0fca6ea1SDimitry Andric ArrayRef<SDValue> OpValue1(temp1);
958*0fca6ea1SDimitry Andric SDNode *FinalNewQ =
959*0fca6ea1SDimitry Andric CurDAG->getMachineNode(Hexagon::F2_sffma_sc, dl, MVT::f32, OpValue1);
960*0fca6ea1SDimitry Andric ReplaceNode(N, FinalNewQ);
961*0fca6ea1SDimitry Andric }
962*0fca6ea1SDimitry Andric
FastFDiv(SDNode * N)963*0fca6ea1SDimitry Andric void HexagonDAGToDAGISel::FastFDiv(SDNode *N) {
964*0fca6ea1SDimitry Andric const SDLoc &dl(N);
965*0fca6ea1SDimitry Andric ArrayRef<EVT> ResultType(N->value_begin(), N->value_end());
966*0fca6ea1SDimitry Andric SmallVector<SDValue, 2> Ops;
967*0fca6ea1SDimitry Andric Ops = {N->getOperand(0), N->getOperand(1)};
968*0fca6ea1SDimitry Andric SDVTList VTs;
969*0fca6ea1SDimitry Andric VTs = CurDAG->getVTList(MVT::f32, MVT::f32);
970*0fca6ea1SDimitry Andric SDNode *ResScale = CurDAG->getMachineNode(Hexagon::F2_sfrecipa, dl, VTs, Ops);
971*0fca6ea1SDimitry Andric SDNode *D = CurDAG->getMachineNode(Hexagon::F2_sffixupd, dl, MVT::f32, Ops);
972*0fca6ea1SDimitry Andric
973*0fca6ea1SDimitry Andric SDValue C = CurDAG->getTargetConstant(0x3f800000, dl, MVT::i32);
974*0fca6ea1SDimitry Andric SDNode *constNode =
975*0fca6ea1SDimitry Andric CurDAG->getMachineNode(Hexagon::A2_tfrsi, dl, MVT::f32, C);
976*0fca6ea1SDimitry Andric
977*0fca6ea1SDimitry Andric SDNode *n = CurDAG->getMachineNode(Hexagon::F2_sffixupn, dl, MVT::f32, Ops);
978*0fca6ea1SDimitry Andric SDNode *Err = CurDAG->getMachineNode(Hexagon::F2_sffms_lib, dl, MVT::f32,
979*0fca6ea1SDimitry Andric SDValue(constNode, 0), SDValue(D, 0),
980*0fca6ea1SDimitry Andric SDValue(ResScale, 0));
981*0fca6ea1SDimitry Andric SDNode *NewRec = CurDAG->getMachineNode(Hexagon::F2_sffma_lib, dl, MVT::f32,
982*0fca6ea1SDimitry Andric SDValue(ResScale, 0), SDValue(Err, 0),
983*0fca6ea1SDimitry Andric SDValue(ResScale, 0));
984*0fca6ea1SDimitry Andric SDNode *newErr = CurDAG->getMachineNode(Hexagon::F2_sffms_lib, dl, MVT::f32,
985*0fca6ea1SDimitry Andric SDValue(constNode, 0), SDValue(D, 0),
986*0fca6ea1SDimitry Andric SDValue(NewRec, 0));
987*0fca6ea1SDimitry Andric
988*0fca6ea1SDimitry Andric SDNode *NNewRec = CurDAG->getMachineNode(
989*0fca6ea1SDimitry Andric Hexagon::F2_sffma_lib, dl, MVT::f32, SDValue(NewRec, 0),
990*0fca6ea1SDimitry Andric SDValue(newErr, 0), SDValue(NewRec, 0));
991*0fca6ea1SDimitry Andric SDNode *FinalNewQ = CurDAG->getMachineNode(
992*0fca6ea1SDimitry Andric Hexagon::F2_sfmpy, dl, MVT::f32, SDValue(NNewRec, 0), SDValue(n, 0));
993*0fca6ea1SDimitry Andric ReplaceNode(N, FinalNewQ);
994*0fca6ea1SDimitry Andric }
995*0fca6ea1SDimitry Andric
SelectFDiv(SDNode * N)996*0fca6ea1SDimitry Andric void HexagonDAGToDAGISel::SelectFDiv(SDNode *N) {
997*0fca6ea1SDimitry Andric if (N->getFlags().hasAllowReassociation())
998*0fca6ea1SDimitry Andric FastFDiv(N);
999*0fca6ea1SDimitry Andric else
1000*0fca6ea1SDimitry Andric FDiv(N);
1001*0fca6ea1SDimitry Andric return;
1002*0fca6ea1SDimitry Andric }
1003*0fca6ea1SDimitry Andric
Select(SDNode * N)10040b57cec5SDimitry Andric void HexagonDAGToDAGISel::Select(SDNode *N) {
10050b57cec5SDimitry Andric if (N->isMachineOpcode())
10060b57cec5SDimitry Andric return N->setNodeId(-1); // Already selected.
10070b57cec5SDimitry Andric
1008bdd1243dSDimitry Andric auto isHvxOp = [this](SDNode *N) {
1009bdd1243dSDimitry Andric for (unsigned i = 0, e = N->getNumValues(); i != e; ++i) {
1010bdd1243dSDimitry Andric if (HST->isHVXVectorType(N->getValueType(i), true))
1011bdd1243dSDimitry Andric return true;
1012bdd1243dSDimitry Andric }
1013bdd1243dSDimitry Andric for (SDValue I : N->ops()) {
1014bdd1243dSDimitry Andric if (HST->isHVXVectorType(I.getValueType(), true))
1015bdd1243dSDimitry Andric return true;
1016bdd1243dSDimitry Andric }
1017bdd1243dSDimitry Andric return false;
1018bdd1243dSDimitry Andric };
1019bdd1243dSDimitry Andric
1020bdd1243dSDimitry Andric if (HST->useHVXOps() && isHvxOp(N)) {
1021bdd1243dSDimitry Andric switch (N->getOpcode()) {
1022bdd1243dSDimitry Andric case ISD::EXTRACT_SUBVECTOR: return SelectHvxExtractSubvector(N);
1023bdd1243dSDimitry Andric case ISD::VECTOR_SHUFFLE: return SelectHvxShuffle(N);
1024bdd1243dSDimitry Andric
1025bdd1243dSDimitry Andric case HexagonISD::VROR: return SelectHvxRor(N);
1026bdd1243dSDimitry Andric }
1027bdd1243dSDimitry Andric }
1028bdd1243dSDimitry Andric
10290b57cec5SDimitry Andric switch (N->getOpcode()) {
10300b57cec5SDimitry Andric case ISD::Constant: return SelectConstant(N);
10310b57cec5SDimitry Andric case ISD::ConstantFP: return SelectConstantFP(N);
10320b57cec5SDimitry Andric case ISD::FrameIndex: return SelectFrameIndex(N);
10330b57cec5SDimitry Andric case ISD::SHL: return SelectSHL(N);
10340b57cec5SDimitry Andric case ISD::LOAD: return SelectLoad(N);
10350b57cec5SDimitry Andric case ISD::STORE: return SelectStore(N);
10360b57cec5SDimitry Andric case ISD::INTRINSIC_W_CHAIN: return SelectIntrinsicWChain(N);
10370b57cec5SDimitry Andric case ISD::INTRINSIC_WO_CHAIN: return SelectIntrinsicWOChain(N);
1038bdd1243dSDimitry Andric case ISD::EXTRACT_SUBVECTOR: return SelectExtractSubvector(N);
10390b57cec5SDimitry Andric
10400b57cec5SDimitry Andric case HexagonISD::ADDC:
10410b57cec5SDimitry Andric case HexagonISD::SUBC: return SelectAddSubCarry(N);
10420b57cec5SDimitry Andric case HexagonISD::VALIGN: return SelectVAlign(N);
10430b57cec5SDimitry Andric case HexagonISD::VALIGNADDR: return SelectVAlignAddr(N);
10440b57cec5SDimitry Andric case HexagonISD::TYPECAST: return SelectTypecast(N);
10450b57cec5SDimitry Andric case HexagonISD::P2D: return SelectP2D(N);
10460b57cec5SDimitry Andric case HexagonISD::D2P: return SelectD2P(N);
10470b57cec5SDimitry Andric case HexagonISD::Q2V: return SelectQ2V(N);
10480b57cec5SDimitry Andric case HexagonISD::V2Q: return SelectV2Q(N);
1049*0fca6ea1SDimitry Andric case ISD::FDIV:
1050*0fca6ea1SDimitry Andric return SelectFDiv(N);
10510b57cec5SDimitry Andric }
10520b57cec5SDimitry Andric
10530b57cec5SDimitry Andric SelectCode(N);
10540b57cec5SDimitry Andric }
10550b57cec5SDimitry Andric
SelectInlineAsmMemoryOperand(const SDValue & Op,InlineAsm::ConstraintCode ConstraintID,std::vector<SDValue> & OutOps)10565f757f3fSDimitry Andric bool HexagonDAGToDAGISel::SelectInlineAsmMemoryOperand(
10575f757f3fSDimitry Andric const SDValue &Op, InlineAsm::ConstraintCode ConstraintID,
10580b57cec5SDimitry Andric std::vector<SDValue> &OutOps) {
10590b57cec5SDimitry Andric SDValue Inp = Op, Res;
10600b57cec5SDimitry Andric
10610b57cec5SDimitry Andric switch (ConstraintID) {
10620b57cec5SDimitry Andric default:
10630b57cec5SDimitry Andric return true;
10645f757f3fSDimitry Andric case InlineAsm::ConstraintCode::o: // Offsetable.
10655f757f3fSDimitry Andric case InlineAsm::ConstraintCode::v: // Not offsetable.
10665f757f3fSDimitry Andric case InlineAsm::ConstraintCode::m: // Memory.
10670b57cec5SDimitry Andric if (SelectAddrFI(Inp, Res))
10680b57cec5SDimitry Andric OutOps.push_back(Res);
10690b57cec5SDimitry Andric else
10700b57cec5SDimitry Andric OutOps.push_back(Inp);
10710b57cec5SDimitry Andric break;
10720b57cec5SDimitry Andric }
10730b57cec5SDimitry Andric
10740b57cec5SDimitry Andric OutOps.push_back(CurDAG->getTargetConstant(0, SDLoc(Op), MVT::i32));
10750b57cec5SDimitry Andric return false;
10760b57cec5SDimitry Andric }
10770b57cec5SDimitry Andric
isMemOPCandidate(SDNode * I,SDNode * U)10780b57cec5SDimitry Andric static bool isMemOPCandidate(SDNode *I, SDNode *U) {
10790b57cec5SDimitry Andric // I is an operand of U. Check if U is an arithmetic (binary) operation
10800b57cec5SDimitry Andric // usable in a memop, where the other operand is a loaded value, and the
10810b57cec5SDimitry Andric // result of U is stored in the same location.
10820b57cec5SDimitry Andric
10830b57cec5SDimitry Andric if (!U->hasOneUse())
10840b57cec5SDimitry Andric return false;
10850b57cec5SDimitry Andric unsigned Opc = U->getOpcode();
10860b57cec5SDimitry Andric switch (Opc) {
10870b57cec5SDimitry Andric case ISD::ADD:
10880b57cec5SDimitry Andric case ISD::SUB:
10890b57cec5SDimitry Andric case ISD::AND:
10900b57cec5SDimitry Andric case ISD::OR:
10910b57cec5SDimitry Andric break;
10920b57cec5SDimitry Andric default:
10930b57cec5SDimitry Andric return false;
10940b57cec5SDimitry Andric }
10950b57cec5SDimitry Andric
10960b57cec5SDimitry Andric SDValue S0 = U->getOperand(0);
10970b57cec5SDimitry Andric SDValue S1 = U->getOperand(1);
10980b57cec5SDimitry Andric SDValue SY = (S0.getNode() == I) ? S1 : S0;
10990b57cec5SDimitry Andric
11000b57cec5SDimitry Andric SDNode *UUse = *U->use_begin();
11010b57cec5SDimitry Andric if (UUse->getNumValues() != 1)
11020b57cec5SDimitry Andric return false;
11030b57cec5SDimitry Andric
11040b57cec5SDimitry Andric // Check if one of the inputs to U is a load instruction and the output
11050b57cec5SDimitry Andric // is used by a store instruction. If so and they also have the same
11060b57cec5SDimitry Andric // base pointer, then don't preoprocess this node sequence as it
11070b57cec5SDimitry Andric // can be matched to a memop.
11080b57cec5SDimitry Andric SDNode *SYNode = SY.getNode();
11090b57cec5SDimitry Andric if (UUse->getOpcode() == ISD::STORE && SYNode->getOpcode() == ISD::LOAD) {
11100b57cec5SDimitry Andric SDValue LDBasePtr = cast<MemSDNode>(SYNode)->getBasePtr();
11110b57cec5SDimitry Andric SDValue STBasePtr = cast<MemSDNode>(UUse)->getBasePtr();
11120b57cec5SDimitry Andric if (LDBasePtr == STBasePtr)
11130b57cec5SDimitry Andric return true;
11140b57cec5SDimitry Andric }
11150b57cec5SDimitry Andric return false;
11160b57cec5SDimitry Andric }
11170b57cec5SDimitry Andric
11180b57cec5SDimitry Andric
11190b57cec5SDimitry Andric // Transform: (or (select c x 0) z) -> (select c (or x z) z)
11200b57cec5SDimitry Andric // (or (select c 0 y) z) -> (select c z (or y z))
ppSimplifyOrSelect0(std::vector<SDNode * > && Nodes)11210b57cec5SDimitry Andric void HexagonDAGToDAGISel::ppSimplifyOrSelect0(std::vector<SDNode*> &&Nodes) {
11220b57cec5SDimitry Andric SelectionDAG &DAG = *CurDAG;
11230b57cec5SDimitry Andric
1124bdd1243dSDimitry Andric for (auto *I : Nodes) {
11250b57cec5SDimitry Andric if (I->getOpcode() != ISD::OR)
11260b57cec5SDimitry Andric continue;
11270b57cec5SDimitry Andric
11285f757f3fSDimitry Andric auto IsSelect0 = [](const SDValue &Op) -> bool {
11290b57cec5SDimitry Andric if (Op.getOpcode() != ISD::SELECT)
11300b57cec5SDimitry Andric return false;
11315f757f3fSDimitry Andric return isNullConstant(Op.getOperand(1)) ||
11325f757f3fSDimitry Andric isNullConstant(Op.getOperand(2));
11330b57cec5SDimitry Andric };
11340b57cec5SDimitry Andric
11350b57cec5SDimitry Andric SDValue N0 = I->getOperand(0), N1 = I->getOperand(1);
11360b57cec5SDimitry Andric EVT VT = I->getValueType(0);
11370b57cec5SDimitry Andric bool SelN0 = IsSelect0(N0);
11380b57cec5SDimitry Andric SDValue SOp = SelN0 ? N0 : N1;
11390b57cec5SDimitry Andric SDValue VOp = SelN0 ? N1 : N0;
11400b57cec5SDimitry Andric
11410b57cec5SDimitry Andric if (SOp.getOpcode() == ISD::SELECT && SOp.getNode()->hasOneUse()) {
11420b57cec5SDimitry Andric SDValue SC = SOp.getOperand(0);
11430b57cec5SDimitry Andric SDValue SX = SOp.getOperand(1);
11440b57cec5SDimitry Andric SDValue SY = SOp.getOperand(2);
11450b57cec5SDimitry Andric SDLoc DLS = SOp;
11465f757f3fSDimitry Andric if (isNullConstant(SY)) {
11470b57cec5SDimitry Andric SDValue NewOr = DAG.getNode(ISD::OR, DLS, VT, SX, VOp);
11480b57cec5SDimitry Andric SDValue NewSel = DAG.getNode(ISD::SELECT, DLS, VT, SC, NewOr, VOp);
11490b57cec5SDimitry Andric DAG.ReplaceAllUsesWith(I, NewSel.getNode());
11505f757f3fSDimitry Andric } else if (isNullConstant(SX)) {
11510b57cec5SDimitry Andric SDValue NewOr = DAG.getNode(ISD::OR, DLS, VT, SY, VOp);
11520b57cec5SDimitry Andric SDValue NewSel = DAG.getNode(ISD::SELECT, DLS, VT, SC, VOp, NewOr);
11530b57cec5SDimitry Andric DAG.ReplaceAllUsesWith(I, NewSel.getNode());
11540b57cec5SDimitry Andric }
11550b57cec5SDimitry Andric }
11560b57cec5SDimitry Andric }
11570b57cec5SDimitry Andric }
11580b57cec5SDimitry Andric
11590b57cec5SDimitry Andric // Transform: (store ch val (add x (add (shl y c) e)))
11600b57cec5SDimitry Andric // to: (store ch val (add x (shl (add y d) c))),
11610b57cec5SDimitry Andric // where e = (shl d c) for some integer d.
11620b57cec5SDimitry Andric // The purpose of this is to enable generation of loads/stores with
11630b57cec5SDimitry Andric // shifted addressing mode, i.e. mem(x+y<<#c). For that, the shift
11640b57cec5SDimitry Andric // value c must be 0, 1 or 2.
ppAddrReorderAddShl(std::vector<SDNode * > && Nodes)11650b57cec5SDimitry Andric void HexagonDAGToDAGISel::ppAddrReorderAddShl(std::vector<SDNode*> &&Nodes) {
11660b57cec5SDimitry Andric SelectionDAG &DAG = *CurDAG;
11670b57cec5SDimitry Andric
1168bdd1243dSDimitry Andric for (auto *I : Nodes) {
11690b57cec5SDimitry Andric if (I->getOpcode() != ISD::STORE)
11700b57cec5SDimitry Andric continue;
11710b57cec5SDimitry Andric
11720b57cec5SDimitry Andric // I matched: (store ch val Off)
11730b57cec5SDimitry Andric SDValue Off = I->getOperand(2);
11740b57cec5SDimitry Andric // Off needs to match: (add x (add (shl y c) (shl d c))))
11750b57cec5SDimitry Andric if (Off.getOpcode() != ISD::ADD)
11760b57cec5SDimitry Andric continue;
11770b57cec5SDimitry Andric // Off matched: (add x T0)
11780b57cec5SDimitry Andric SDValue T0 = Off.getOperand(1);
11790b57cec5SDimitry Andric // T0 needs to match: (add T1 T2):
11800b57cec5SDimitry Andric if (T0.getOpcode() != ISD::ADD)
11810b57cec5SDimitry Andric continue;
11820b57cec5SDimitry Andric // T0 matched: (add T1 T2)
11830b57cec5SDimitry Andric SDValue T1 = T0.getOperand(0);
11840b57cec5SDimitry Andric SDValue T2 = T0.getOperand(1);
11850b57cec5SDimitry Andric // T1 needs to match: (shl y c)
11860b57cec5SDimitry Andric if (T1.getOpcode() != ISD::SHL)
11870b57cec5SDimitry Andric continue;
11880b57cec5SDimitry Andric SDValue C = T1.getOperand(1);
11890b57cec5SDimitry Andric ConstantSDNode *CN = dyn_cast<ConstantSDNode>(C.getNode());
11900b57cec5SDimitry Andric if (CN == nullptr)
11910b57cec5SDimitry Andric continue;
11920b57cec5SDimitry Andric unsigned CV = CN->getZExtValue();
11930b57cec5SDimitry Andric if (CV > 2)
11940b57cec5SDimitry Andric continue;
11950b57cec5SDimitry Andric // T2 needs to match e, where e = (shl d c) for some d.
11960b57cec5SDimitry Andric ConstantSDNode *EN = dyn_cast<ConstantSDNode>(T2.getNode());
11970b57cec5SDimitry Andric if (EN == nullptr)
11980b57cec5SDimitry Andric continue;
11990b57cec5SDimitry Andric unsigned EV = EN->getZExtValue();
12000b57cec5SDimitry Andric if (EV % (1 << CV) != 0)
12010b57cec5SDimitry Andric continue;
12020b57cec5SDimitry Andric unsigned DV = EV / (1 << CV);
12030b57cec5SDimitry Andric
12040b57cec5SDimitry Andric // Replace T0 with: (shl (add y d) c)
12050b57cec5SDimitry Andric SDLoc DL = SDLoc(I);
12060b57cec5SDimitry Andric EVT VT = T0.getValueType();
12070b57cec5SDimitry Andric SDValue D = DAG.getConstant(DV, DL, VT);
12080b57cec5SDimitry Andric // NewAdd = (add y d)
12090b57cec5SDimitry Andric SDValue NewAdd = DAG.getNode(ISD::ADD, DL, VT, T1.getOperand(0), D);
12100b57cec5SDimitry Andric // NewShl = (shl NewAdd c)
12110b57cec5SDimitry Andric SDValue NewShl = DAG.getNode(ISD::SHL, DL, VT, NewAdd, C);
12120b57cec5SDimitry Andric ReplaceNode(T0.getNode(), NewShl.getNode());
12130b57cec5SDimitry Andric }
12140b57cec5SDimitry Andric }
12150b57cec5SDimitry Andric
12160b57cec5SDimitry Andric // Transform: (load ch (add x (and (srl y c) Mask)))
12170b57cec5SDimitry Andric // to: (load ch (add x (shl (srl y d) d-c)))
12180b57cec5SDimitry Andric // where
12190b57cec5SDimitry Andric // Mask = 00..0 111..1 0.0
12200b57cec5SDimitry Andric // | | +-- d-c 0s, and d-c is 0, 1 or 2.
12210b57cec5SDimitry Andric // | +-------- 1s
12220b57cec5SDimitry Andric // +-------------- at most c 0s
12230b57cec5SDimitry Andric // Motivating example:
12240b57cec5SDimitry Andric // DAG combiner optimizes (add x (shl (srl y 5) 2))
12250b57cec5SDimitry Andric // to (add x (and (srl y 3) 1FFFFFFC))
12260b57cec5SDimitry Andric // which results in a constant-extended and(##...,lsr). This transformation
12270b57cec5SDimitry Andric // undoes this simplification for cases where the shl can be folded into
12280b57cec5SDimitry Andric // an addressing mode.
ppAddrRewriteAndSrl(std::vector<SDNode * > && Nodes)12290b57cec5SDimitry Andric void HexagonDAGToDAGISel::ppAddrRewriteAndSrl(std::vector<SDNode*> &&Nodes) {
12300b57cec5SDimitry Andric SelectionDAG &DAG = *CurDAG;
12310b57cec5SDimitry Andric
12320b57cec5SDimitry Andric for (SDNode *N : Nodes) {
12330b57cec5SDimitry Andric unsigned Opc = N->getOpcode();
12340b57cec5SDimitry Andric if (Opc != ISD::LOAD && Opc != ISD::STORE)
12350b57cec5SDimitry Andric continue;
12360b57cec5SDimitry Andric SDValue Addr = Opc == ISD::LOAD ? N->getOperand(1) : N->getOperand(2);
12370b57cec5SDimitry Andric // Addr must match: (add x T0)
12380b57cec5SDimitry Andric if (Addr.getOpcode() != ISD::ADD)
12390b57cec5SDimitry Andric continue;
12400b57cec5SDimitry Andric SDValue T0 = Addr.getOperand(1);
12410b57cec5SDimitry Andric // T0 must match: (and T1 Mask)
12420b57cec5SDimitry Andric if (T0.getOpcode() != ISD::AND)
12430b57cec5SDimitry Andric continue;
12440b57cec5SDimitry Andric
12450b57cec5SDimitry Andric // We have an AND.
12460b57cec5SDimitry Andric //
12470b57cec5SDimitry Andric // Check the first operand. It must be: (srl y c).
12480b57cec5SDimitry Andric SDValue S = T0.getOperand(0);
12490b57cec5SDimitry Andric if (S.getOpcode() != ISD::SRL)
12500b57cec5SDimitry Andric continue;
12510b57cec5SDimitry Andric ConstantSDNode *SN = dyn_cast<ConstantSDNode>(S.getOperand(1).getNode());
12520b57cec5SDimitry Andric if (SN == nullptr)
12530b57cec5SDimitry Andric continue;
12540b57cec5SDimitry Andric if (SN->getAPIntValue().getBitWidth() != 32)
12550b57cec5SDimitry Andric continue;
12560b57cec5SDimitry Andric uint32_t CV = SN->getZExtValue();
12570b57cec5SDimitry Andric
12580b57cec5SDimitry Andric // Check the second operand: the supposed mask.
12590b57cec5SDimitry Andric ConstantSDNode *MN = dyn_cast<ConstantSDNode>(T0.getOperand(1).getNode());
12600b57cec5SDimitry Andric if (MN == nullptr)
12610b57cec5SDimitry Andric continue;
12620b57cec5SDimitry Andric if (MN->getAPIntValue().getBitWidth() != 32)
12630b57cec5SDimitry Andric continue;
12640b57cec5SDimitry Andric uint32_t Mask = MN->getZExtValue();
12650b57cec5SDimitry Andric // Examine the mask.
126606c3fb27SDimitry Andric uint32_t TZ = llvm::countr_zero(Mask);
126706c3fb27SDimitry Andric uint32_t M1 = llvm::countr_one(Mask >> TZ);
126806c3fb27SDimitry Andric uint32_t LZ = llvm::countl_zero(Mask);
12690b57cec5SDimitry Andric // Trailing zeros + middle ones + leading zeros must equal the width.
12700b57cec5SDimitry Andric if (TZ + M1 + LZ != 32)
12710b57cec5SDimitry Andric continue;
12720b57cec5SDimitry Andric // The number of trailing zeros will be encoded in the addressing mode.
12730b57cec5SDimitry Andric if (TZ > 2)
12740b57cec5SDimitry Andric continue;
12750b57cec5SDimitry Andric // The number of leading zeros must be at most c.
12760b57cec5SDimitry Andric if (LZ > CV)
12770b57cec5SDimitry Andric continue;
12780b57cec5SDimitry Andric
12790b57cec5SDimitry Andric // All looks good.
12800b57cec5SDimitry Andric SDValue Y = S.getOperand(0);
12810b57cec5SDimitry Andric EVT VT = Addr.getValueType();
12820b57cec5SDimitry Andric SDLoc dl(S);
12830b57cec5SDimitry Andric // TZ = D-C, so D = TZ+C.
12840b57cec5SDimitry Andric SDValue D = DAG.getConstant(TZ+CV, dl, VT);
12850b57cec5SDimitry Andric SDValue DC = DAG.getConstant(TZ, dl, VT);
12860b57cec5SDimitry Andric SDValue NewSrl = DAG.getNode(ISD::SRL, dl, VT, Y, D);
12870b57cec5SDimitry Andric SDValue NewShl = DAG.getNode(ISD::SHL, dl, VT, NewSrl, DC);
12880b57cec5SDimitry Andric ReplaceNode(T0.getNode(), NewShl.getNode());
12890b57cec5SDimitry Andric }
12900b57cec5SDimitry Andric }
12910b57cec5SDimitry Andric
12920b57cec5SDimitry Andric // Transform: (op ... (zext i1 c) ...) -> (select c (op ... 0 ...)
12930b57cec5SDimitry Andric // (op ... 1 ...))
ppHoistZextI1(std::vector<SDNode * > && Nodes)12940b57cec5SDimitry Andric void HexagonDAGToDAGISel::ppHoistZextI1(std::vector<SDNode*> &&Nodes) {
12950b57cec5SDimitry Andric SelectionDAG &DAG = *CurDAG;
12960b57cec5SDimitry Andric
12970b57cec5SDimitry Andric for (SDNode *N : Nodes) {
12980b57cec5SDimitry Andric unsigned Opc = N->getOpcode();
12990b57cec5SDimitry Andric if (Opc != ISD::ZERO_EXTEND)
13000b57cec5SDimitry Andric continue;
13010b57cec5SDimitry Andric SDValue OpI1 = N->getOperand(0);
13020b57cec5SDimitry Andric EVT OpVT = OpI1.getValueType();
13030b57cec5SDimitry Andric if (!OpVT.isSimple() || OpVT.getSimpleVT() != MVT::i1)
13040b57cec5SDimitry Andric continue;
13050b57cec5SDimitry Andric for (auto I = N->use_begin(), E = N->use_end(); I != E; ++I) {
13060b57cec5SDimitry Andric SDNode *U = *I;
13070b57cec5SDimitry Andric if (U->getNumValues() != 1)
13080b57cec5SDimitry Andric continue;
13090b57cec5SDimitry Andric EVT UVT = U->getValueType(0);
13100b57cec5SDimitry Andric if (!UVT.isSimple() || !UVT.isInteger() || UVT.getSimpleVT() == MVT::i1)
13110b57cec5SDimitry Andric continue;
131204eeddc0SDimitry Andric // Do not generate select for all i1 vector type.
131304eeddc0SDimitry Andric if (UVT.isVector() && UVT.getVectorElementType() == MVT::i1)
131404eeddc0SDimitry Andric continue;
13150b57cec5SDimitry Andric if (isMemOPCandidate(N, U))
13160b57cec5SDimitry Andric continue;
13170b57cec5SDimitry Andric
13180b57cec5SDimitry Andric // Potentially simplifiable operation.
13190b57cec5SDimitry Andric unsigned I1N = I.getOperandNo();
13200b57cec5SDimitry Andric SmallVector<SDValue,2> Ops(U->getNumOperands());
13210b57cec5SDimitry Andric for (unsigned i = 0, n = U->getNumOperands(); i != n; ++i)
13220b57cec5SDimitry Andric Ops[i] = U->getOperand(i);
13230b57cec5SDimitry Andric EVT BVT = Ops[I1N].getValueType();
13240b57cec5SDimitry Andric
13255ffd83dbSDimitry Andric const SDLoc &dl(U);
13260b57cec5SDimitry Andric SDValue C0 = DAG.getConstant(0, dl, BVT);
13270b57cec5SDimitry Andric SDValue C1 = DAG.getConstant(1, dl, BVT);
13280b57cec5SDimitry Andric SDValue If0, If1;
13290b57cec5SDimitry Andric
13300b57cec5SDimitry Andric if (isa<MachineSDNode>(U)) {
13310b57cec5SDimitry Andric unsigned UseOpc = U->getMachineOpcode();
13320b57cec5SDimitry Andric Ops[I1N] = C0;
13330b57cec5SDimitry Andric If0 = SDValue(DAG.getMachineNode(UseOpc, dl, UVT, Ops), 0);
13340b57cec5SDimitry Andric Ops[I1N] = C1;
13350b57cec5SDimitry Andric If1 = SDValue(DAG.getMachineNode(UseOpc, dl, UVT, Ops), 0);
13360b57cec5SDimitry Andric } else {
13370b57cec5SDimitry Andric unsigned UseOpc = U->getOpcode();
13380b57cec5SDimitry Andric Ops[I1N] = C0;
13390b57cec5SDimitry Andric If0 = DAG.getNode(UseOpc, dl, UVT, Ops);
13400b57cec5SDimitry Andric Ops[I1N] = C1;
13410b57cec5SDimitry Andric If1 = DAG.getNode(UseOpc, dl, UVT, Ops);
13420b57cec5SDimitry Andric }
13435ffd83dbSDimitry Andric // We're generating a SELECT way after legalization, so keep the types
13445ffd83dbSDimitry Andric // simple.
13455ffd83dbSDimitry Andric unsigned UW = UVT.getSizeInBits();
13465ffd83dbSDimitry Andric EVT SVT = (UW == 32 || UW == 64) ? MVT::getIntegerVT(UW) : UVT;
13475ffd83dbSDimitry Andric SDValue Sel = DAG.getNode(ISD::SELECT, dl, SVT, OpI1,
13485ffd83dbSDimitry Andric DAG.getBitcast(SVT, If1),
13495ffd83dbSDimitry Andric DAG.getBitcast(SVT, If0));
13505ffd83dbSDimitry Andric SDValue Ret = DAG.getBitcast(UVT, Sel);
13515ffd83dbSDimitry Andric DAG.ReplaceAllUsesWith(U, Ret.getNode());
13520b57cec5SDimitry Andric }
13530b57cec5SDimitry Andric }
13540b57cec5SDimitry Andric }
13550b57cec5SDimitry Andric
PreprocessISelDAG()13560b57cec5SDimitry Andric void HexagonDAGToDAGISel::PreprocessISelDAG() {
13570b57cec5SDimitry Andric // Repack all nodes before calling each preprocessing function,
13580b57cec5SDimitry Andric // because each of them can modify the set of nodes.
13590b57cec5SDimitry Andric auto getNodes = [this]() -> std::vector<SDNode *> {
13600b57cec5SDimitry Andric std::vector<SDNode *> T;
13610b57cec5SDimitry Andric T.reserve(CurDAG->allnodes_size());
13620b57cec5SDimitry Andric for (SDNode &N : CurDAG->allnodes())
13630b57cec5SDimitry Andric T.push_back(&N);
13640b57cec5SDimitry Andric return T;
13650b57cec5SDimitry Andric };
13660b57cec5SDimitry Andric
1367bdd1243dSDimitry Andric if (HST->useHVXOps())
1368bdd1243dSDimitry Andric PreprocessHvxISelDAG();
1369bdd1243dSDimitry Andric
13700b57cec5SDimitry Andric // Transform: (or (select c x 0) z) -> (select c (or x z) z)
13710b57cec5SDimitry Andric // (or (select c 0 y) z) -> (select c z (or y z))
13720b57cec5SDimitry Andric ppSimplifyOrSelect0(getNodes());
13730b57cec5SDimitry Andric
13740b57cec5SDimitry Andric // Transform: (store ch val (add x (add (shl y c) e)))
13750b57cec5SDimitry Andric // to: (store ch val (add x (shl (add y d) c))),
13760b57cec5SDimitry Andric // where e = (shl d c) for some integer d.
13770b57cec5SDimitry Andric // The purpose of this is to enable generation of loads/stores with
13780b57cec5SDimitry Andric // shifted addressing mode, i.e. mem(x+y<<#c). For that, the shift
13790b57cec5SDimitry Andric // value c must be 0, 1 or 2.
13800b57cec5SDimitry Andric ppAddrReorderAddShl(getNodes());
13810b57cec5SDimitry Andric
13820b57cec5SDimitry Andric // Transform: (load ch (add x (and (srl y c) Mask)))
13830b57cec5SDimitry Andric // to: (load ch (add x (shl (srl y d) d-c)))
13840b57cec5SDimitry Andric // where
13850b57cec5SDimitry Andric // Mask = 00..0 111..1 0.0
13860b57cec5SDimitry Andric // | | +-- d-c 0s, and d-c is 0, 1 or 2.
13870b57cec5SDimitry Andric // | +-------- 1s
13880b57cec5SDimitry Andric // +-------------- at most c 0s
13890b57cec5SDimitry Andric // Motivating example:
13900b57cec5SDimitry Andric // DAG combiner optimizes (add x (shl (srl y 5) 2))
13910b57cec5SDimitry Andric // to (add x (and (srl y 3) 1FFFFFFC))
13920b57cec5SDimitry Andric // which results in a constant-extended and(##...,lsr). This transformation
13930b57cec5SDimitry Andric // undoes this simplification for cases where the shl can be folded into
13940b57cec5SDimitry Andric // an addressing mode.
13950b57cec5SDimitry Andric ppAddrRewriteAndSrl(getNodes());
13960b57cec5SDimitry Andric
13970b57cec5SDimitry Andric // Transform: (op ... (zext i1 c) ...) -> (select c (op ... 0 ...)
13980b57cec5SDimitry Andric // (op ... 1 ...))
13990b57cec5SDimitry Andric ppHoistZextI1(getNodes());
14000b57cec5SDimitry Andric
14010b57cec5SDimitry Andric DEBUG_WITH_TYPE("isel", {
14020b57cec5SDimitry Andric dbgs() << "Preprocessed (Hexagon) selection DAG:";
14030b57cec5SDimitry Andric CurDAG->dump();
14040b57cec5SDimitry Andric });
14050b57cec5SDimitry Andric
14060b57cec5SDimitry Andric if (EnableAddressRebalancing) {
14070b57cec5SDimitry Andric rebalanceAddressTrees();
14080b57cec5SDimitry Andric
14090b57cec5SDimitry Andric DEBUG_WITH_TYPE("isel", {
14100b57cec5SDimitry Andric dbgs() << "Address tree balanced selection DAG:";
14110b57cec5SDimitry Andric CurDAG->dump();
14120b57cec5SDimitry Andric });
14130b57cec5SDimitry Andric }
14140b57cec5SDimitry Andric }
14150b57cec5SDimitry Andric
emitFunctionEntryCode()14165ffd83dbSDimitry Andric void HexagonDAGToDAGISel::emitFunctionEntryCode() {
1417480093f4SDimitry Andric auto &HST = MF->getSubtarget<HexagonSubtarget>();
14180b57cec5SDimitry Andric auto &HFI = *HST.getFrameLowering();
14190b57cec5SDimitry Andric if (!HFI.needsAligna(*MF))
14200b57cec5SDimitry Andric return;
14210b57cec5SDimitry Andric
14220b57cec5SDimitry Andric MachineFrameInfo &MFI = MF->getFrameInfo();
14230b57cec5SDimitry Andric MachineBasicBlock *EntryBB = &MF->front();
14245ffd83dbSDimitry Andric Align EntryMaxA = MFI.getMaxAlign();
1425bdd1243dSDimitry Andric
1426bdd1243dSDimitry Andric // Reserve the first non-volatile register.
1427bdd1243dSDimitry Andric Register AP = 0;
1428bdd1243dSDimitry Andric auto &HRI = *HST.getRegisterInfo();
1429bdd1243dSDimitry Andric BitVector Reserved = HRI.getReservedRegs(*MF);
1430bdd1243dSDimitry Andric for (const MCPhysReg *R = HRI.getCalleeSavedRegs(MF); *R; ++R) {
1431bdd1243dSDimitry Andric if (Reserved[*R])
1432bdd1243dSDimitry Andric continue;
1433bdd1243dSDimitry Andric AP = *R;
1434bdd1243dSDimitry Andric break;
1435bdd1243dSDimitry Andric }
1436bdd1243dSDimitry Andric assert(AP.isValid() && "Couldn't reserve stack align register");
1437bdd1243dSDimitry Andric BuildMI(EntryBB, DebugLoc(), HII->get(Hexagon::PS_aligna), AP)
14385ffd83dbSDimitry Andric .addImm(EntryMaxA.value());
1439bdd1243dSDimitry Andric MF->getInfo<HexagonMachineFunctionInfo>()->setStackAlignBaseReg(AP);
14400b57cec5SDimitry Andric }
14410b57cec5SDimitry Andric
updateAligna()1442480093f4SDimitry Andric void HexagonDAGToDAGISel::updateAligna() {
1443480093f4SDimitry Andric auto &HFI = *MF->getSubtarget<HexagonSubtarget>().getFrameLowering();
1444480093f4SDimitry Andric if (!HFI.needsAligna(*MF))
1445480093f4SDimitry Andric return;
1446480093f4SDimitry Andric auto *AlignaI = const_cast<MachineInstr*>(HFI.getAlignaInstr(*MF));
1447480093f4SDimitry Andric assert(AlignaI != nullptr);
14485ffd83dbSDimitry Andric unsigned MaxA = MF->getFrameInfo().getMaxAlign().value();
1449480093f4SDimitry Andric if (AlignaI->getOperand(1).getImm() < MaxA)
1450480093f4SDimitry Andric AlignaI->getOperand(1).setImm(MaxA);
1451480093f4SDimitry Andric }
1452480093f4SDimitry Andric
14530b57cec5SDimitry Andric // Match a frame index that can be used in an addressing mode.
SelectAddrFI(SDValue & N,SDValue & R)14540b57cec5SDimitry Andric bool HexagonDAGToDAGISel::SelectAddrFI(SDValue &N, SDValue &R) {
14550b57cec5SDimitry Andric if (N.getOpcode() != ISD::FrameIndex)
14560b57cec5SDimitry Andric return false;
14570b57cec5SDimitry Andric auto &HFI = *HST->getFrameLowering();
14580b57cec5SDimitry Andric MachineFrameInfo &MFI = MF->getFrameInfo();
14590b57cec5SDimitry Andric int FX = cast<FrameIndexSDNode>(N)->getIndex();
14600b57cec5SDimitry Andric if (!MFI.isFixedObjectIndex(FX) && HFI.needsAligna(*MF))
14610b57cec5SDimitry Andric return false;
14620b57cec5SDimitry Andric R = CurDAG->getTargetFrameIndex(FX, MVT::i32);
14630b57cec5SDimitry Andric return true;
14640b57cec5SDimitry Andric }
14650b57cec5SDimitry Andric
SelectAddrGA(SDValue & N,SDValue & R)14660b57cec5SDimitry Andric inline bool HexagonDAGToDAGISel::SelectAddrGA(SDValue &N, SDValue &R) {
14675ffd83dbSDimitry Andric return SelectGlobalAddress(N, R, false, Align(1));
14680b57cec5SDimitry Andric }
14690b57cec5SDimitry Andric
SelectAddrGP(SDValue & N,SDValue & R)14700b57cec5SDimitry Andric inline bool HexagonDAGToDAGISel::SelectAddrGP(SDValue &N, SDValue &R) {
14715ffd83dbSDimitry Andric return SelectGlobalAddress(N, R, true, Align(1));
14720b57cec5SDimitry Andric }
14730b57cec5SDimitry Andric
SelectAnyImm(SDValue & N,SDValue & R)14740b57cec5SDimitry Andric inline bool HexagonDAGToDAGISel::SelectAnyImm(SDValue &N, SDValue &R) {
14755ffd83dbSDimitry Andric return SelectAnyImmediate(N, R, Align(1));
14760b57cec5SDimitry Andric }
14770b57cec5SDimitry Andric
SelectAnyImm0(SDValue & N,SDValue & R)14780b57cec5SDimitry Andric inline bool HexagonDAGToDAGISel::SelectAnyImm0(SDValue &N, SDValue &R) {
14795ffd83dbSDimitry Andric return SelectAnyImmediate(N, R, Align(1));
14800b57cec5SDimitry Andric }
SelectAnyImm1(SDValue & N,SDValue & R)14810b57cec5SDimitry Andric inline bool HexagonDAGToDAGISel::SelectAnyImm1(SDValue &N, SDValue &R) {
14825ffd83dbSDimitry Andric return SelectAnyImmediate(N, R, Align(2));
14830b57cec5SDimitry Andric }
SelectAnyImm2(SDValue & N,SDValue & R)14840b57cec5SDimitry Andric inline bool HexagonDAGToDAGISel::SelectAnyImm2(SDValue &N, SDValue &R) {
14855ffd83dbSDimitry Andric return SelectAnyImmediate(N, R, Align(4));
14860b57cec5SDimitry Andric }
SelectAnyImm3(SDValue & N,SDValue & R)14870b57cec5SDimitry Andric inline bool HexagonDAGToDAGISel::SelectAnyImm3(SDValue &N, SDValue &R) {
14885ffd83dbSDimitry Andric return SelectAnyImmediate(N, R, Align(8));
14890b57cec5SDimitry Andric }
14900b57cec5SDimitry Andric
SelectAnyInt(SDValue & N,SDValue & R)14910b57cec5SDimitry Andric inline bool HexagonDAGToDAGISel::SelectAnyInt(SDValue &N, SDValue &R) {
14920b57cec5SDimitry Andric EVT T = N.getValueType();
14930b57cec5SDimitry Andric if (!T.isInteger() || T.getSizeInBits() != 32 || !isa<ConstantSDNode>(N))
14940b57cec5SDimitry Andric return false;
149581ad6265SDimitry Andric int32_t V = cast<const ConstantSDNode>(N)->getZExtValue();
149681ad6265SDimitry Andric R = CurDAG->getTargetConstant(V, SDLoc(N), N.getValueType());
14970b57cec5SDimitry Andric return true;
14980b57cec5SDimitry Andric }
14990b57cec5SDimitry Andric
SelectAnyImmediate(SDValue & N,SDValue & R,Align Alignment)15000b57cec5SDimitry Andric bool HexagonDAGToDAGISel::SelectAnyImmediate(SDValue &N, SDValue &R,
15015ffd83dbSDimitry Andric Align Alignment) {
15020b57cec5SDimitry Andric switch (N.getOpcode()) {
15030b57cec5SDimitry Andric case ISD::Constant: {
15040b57cec5SDimitry Andric if (N.getValueType() != MVT::i32)
15050b57cec5SDimitry Andric return false;
15060b57cec5SDimitry Andric int32_t V = cast<const ConstantSDNode>(N)->getZExtValue();
15075ffd83dbSDimitry Andric if (!isAligned(Alignment, V))
15080b57cec5SDimitry Andric return false;
15090b57cec5SDimitry Andric R = CurDAG->getTargetConstant(V, SDLoc(N), N.getValueType());
15100b57cec5SDimitry Andric return true;
15110b57cec5SDimitry Andric }
15120b57cec5SDimitry Andric case HexagonISD::JT:
15130b57cec5SDimitry Andric case HexagonISD::CP:
15140b57cec5SDimitry Andric // These are assumed to always be aligned at least 8-byte boundary.
15155ffd83dbSDimitry Andric if (Alignment > Align(8))
15160b57cec5SDimitry Andric return false;
15170b57cec5SDimitry Andric R = N.getOperand(0);
15180b57cec5SDimitry Andric return true;
15190b57cec5SDimitry Andric case ISD::ExternalSymbol:
15200b57cec5SDimitry Andric // Symbols may be aligned at any boundary.
15215ffd83dbSDimitry Andric if (Alignment > Align(1))
15220b57cec5SDimitry Andric return false;
15230b57cec5SDimitry Andric R = N;
15240b57cec5SDimitry Andric return true;
15250b57cec5SDimitry Andric case ISD::BlockAddress:
15260b57cec5SDimitry Andric // Block address is always aligned at least 4-byte boundary.
15275ffd83dbSDimitry Andric if (Alignment > Align(4) ||
15285ffd83dbSDimitry Andric !isAligned(Alignment, cast<BlockAddressSDNode>(N)->getOffset()))
15290b57cec5SDimitry Andric return false;
15300b57cec5SDimitry Andric R = N;
15310b57cec5SDimitry Andric return true;
15320b57cec5SDimitry Andric }
15330b57cec5SDimitry Andric
15345ffd83dbSDimitry Andric if (SelectGlobalAddress(N, R, false, Alignment) ||
15355ffd83dbSDimitry Andric SelectGlobalAddress(N, R, true, Alignment))
15360b57cec5SDimitry Andric return true;
15370b57cec5SDimitry Andric
15380b57cec5SDimitry Andric return false;
15390b57cec5SDimitry Andric }
15400b57cec5SDimitry Andric
SelectGlobalAddress(SDValue & N,SDValue & R,bool UseGP,Align Alignment)15410b57cec5SDimitry Andric bool HexagonDAGToDAGISel::SelectGlobalAddress(SDValue &N, SDValue &R,
15425ffd83dbSDimitry Andric bool UseGP, Align Alignment) {
15430b57cec5SDimitry Andric switch (N.getOpcode()) {
15440b57cec5SDimitry Andric case ISD::ADD: {
15450b57cec5SDimitry Andric SDValue N0 = N.getOperand(0);
15460b57cec5SDimitry Andric SDValue N1 = N.getOperand(1);
15470b57cec5SDimitry Andric unsigned GAOpc = N0.getOpcode();
15480b57cec5SDimitry Andric if (UseGP && GAOpc != HexagonISD::CONST32_GP)
15490b57cec5SDimitry Andric return false;
15500b57cec5SDimitry Andric if (!UseGP && GAOpc != HexagonISD::CONST32)
15510b57cec5SDimitry Andric return false;
15520b57cec5SDimitry Andric if (ConstantSDNode *Const = dyn_cast<ConstantSDNode>(N1)) {
15535ffd83dbSDimitry Andric if (!isAligned(Alignment, Const->getZExtValue()))
15540b57cec5SDimitry Andric return false;
15555ffd83dbSDimitry Andric SDValue Addr = N0.getOperand(0);
15560b57cec5SDimitry Andric if (GlobalAddressSDNode *GA = dyn_cast<GlobalAddressSDNode>(Addr)) {
15570b57cec5SDimitry Andric if (GA->getOpcode() == ISD::TargetGlobalAddress) {
15580b57cec5SDimitry Andric uint64_t NewOff = GA->getOffset() + (uint64_t)Const->getSExtValue();
15590b57cec5SDimitry Andric R = CurDAG->getTargetGlobalAddress(GA->getGlobal(), SDLoc(Const),
15600b57cec5SDimitry Andric N.getValueType(), NewOff);
15610b57cec5SDimitry Andric return true;
15620b57cec5SDimitry Andric }
15630b57cec5SDimitry Andric }
15640b57cec5SDimitry Andric }
15650b57cec5SDimitry Andric break;
15660b57cec5SDimitry Andric }
15670b57cec5SDimitry Andric case HexagonISD::CP:
15680b57cec5SDimitry Andric case HexagonISD::JT:
15690b57cec5SDimitry Andric case HexagonISD::CONST32:
15700b57cec5SDimitry Andric // The operand(0) of CONST32 is TargetGlobalAddress, which is what we
15710b57cec5SDimitry Andric // want in the instruction.
15720b57cec5SDimitry Andric if (!UseGP)
15730b57cec5SDimitry Andric R = N.getOperand(0);
15740b57cec5SDimitry Andric return !UseGP;
15750b57cec5SDimitry Andric case HexagonISD::CONST32_GP:
15760b57cec5SDimitry Andric if (UseGP)
15770b57cec5SDimitry Andric R = N.getOperand(0);
15780b57cec5SDimitry Andric return UseGP;
15790b57cec5SDimitry Andric default:
15800b57cec5SDimitry Andric return false;
15810b57cec5SDimitry Andric }
15820b57cec5SDimitry Andric
15830b57cec5SDimitry Andric return false;
15840b57cec5SDimitry Andric }
15850b57cec5SDimitry Andric
DetectUseSxtw(SDValue & N,SDValue & R)15860b57cec5SDimitry Andric bool HexagonDAGToDAGISel::DetectUseSxtw(SDValue &N, SDValue &R) {
15870b57cec5SDimitry Andric // This (complex pattern) function is meant to detect a sign-extension
15880b57cec5SDimitry Andric // i32->i64 on a per-operand basis. This would allow writing single
15890b57cec5SDimitry Andric // patterns that would cover a number of combinations of different ways
15900b57cec5SDimitry Andric // a sign-extensions could be written. For example:
15910b57cec5SDimitry Andric // (mul (DetectUseSxtw x) (DetectUseSxtw y)) -> (M2_dpmpyss_s0 x y)
15920b57cec5SDimitry Andric // could match either one of these:
15930b57cec5SDimitry Andric // (mul (sext x) (sext_inreg y))
15940b57cec5SDimitry Andric // (mul (sext-load *p) (sext_inreg y))
15950b57cec5SDimitry Andric // (mul (sext_inreg x) (sext y))
15960b57cec5SDimitry Andric // etc.
15970b57cec5SDimitry Andric //
15980b57cec5SDimitry Andric // The returned value will have type i64 and its low word will
15990b57cec5SDimitry Andric // contain the value being extended. The high bits are not specified.
16000b57cec5SDimitry Andric // The returned type is i64 because the original type of N was i64,
16010b57cec5SDimitry Andric // but the users of this function should only use the low-word of the
16020b57cec5SDimitry Andric // result, e.g.
16030b57cec5SDimitry Andric // (mul sxtw:x, sxtw:y) -> (M2_dpmpyss_s0 (LoReg sxtw:x), (LoReg sxtw:y))
16040b57cec5SDimitry Andric
16050b57cec5SDimitry Andric if (N.getValueType() != MVT::i64)
16060b57cec5SDimitry Andric return false;
16070b57cec5SDimitry Andric unsigned Opc = N.getOpcode();
16080b57cec5SDimitry Andric switch (Opc) {
16090b57cec5SDimitry Andric case ISD::SIGN_EXTEND:
16100b57cec5SDimitry Andric case ISD::SIGN_EXTEND_INREG: {
16110b57cec5SDimitry Andric // sext_inreg has the source type as a separate operand.
16120b57cec5SDimitry Andric EVT T = Opc == ISD::SIGN_EXTEND
16130b57cec5SDimitry Andric ? N.getOperand(0).getValueType()
16140b57cec5SDimitry Andric : cast<VTSDNode>(N.getOperand(1))->getVT();
16150b57cec5SDimitry Andric unsigned SW = T.getSizeInBits();
16160b57cec5SDimitry Andric if (SW == 32)
16170b57cec5SDimitry Andric R = N.getOperand(0);
16180b57cec5SDimitry Andric else if (SW < 32)
16190b57cec5SDimitry Andric R = N;
16200b57cec5SDimitry Andric else
16210b57cec5SDimitry Andric return false;
16220b57cec5SDimitry Andric break;
16230b57cec5SDimitry Andric }
16240b57cec5SDimitry Andric case ISD::LOAD: {
16250b57cec5SDimitry Andric LoadSDNode *L = cast<LoadSDNode>(N);
16260b57cec5SDimitry Andric if (L->getExtensionType() != ISD::SEXTLOAD)
16270b57cec5SDimitry Andric return false;
16280b57cec5SDimitry Andric // All extending loads extend to i32, so even if the value in
16290b57cec5SDimitry Andric // memory is shorter than 32 bits, it will be i32 after the load.
16300b57cec5SDimitry Andric if (L->getMemoryVT().getSizeInBits() > 32)
16310b57cec5SDimitry Andric return false;
16320b57cec5SDimitry Andric R = N;
16330b57cec5SDimitry Andric break;
16340b57cec5SDimitry Andric }
16350b57cec5SDimitry Andric case ISD::SRA: {
16360b57cec5SDimitry Andric auto *S = dyn_cast<ConstantSDNode>(N.getOperand(1));
16370b57cec5SDimitry Andric if (!S || S->getZExtValue() != 32)
16380b57cec5SDimitry Andric return false;
16390b57cec5SDimitry Andric R = N;
16400b57cec5SDimitry Andric break;
16410b57cec5SDimitry Andric }
16420b57cec5SDimitry Andric default:
16430b57cec5SDimitry Andric return false;
16440b57cec5SDimitry Andric }
16450b57cec5SDimitry Andric EVT RT = R.getValueType();
16460b57cec5SDimitry Andric if (RT == MVT::i64)
16470b57cec5SDimitry Andric return true;
16480b57cec5SDimitry Andric assert(RT == MVT::i32);
16490b57cec5SDimitry Andric // This is only to produce a value of type i64. Do not rely on the
16500b57cec5SDimitry Andric // high bits produced by this.
16510b57cec5SDimitry Andric const SDLoc &dl(N);
16520b57cec5SDimitry Andric SDValue Ops[] = {
16530b57cec5SDimitry Andric CurDAG->getTargetConstant(Hexagon::DoubleRegsRegClassID, dl, MVT::i32),
16540b57cec5SDimitry Andric R, CurDAG->getTargetConstant(Hexagon::isub_hi, dl, MVT::i32),
16550b57cec5SDimitry Andric R, CurDAG->getTargetConstant(Hexagon::isub_lo, dl, MVT::i32)
16560b57cec5SDimitry Andric };
16570b57cec5SDimitry Andric SDNode *T = CurDAG->getMachineNode(TargetOpcode::REG_SEQUENCE, dl,
16580b57cec5SDimitry Andric MVT::i64, Ops);
16590b57cec5SDimitry Andric R = SDValue(T, 0);
16600b57cec5SDimitry Andric return true;
16610b57cec5SDimitry Andric }
16620b57cec5SDimitry Andric
keepsLowBits(const SDValue & Val,unsigned NumBits,SDValue & Src)16630b57cec5SDimitry Andric bool HexagonDAGToDAGISel::keepsLowBits(const SDValue &Val, unsigned NumBits,
16640b57cec5SDimitry Andric SDValue &Src) {
16650b57cec5SDimitry Andric unsigned Opc = Val.getOpcode();
16660b57cec5SDimitry Andric switch (Opc) {
16670b57cec5SDimitry Andric case ISD::SIGN_EXTEND:
16680b57cec5SDimitry Andric case ISD::ZERO_EXTEND:
16690b57cec5SDimitry Andric case ISD::ANY_EXTEND: {
16700b57cec5SDimitry Andric const SDValue &Op0 = Val.getOperand(0);
16710b57cec5SDimitry Andric EVT T = Op0.getValueType();
16720b57cec5SDimitry Andric if (T.isInteger() && T.getSizeInBits() == NumBits) {
16730b57cec5SDimitry Andric Src = Op0;
16740b57cec5SDimitry Andric return true;
16750b57cec5SDimitry Andric }
16760b57cec5SDimitry Andric break;
16770b57cec5SDimitry Andric }
16780b57cec5SDimitry Andric case ISD::SIGN_EXTEND_INREG:
16790b57cec5SDimitry Andric case ISD::AssertSext:
16800b57cec5SDimitry Andric case ISD::AssertZext:
16810b57cec5SDimitry Andric if (Val.getOperand(0).getValueType().isInteger()) {
16820b57cec5SDimitry Andric VTSDNode *T = cast<VTSDNode>(Val.getOperand(1));
16830b57cec5SDimitry Andric if (T->getVT().getSizeInBits() == NumBits) {
16840b57cec5SDimitry Andric Src = Val.getOperand(0);
16850b57cec5SDimitry Andric return true;
16860b57cec5SDimitry Andric }
16870b57cec5SDimitry Andric }
16880b57cec5SDimitry Andric break;
16890b57cec5SDimitry Andric case ISD::AND: {
16900b57cec5SDimitry Andric // Check if this is an AND with NumBits of lower bits set to 1.
169181ad6265SDimitry Andric uint64_t Mask = (1ULL << NumBits) - 1;
16920b57cec5SDimitry Andric if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Val.getOperand(0))) {
16930b57cec5SDimitry Andric if (C->getZExtValue() == Mask) {
16940b57cec5SDimitry Andric Src = Val.getOperand(1);
16950b57cec5SDimitry Andric return true;
16960b57cec5SDimitry Andric }
16970b57cec5SDimitry Andric }
16980b57cec5SDimitry Andric if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Val.getOperand(1))) {
16990b57cec5SDimitry Andric if (C->getZExtValue() == Mask) {
17000b57cec5SDimitry Andric Src = Val.getOperand(0);
17010b57cec5SDimitry Andric return true;
17020b57cec5SDimitry Andric }
17030b57cec5SDimitry Andric }
17040b57cec5SDimitry Andric break;
17050b57cec5SDimitry Andric }
17060b57cec5SDimitry Andric case ISD::OR:
17070b57cec5SDimitry Andric case ISD::XOR: {
17080b57cec5SDimitry Andric // OR/XOR with the lower NumBits bits set to 0.
170981ad6265SDimitry Andric uint64_t Mask = (1ULL << NumBits) - 1;
17100b57cec5SDimitry Andric if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Val.getOperand(0))) {
17110b57cec5SDimitry Andric if ((C->getZExtValue() & Mask) == 0) {
17120b57cec5SDimitry Andric Src = Val.getOperand(1);
17130b57cec5SDimitry Andric return true;
17140b57cec5SDimitry Andric }
17150b57cec5SDimitry Andric }
17160b57cec5SDimitry Andric if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Val.getOperand(1))) {
17170b57cec5SDimitry Andric if ((C->getZExtValue() & Mask) == 0) {
17180b57cec5SDimitry Andric Src = Val.getOperand(0);
17190b57cec5SDimitry Andric return true;
17200b57cec5SDimitry Andric }
17210b57cec5SDimitry Andric }
17220b57cec5SDimitry Andric break;
17230b57cec5SDimitry Andric }
17240b57cec5SDimitry Andric default:
17250b57cec5SDimitry Andric break;
17260b57cec5SDimitry Andric }
17270b57cec5SDimitry Andric return false;
17280b57cec5SDimitry Andric }
17290b57cec5SDimitry Andric
isAlignedMemNode(const MemSDNode * N) const17300b57cec5SDimitry Andric bool HexagonDAGToDAGISel::isAlignedMemNode(const MemSDNode *N) const {
173181ad6265SDimitry Andric return N->getAlign().value() >= N->getMemoryVT().getStoreSize();
17320b57cec5SDimitry Andric }
17330b57cec5SDimitry Andric
isSmallStackStore(const StoreSDNode * N) const17340b57cec5SDimitry Andric bool HexagonDAGToDAGISel::isSmallStackStore(const StoreSDNode *N) const {
17350b57cec5SDimitry Andric unsigned StackSize = MF->getFrameInfo().estimateStackSize(*MF);
17360b57cec5SDimitry Andric switch (N->getMemoryVT().getStoreSize()) {
17370b57cec5SDimitry Andric case 1:
17380b57cec5SDimitry Andric return StackSize <= 56; // 1*2^6 - 8
17390b57cec5SDimitry Andric case 2:
17400b57cec5SDimitry Andric return StackSize <= 120; // 2*2^6 - 8
17410b57cec5SDimitry Andric case 4:
17420b57cec5SDimitry Andric return StackSize <= 248; // 4*2^6 - 8
17430b57cec5SDimitry Andric default:
17440b57cec5SDimitry Andric return false;
17450b57cec5SDimitry Andric }
17460b57cec5SDimitry Andric }
17470b57cec5SDimitry Andric
17480b57cec5SDimitry Andric // Return true when the given node fits in a positive half word.
isPositiveHalfWord(const SDNode * N) const17490b57cec5SDimitry Andric bool HexagonDAGToDAGISel::isPositiveHalfWord(const SDNode *N) const {
17500b57cec5SDimitry Andric if (const ConstantSDNode *CN = dyn_cast<const ConstantSDNode>(N)) {
17510b57cec5SDimitry Andric int64_t V = CN->getSExtValue();
17520b57cec5SDimitry Andric return V > 0 && isInt<16>(V);
17530b57cec5SDimitry Andric }
17540b57cec5SDimitry Andric if (N->getOpcode() == ISD::SIGN_EXTEND_INREG) {
17550b57cec5SDimitry Andric const VTSDNode *VN = dyn_cast<const VTSDNode>(N->getOperand(1));
17560b57cec5SDimitry Andric return VN->getVT().getSizeInBits() <= 16;
17570b57cec5SDimitry Andric }
17580b57cec5SDimitry Andric return false;
17590b57cec5SDimitry Andric }
17600b57cec5SDimitry Andric
hasOneUse(const SDNode * N) const17610b57cec5SDimitry Andric bool HexagonDAGToDAGISel::hasOneUse(const SDNode *N) const {
17620b57cec5SDimitry Andric return !CheckSingleUse || N->hasOneUse();
17630b57cec5SDimitry Andric }
17640b57cec5SDimitry Andric
17650b57cec5SDimitry Andric ////////////////////////////////////////////////////////////////////////////////
17660b57cec5SDimitry Andric // Rebalancing of address calculation trees
17670b57cec5SDimitry Andric
isOpcodeHandled(const SDNode * N)17680b57cec5SDimitry Andric static bool isOpcodeHandled(const SDNode *N) {
17690b57cec5SDimitry Andric switch (N->getOpcode()) {
17700b57cec5SDimitry Andric case ISD::ADD:
17710b57cec5SDimitry Andric case ISD::MUL:
17720b57cec5SDimitry Andric return true;
17730b57cec5SDimitry Andric case ISD::SHL:
17740b57cec5SDimitry Andric // We only handle constant shifts because these can be easily flattened
17750b57cec5SDimitry Andric // into multiplications by 2^Op1.
17760b57cec5SDimitry Andric return isa<ConstantSDNode>(N->getOperand(1).getNode());
17770b57cec5SDimitry Andric default:
17780b57cec5SDimitry Andric return false;
17790b57cec5SDimitry Andric }
17800b57cec5SDimitry Andric }
17810b57cec5SDimitry Andric
17820b57cec5SDimitry Andric /// Return the weight of an SDNode
getWeight(SDNode * N)17830b57cec5SDimitry Andric int HexagonDAGToDAGISel::getWeight(SDNode *N) {
17840b57cec5SDimitry Andric if (!isOpcodeHandled(N))
17850b57cec5SDimitry Andric return 1;
17860b57cec5SDimitry Andric assert(RootWeights.count(N) && "Cannot get weight of unseen root!");
17870b57cec5SDimitry Andric assert(RootWeights[N] != -1 && "Cannot get weight of unvisited root!");
17880b57cec5SDimitry Andric assert(RootWeights[N] != -2 && "Cannot get weight of RAWU'd root!");
17890b57cec5SDimitry Andric return RootWeights[N];
17900b57cec5SDimitry Andric }
17910b57cec5SDimitry Andric
getHeight(SDNode * N)17920b57cec5SDimitry Andric int HexagonDAGToDAGISel::getHeight(SDNode *N) {
17930b57cec5SDimitry Andric if (!isOpcodeHandled(N))
17940b57cec5SDimitry Andric return 0;
17950b57cec5SDimitry Andric assert(RootWeights.count(N) && RootWeights[N] >= 0 &&
17960b57cec5SDimitry Andric "Cannot query height of unvisited/RAUW'd node!");
17970b57cec5SDimitry Andric return RootHeights[N];
17980b57cec5SDimitry Andric }
17990b57cec5SDimitry Andric
18000b57cec5SDimitry Andric namespace {
18010b57cec5SDimitry Andric struct WeightedLeaf {
18020b57cec5SDimitry Andric SDValue Value;
18030b57cec5SDimitry Andric int Weight;
18040b57cec5SDimitry Andric int InsertionOrder;
18050b57cec5SDimitry Andric
WeightedLeaf__anon14d602910611::WeightedLeaf180681ad6265SDimitry Andric WeightedLeaf() {}
18070b57cec5SDimitry Andric
WeightedLeaf__anon14d602910611::WeightedLeaf18080b57cec5SDimitry Andric WeightedLeaf(SDValue Value, int Weight, int InsertionOrder) :
18090b57cec5SDimitry Andric Value(Value), Weight(Weight), InsertionOrder(InsertionOrder) {
18100b57cec5SDimitry Andric assert(Weight >= 0 && "Weight must be >= 0");
18110b57cec5SDimitry Andric }
18120b57cec5SDimitry Andric
Compare__anon14d602910611::WeightedLeaf18130b57cec5SDimitry Andric static bool Compare(const WeightedLeaf &A, const WeightedLeaf &B) {
18140b57cec5SDimitry Andric assert(A.Value.getNode() && B.Value.getNode());
18150b57cec5SDimitry Andric return A.Weight == B.Weight ?
18160b57cec5SDimitry Andric (A.InsertionOrder > B.InsertionOrder) :
18170b57cec5SDimitry Andric (A.Weight > B.Weight);
18180b57cec5SDimitry Andric }
18190b57cec5SDimitry Andric };
18200b57cec5SDimitry Andric
18210b57cec5SDimitry Andric /// A specialized priority queue for WeigthedLeaves. It automatically folds
18220b57cec5SDimitry Andric /// constants and allows removal of non-top elements while maintaining the
18230b57cec5SDimitry Andric /// priority order.
18240b57cec5SDimitry Andric class LeafPrioQueue {
18250b57cec5SDimitry Andric SmallVector<WeightedLeaf, 8> Q;
18260b57cec5SDimitry Andric bool HaveConst;
18270b57cec5SDimitry Andric WeightedLeaf ConstElt;
18280b57cec5SDimitry Andric unsigned Opcode;
18290b57cec5SDimitry Andric
18300b57cec5SDimitry Andric public:
empty()18310b57cec5SDimitry Andric bool empty() {
18320b57cec5SDimitry Andric return (!HaveConst && Q.empty());
18330b57cec5SDimitry Andric }
18340b57cec5SDimitry Andric
size()18350b57cec5SDimitry Andric size_t size() {
18360b57cec5SDimitry Andric return Q.size() + HaveConst;
18370b57cec5SDimitry Andric }
18380b57cec5SDimitry Andric
hasConst()18390b57cec5SDimitry Andric bool hasConst() {
18400b57cec5SDimitry Andric return HaveConst;
18410b57cec5SDimitry Andric }
18420b57cec5SDimitry Andric
top()18430b57cec5SDimitry Andric const WeightedLeaf &top() {
18440b57cec5SDimitry Andric if (HaveConst)
18450b57cec5SDimitry Andric return ConstElt;
18460b57cec5SDimitry Andric return Q.front();
18470b57cec5SDimitry Andric }
18480b57cec5SDimitry Andric
pop()18490b57cec5SDimitry Andric WeightedLeaf pop() {
18500b57cec5SDimitry Andric if (HaveConst) {
18510b57cec5SDimitry Andric HaveConst = false;
18520b57cec5SDimitry Andric return ConstElt;
18530b57cec5SDimitry Andric }
18540b57cec5SDimitry Andric std::pop_heap(Q.begin(), Q.end(), WeightedLeaf::Compare);
18550b57cec5SDimitry Andric return Q.pop_back_val();
18560b57cec5SDimitry Andric }
18570b57cec5SDimitry Andric
push(WeightedLeaf L,bool SeparateConst=true)18580b57cec5SDimitry Andric void push(WeightedLeaf L, bool SeparateConst=true) {
18590b57cec5SDimitry Andric if (!HaveConst && SeparateConst && isa<ConstantSDNode>(L.Value)) {
18600b57cec5SDimitry Andric if (Opcode == ISD::MUL &&
18610b57cec5SDimitry Andric cast<ConstantSDNode>(L.Value)->getSExtValue() == 1)
18620b57cec5SDimitry Andric return;
18630b57cec5SDimitry Andric if (Opcode == ISD::ADD &&
18640b57cec5SDimitry Andric cast<ConstantSDNode>(L.Value)->getSExtValue() == 0)
18650b57cec5SDimitry Andric return;
18660b57cec5SDimitry Andric
18670b57cec5SDimitry Andric HaveConst = true;
18680b57cec5SDimitry Andric ConstElt = L;
18690b57cec5SDimitry Andric } else {
18700b57cec5SDimitry Andric Q.push_back(L);
18710b57cec5SDimitry Andric std::push_heap(Q.begin(), Q.end(), WeightedLeaf::Compare);
18720b57cec5SDimitry Andric }
18730b57cec5SDimitry Andric }
18740b57cec5SDimitry Andric
18750b57cec5SDimitry Andric /// Push L to the bottom of the queue regardless of its weight. If L is
18760b57cec5SDimitry Andric /// constant, it will not be folded with other constants in the queue.
pushToBottom(WeightedLeaf L)18770b57cec5SDimitry Andric void pushToBottom(WeightedLeaf L) {
18780b57cec5SDimitry Andric L.Weight = 1000;
18790b57cec5SDimitry Andric push(L, false);
18800b57cec5SDimitry Andric }
18810b57cec5SDimitry Andric
18820b57cec5SDimitry Andric /// Search for a SHL(x, [<=MaxAmount]) subtree in the queue, return the one of
18830b57cec5SDimitry Andric /// lowest weight and remove it from the queue.
18840b57cec5SDimitry Andric WeightedLeaf findSHL(uint64_t MaxAmount);
18850b57cec5SDimitry Andric
18860b57cec5SDimitry Andric WeightedLeaf findMULbyConst();
18870b57cec5SDimitry Andric
LeafPrioQueue(unsigned Opcode)18880b57cec5SDimitry Andric LeafPrioQueue(unsigned Opcode) :
18890b57cec5SDimitry Andric HaveConst(false), Opcode(Opcode) { }
18900b57cec5SDimitry Andric };
18910b57cec5SDimitry Andric } // end anonymous namespace
18920b57cec5SDimitry Andric
findSHL(uint64_t MaxAmount)18930b57cec5SDimitry Andric WeightedLeaf LeafPrioQueue::findSHL(uint64_t MaxAmount) {
18940b57cec5SDimitry Andric int ResultPos;
18950b57cec5SDimitry Andric WeightedLeaf Result;
18960b57cec5SDimitry Andric
18970b57cec5SDimitry Andric for (int Pos = 0, End = Q.size(); Pos != End; ++Pos) {
18980b57cec5SDimitry Andric const WeightedLeaf &L = Q[Pos];
18990b57cec5SDimitry Andric const SDValue &Val = L.Value;
19000b57cec5SDimitry Andric if (Val.getOpcode() != ISD::SHL ||
19010b57cec5SDimitry Andric !isa<ConstantSDNode>(Val.getOperand(1)) ||
19020b57cec5SDimitry Andric Val.getConstantOperandVal(1) > MaxAmount)
19030b57cec5SDimitry Andric continue;
19040b57cec5SDimitry Andric if (!Result.Value.getNode() || Result.Weight > L.Weight ||
19050b57cec5SDimitry Andric (Result.Weight == L.Weight && Result.InsertionOrder > L.InsertionOrder))
19060b57cec5SDimitry Andric {
19070b57cec5SDimitry Andric Result = L;
19080b57cec5SDimitry Andric ResultPos = Pos;
19090b57cec5SDimitry Andric }
19100b57cec5SDimitry Andric }
19110b57cec5SDimitry Andric
19120b57cec5SDimitry Andric if (Result.Value.getNode()) {
19130b57cec5SDimitry Andric Q.erase(&Q[ResultPos]);
19140b57cec5SDimitry Andric std::make_heap(Q.begin(), Q.end(), WeightedLeaf::Compare);
19150b57cec5SDimitry Andric }
19160b57cec5SDimitry Andric
19170b57cec5SDimitry Andric return Result;
19180b57cec5SDimitry Andric }
19190b57cec5SDimitry Andric
findMULbyConst()19200b57cec5SDimitry Andric WeightedLeaf LeafPrioQueue::findMULbyConst() {
19210b57cec5SDimitry Andric int ResultPos;
19220b57cec5SDimitry Andric WeightedLeaf Result;
19230b57cec5SDimitry Andric
19240b57cec5SDimitry Andric for (int Pos = 0, End = Q.size(); Pos != End; ++Pos) {
19250b57cec5SDimitry Andric const WeightedLeaf &L = Q[Pos];
19260b57cec5SDimitry Andric const SDValue &Val = L.Value;
19270b57cec5SDimitry Andric if (Val.getOpcode() != ISD::MUL ||
19280b57cec5SDimitry Andric !isa<ConstantSDNode>(Val.getOperand(1)) ||
19290b57cec5SDimitry Andric Val.getConstantOperandVal(1) > 127)
19300b57cec5SDimitry Andric continue;
19310b57cec5SDimitry Andric if (!Result.Value.getNode() || Result.Weight > L.Weight ||
19320b57cec5SDimitry Andric (Result.Weight == L.Weight && Result.InsertionOrder > L.InsertionOrder))
19330b57cec5SDimitry Andric {
19340b57cec5SDimitry Andric Result = L;
19350b57cec5SDimitry Andric ResultPos = Pos;
19360b57cec5SDimitry Andric }
19370b57cec5SDimitry Andric }
19380b57cec5SDimitry Andric
19390b57cec5SDimitry Andric if (Result.Value.getNode()) {
19400b57cec5SDimitry Andric Q.erase(&Q[ResultPos]);
19410b57cec5SDimitry Andric std::make_heap(Q.begin(), Q.end(), WeightedLeaf::Compare);
19420b57cec5SDimitry Andric }
19430b57cec5SDimitry Andric
19440b57cec5SDimitry Andric return Result;
19450b57cec5SDimitry Andric }
19460b57cec5SDimitry Andric
getMultiplierForSHL(SDNode * N)19470b57cec5SDimitry Andric SDValue HexagonDAGToDAGISel::getMultiplierForSHL(SDNode *N) {
19480b57cec5SDimitry Andric uint64_t MulFactor = 1ull << N->getConstantOperandVal(1);
19490b57cec5SDimitry Andric return CurDAG->getConstant(MulFactor, SDLoc(N),
19500b57cec5SDimitry Andric N->getOperand(1).getValueType());
19510b57cec5SDimitry Andric }
19520b57cec5SDimitry Andric
19530b57cec5SDimitry Andric /// @returns the value x for which 2^x is a factor of Val
getPowerOf2Factor(SDValue Val)19540b57cec5SDimitry Andric static unsigned getPowerOf2Factor(SDValue Val) {
19550b57cec5SDimitry Andric if (Val.getOpcode() == ISD::MUL) {
19560b57cec5SDimitry Andric unsigned MaxFactor = 0;
19570b57cec5SDimitry Andric for (int i = 0; i < 2; ++i) {
19580b57cec5SDimitry Andric ConstantSDNode *C = dyn_cast<ConstantSDNode>(Val.getOperand(i));
19590b57cec5SDimitry Andric if (!C)
19600b57cec5SDimitry Andric continue;
19610b57cec5SDimitry Andric const APInt &CInt = C->getAPIntValue();
19620b57cec5SDimitry Andric if (CInt.getBoolValue())
196306c3fb27SDimitry Andric MaxFactor = CInt.countr_zero();
19640b57cec5SDimitry Andric }
19650b57cec5SDimitry Andric return MaxFactor;
19660b57cec5SDimitry Andric }
19670b57cec5SDimitry Andric if (Val.getOpcode() == ISD::SHL) {
19680b57cec5SDimitry Andric if (!isa<ConstantSDNode>(Val.getOperand(1).getNode()))
19690b57cec5SDimitry Andric return 0;
19700b57cec5SDimitry Andric return (unsigned) Val.getConstantOperandVal(1);
19710b57cec5SDimitry Andric }
19720b57cec5SDimitry Andric
19730b57cec5SDimitry Andric return 0;
19740b57cec5SDimitry Andric }
19750b57cec5SDimitry Andric
19760b57cec5SDimitry Andric /// @returns true if V>>Amount will eliminate V's operation on its child
willShiftRightEliminate(SDValue V,unsigned Amount)19770b57cec5SDimitry Andric static bool willShiftRightEliminate(SDValue V, unsigned Amount) {
19780b57cec5SDimitry Andric if (V.getOpcode() == ISD::MUL) {
19790b57cec5SDimitry Andric SDValue Ops[] = { V.getOperand(0), V.getOperand(1) };
19800b57cec5SDimitry Andric for (int i = 0; i < 2; ++i)
19810b57cec5SDimitry Andric if (isa<ConstantSDNode>(Ops[i].getNode()) &&
19820b57cec5SDimitry Andric V.getConstantOperandVal(i) % (1ULL << Amount) == 0) {
19830b57cec5SDimitry Andric uint64_t NewConst = V.getConstantOperandVal(i) >> Amount;
19840b57cec5SDimitry Andric return (NewConst == 1);
19850b57cec5SDimitry Andric }
19860b57cec5SDimitry Andric } else if (V.getOpcode() == ISD::SHL) {
19870b57cec5SDimitry Andric return (Amount == V.getConstantOperandVal(1));
19880b57cec5SDimitry Andric }
19890b57cec5SDimitry Andric
19900b57cec5SDimitry Andric return false;
19910b57cec5SDimitry Andric }
19920b57cec5SDimitry Andric
factorOutPowerOf2(SDValue V,unsigned Power)19930b57cec5SDimitry Andric SDValue HexagonDAGToDAGISel::factorOutPowerOf2(SDValue V, unsigned Power) {
19940b57cec5SDimitry Andric SDValue Ops[] = { V.getOperand(0), V.getOperand(1) };
19950b57cec5SDimitry Andric if (V.getOpcode() == ISD::MUL) {
19960b57cec5SDimitry Andric for (int i=0; i < 2; ++i) {
19970b57cec5SDimitry Andric if (isa<ConstantSDNode>(Ops[i].getNode()) &&
19980b57cec5SDimitry Andric V.getConstantOperandVal(i) % ((uint64_t)1 << Power) == 0) {
19990b57cec5SDimitry Andric uint64_t NewConst = V.getConstantOperandVal(i) >> Power;
20000b57cec5SDimitry Andric if (NewConst == 1)
20010b57cec5SDimitry Andric return Ops[!i];
20020b57cec5SDimitry Andric Ops[i] = CurDAG->getConstant(NewConst,
20030b57cec5SDimitry Andric SDLoc(V), V.getValueType());
20040b57cec5SDimitry Andric break;
20050b57cec5SDimitry Andric }
20060b57cec5SDimitry Andric }
20070b57cec5SDimitry Andric } else if (V.getOpcode() == ISD::SHL) {
20080b57cec5SDimitry Andric uint64_t ShiftAmount = V.getConstantOperandVal(1);
20090b57cec5SDimitry Andric if (ShiftAmount == Power)
20100b57cec5SDimitry Andric return Ops[0];
20110b57cec5SDimitry Andric Ops[1] = CurDAG->getConstant(ShiftAmount - Power,
20120b57cec5SDimitry Andric SDLoc(V), V.getValueType());
20130b57cec5SDimitry Andric }
20140b57cec5SDimitry Andric
20150b57cec5SDimitry Andric return CurDAG->getNode(V.getOpcode(), SDLoc(V), V.getValueType(), Ops);
20160b57cec5SDimitry Andric }
20170b57cec5SDimitry Andric
isTargetConstant(const SDValue & V)20180b57cec5SDimitry Andric static bool isTargetConstant(const SDValue &V) {
20190b57cec5SDimitry Andric return V.getOpcode() == HexagonISD::CONST32 ||
20200b57cec5SDimitry Andric V.getOpcode() == HexagonISD::CONST32_GP;
20210b57cec5SDimitry Andric }
20220b57cec5SDimitry Andric
getUsesInFunction(const Value * V)20230b57cec5SDimitry Andric unsigned HexagonDAGToDAGISel::getUsesInFunction(const Value *V) {
20240b57cec5SDimitry Andric if (GAUsesInFunction.count(V))
20250b57cec5SDimitry Andric return GAUsesInFunction[V];
20260b57cec5SDimitry Andric
20270b57cec5SDimitry Andric unsigned Result = 0;
20280b57cec5SDimitry Andric const Function &CurF = CurDAG->getMachineFunction().getFunction();
20290b57cec5SDimitry Andric for (const User *U : V->users()) {
20300b57cec5SDimitry Andric if (isa<Instruction>(U) &&
20310b57cec5SDimitry Andric cast<Instruction>(U)->getParent()->getParent() == &CurF)
20320b57cec5SDimitry Andric ++Result;
20330b57cec5SDimitry Andric }
20340b57cec5SDimitry Andric
20350b57cec5SDimitry Andric GAUsesInFunction[V] = Result;
20360b57cec5SDimitry Andric
20370b57cec5SDimitry Andric return Result;
20380b57cec5SDimitry Andric }
20390b57cec5SDimitry Andric
20400b57cec5SDimitry Andric /// Note - After calling this, N may be dead. It may have been replaced by a
20410b57cec5SDimitry Andric /// new node, so always use the returned value in place of N.
20420b57cec5SDimitry Andric ///
20430b57cec5SDimitry Andric /// @returns The SDValue taking the place of N (which could be N if it is
20440b57cec5SDimitry Andric /// unchanged)
balanceSubTree(SDNode * N,bool TopLevel)20450b57cec5SDimitry Andric SDValue HexagonDAGToDAGISel::balanceSubTree(SDNode *N, bool TopLevel) {
20460b57cec5SDimitry Andric assert(RootWeights.count(N) && "Cannot balance non-root node.");
20470b57cec5SDimitry Andric assert(RootWeights[N] != -2 && "This node was RAUW'd!");
20480b57cec5SDimitry Andric assert(!TopLevel || N->getOpcode() == ISD::ADD);
20490b57cec5SDimitry Andric
20500b57cec5SDimitry Andric // Return early if this node was already visited
20510b57cec5SDimitry Andric if (RootWeights[N] != -1)
20520b57cec5SDimitry Andric return SDValue(N, 0);
20530b57cec5SDimitry Andric
20540b57cec5SDimitry Andric assert(isOpcodeHandled(N));
20550b57cec5SDimitry Andric
20560b57cec5SDimitry Andric SDValue Op0 = N->getOperand(0);
20570b57cec5SDimitry Andric SDValue Op1 = N->getOperand(1);
20580b57cec5SDimitry Andric
20590b57cec5SDimitry Andric // Return early if the operands will remain unchanged or are all roots
20600b57cec5SDimitry Andric if ((!isOpcodeHandled(Op0.getNode()) || RootWeights.count(Op0.getNode())) &&
20610b57cec5SDimitry Andric (!isOpcodeHandled(Op1.getNode()) || RootWeights.count(Op1.getNode()))) {
20620b57cec5SDimitry Andric SDNode *Op0N = Op0.getNode();
20630b57cec5SDimitry Andric int Weight;
20640b57cec5SDimitry Andric if (isOpcodeHandled(Op0N) && RootWeights[Op0N] == -1) {
20650b57cec5SDimitry Andric Weight = getWeight(balanceSubTree(Op0N).getNode());
20660b57cec5SDimitry Andric // Weight = calculateWeight(Op0N);
20670b57cec5SDimitry Andric } else
20680b57cec5SDimitry Andric Weight = getWeight(Op0N);
20690b57cec5SDimitry Andric
20700b57cec5SDimitry Andric SDNode *Op1N = N->getOperand(1).getNode(); // Op1 may have been RAUWd
20710b57cec5SDimitry Andric if (isOpcodeHandled(Op1N) && RootWeights[Op1N] == -1) {
20720b57cec5SDimitry Andric Weight += getWeight(balanceSubTree(Op1N).getNode());
20730b57cec5SDimitry Andric // Weight += calculateWeight(Op1N);
20740b57cec5SDimitry Andric } else
20750b57cec5SDimitry Andric Weight += getWeight(Op1N);
20760b57cec5SDimitry Andric
20770b57cec5SDimitry Andric RootWeights[N] = Weight;
20780b57cec5SDimitry Andric RootHeights[N] = std::max(getHeight(N->getOperand(0).getNode()),
20790b57cec5SDimitry Andric getHeight(N->getOperand(1).getNode())) + 1;
20800b57cec5SDimitry Andric
20810b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "--> No need to balance root (Weight=" << Weight
20820b57cec5SDimitry Andric << " Height=" << RootHeights[N] << "): ");
20830b57cec5SDimitry Andric LLVM_DEBUG(N->dump(CurDAG));
20840b57cec5SDimitry Andric
20850b57cec5SDimitry Andric return SDValue(N, 0);
20860b57cec5SDimitry Andric }
20870b57cec5SDimitry Andric
20880b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "** Balancing root node: ");
20890b57cec5SDimitry Andric LLVM_DEBUG(N->dump(CurDAG));
20900b57cec5SDimitry Andric
20910b57cec5SDimitry Andric unsigned NOpcode = N->getOpcode();
20920b57cec5SDimitry Andric
20930b57cec5SDimitry Andric LeafPrioQueue Leaves(NOpcode);
20940b57cec5SDimitry Andric SmallVector<SDValue, 4> Worklist;
20950b57cec5SDimitry Andric Worklist.push_back(SDValue(N, 0));
20960b57cec5SDimitry Andric
20970b57cec5SDimitry Andric // SHL nodes will be converted to MUL nodes
20980b57cec5SDimitry Andric if (NOpcode == ISD::SHL)
20990b57cec5SDimitry Andric NOpcode = ISD::MUL;
21000b57cec5SDimitry Andric
21010b57cec5SDimitry Andric bool CanFactorize = false;
21020b57cec5SDimitry Andric WeightedLeaf Mul1, Mul2;
21030b57cec5SDimitry Andric unsigned MaxPowerOf2 = 0;
21040b57cec5SDimitry Andric WeightedLeaf GA;
21050b57cec5SDimitry Andric
21060b57cec5SDimitry Andric // Do not try to factor out a shift if there is already a shift at the tip of
21070b57cec5SDimitry Andric // the tree.
21080b57cec5SDimitry Andric bool HaveTopLevelShift = false;
21090b57cec5SDimitry Andric if (TopLevel &&
21100b57cec5SDimitry Andric ((isOpcodeHandled(Op0.getNode()) && Op0.getOpcode() == ISD::SHL &&
21110b57cec5SDimitry Andric Op0.getConstantOperandVal(1) < 4) ||
21120b57cec5SDimitry Andric (isOpcodeHandled(Op1.getNode()) && Op1.getOpcode() == ISD::SHL &&
21130b57cec5SDimitry Andric Op1.getConstantOperandVal(1) < 4)))
21140b57cec5SDimitry Andric HaveTopLevelShift = true;
21150b57cec5SDimitry Andric
21160b57cec5SDimitry Andric // Flatten the subtree into an ordered list of leaves; at the same time
21170b57cec5SDimitry Andric // determine whether the tree is already balanced.
21180b57cec5SDimitry Andric int InsertionOrder = 0;
21190b57cec5SDimitry Andric SmallDenseMap<SDValue, int> NodeHeights;
21200b57cec5SDimitry Andric bool Imbalanced = false;
21210b57cec5SDimitry Andric int CurrentWeight = 0;
21220b57cec5SDimitry Andric while (!Worklist.empty()) {
21230b57cec5SDimitry Andric SDValue Child = Worklist.pop_back_val();
21240b57cec5SDimitry Andric
21250b57cec5SDimitry Andric if (Child.getNode() != N && RootWeights.count(Child.getNode())) {
21260b57cec5SDimitry Andric // CASE 1: Child is a root note
21270b57cec5SDimitry Andric
21280b57cec5SDimitry Andric int Weight = RootWeights[Child.getNode()];
21290b57cec5SDimitry Andric if (Weight == -1) {
21300b57cec5SDimitry Andric Child = balanceSubTree(Child.getNode());
21310b57cec5SDimitry Andric // calculateWeight(Child.getNode());
21320b57cec5SDimitry Andric Weight = getWeight(Child.getNode());
21330b57cec5SDimitry Andric } else if (Weight == -2) {
21340b57cec5SDimitry Andric // Whoops, this node was RAUWd by one of the balanceSubTree calls we
21350b57cec5SDimitry Andric // made. Our worklist isn't up to date anymore.
21360b57cec5SDimitry Andric // Restart the whole process.
21370b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "--> Subtree was RAUWd. Restarting...\n");
21380b57cec5SDimitry Andric return balanceSubTree(N, TopLevel);
21390b57cec5SDimitry Andric }
21400b57cec5SDimitry Andric
21410b57cec5SDimitry Andric NodeHeights[Child] = 1;
21420b57cec5SDimitry Andric CurrentWeight += Weight;
21430b57cec5SDimitry Andric
21440b57cec5SDimitry Andric unsigned PowerOf2;
21450b57cec5SDimitry Andric if (TopLevel && !CanFactorize && !HaveTopLevelShift &&
21460b57cec5SDimitry Andric (Child.getOpcode() == ISD::MUL || Child.getOpcode() == ISD::SHL) &&
21470b57cec5SDimitry Andric Child.hasOneUse() && (PowerOf2 = getPowerOf2Factor(Child))) {
21480b57cec5SDimitry Andric // Try to identify two factorizable MUL/SHL children greedily. Leave
21490b57cec5SDimitry Andric // them out of the priority queue for now so we can deal with them
21500b57cec5SDimitry Andric // after.
21510b57cec5SDimitry Andric if (!Mul1.Value.getNode()) {
21520b57cec5SDimitry Andric Mul1 = WeightedLeaf(Child, Weight, InsertionOrder++);
21530b57cec5SDimitry Andric MaxPowerOf2 = PowerOf2;
21540b57cec5SDimitry Andric } else {
21550b57cec5SDimitry Andric Mul2 = WeightedLeaf(Child, Weight, InsertionOrder++);
21560b57cec5SDimitry Andric MaxPowerOf2 = std::min(MaxPowerOf2, PowerOf2);
21570b57cec5SDimitry Andric
21580b57cec5SDimitry Andric // Our addressing modes can only shift by a maximum of 3
21590b57cec5SDimitry Andric if (MaxPowerOf2 > 3)
21600b57cec5SDimitry Andric MaxPowerOf2 = 3;
21610b57cec5SDimitry Andric
21620b57cec5SDimitry Andric CanFactorize = true;
21630b57cec5SDimitry Andric }
21640b57cec5SDimitry Andric } else
21650b57cec5SDimitry Andric Leaves.push(WeightedLeaf(Child, Weight, InsertionOrder++));
21660b57cec5SDimitry Andric } else if (!isOpcodeHandled(Child.getNode())) {
21670b57cec5SDimitry Andric // CASE 2: Child is an unhandled kind of node (e.g. constant)
21680b57cec5SDimitry Andric int Weight = getWeight(Child.getNode());
21690b57cec5SDimitry Andric
21700b57cec5SDimitry Andric NodeHeights[Child] = getHeight(Child.getNode());
21710b57cec5SDimitry Andric CurrentWeight += Weight;
21720b57cec5SDimitry Andric
21730b57cec5SDimitry Andric if (isTargetConstant(Child) && !GA.Value.getNode())
21740b57cec5SDimitry Andric GA = WeightedLeaf(Child, Weight, InsertionOrder++);
21750b57cec5SDimitry Andric else
21760b57cec5SDimitry Andric Leaves.push(WeightedLeaf(Child, Weight, InsertionOrder++));
21770b57cec5SDimitry Andric } else {
21780b57cec5SDimitry Andric // CASE 3: Child is a subtree of same opcode
21790b57cec5SDimitry Andric // Visit children first, then flatten.
21800b57cec5SDimitry Andric unsigned ChildOpcode = Child.getOpcode();
21810b57cec5SDimitry Andric assert(ChildOpcode == NOpcode ||
21820b57cec5SDimitry Andric (NOpcode == ISD::MUL && ChildOpcode == ISD::SHL));
21830b57cec5SDimitry Andric
21840b57cec5SDimitry Andric // Convert SHL to MUL
21850b57cec5SDimitry Andric SDValue Op1;
21860b57cec5SDimitry Andric if (ChildOpcode == ISD::SHL)
21870b57cec5SDimitry Andric Op1 = getMultiplierForSHL(Child.getNode());
21880b57cec5SDimitry Andric else
21890b57cec5SDimitry Andric Op1 = Child->getOperand(1);
21900b57cec5SDimitry Andric
21910b57cec5SDimitry Andric if (!NodeHeights.count(Op1) || !NodeHeights.count(Child->getOperand(0))) {
21920b57cec5SDimitry Andric assert(!NodeHeights.count(Child) && "Parent visited before children?");
21930b57cec5SDimitry Andric // Visit children first, then re-visit this node
21940b57cec5SDimitry Andric Worklist.push_back(Child);
21950b57cec5SDimitry Andric Worklist.push_back(Op1);
21960b57cec5SDimitry Andric Worklist.push_back(Child->getOperand(0));
21970b57cec5SDimitry Andric } else {
21980b57cec5SDimitry Andric // Back at this node after visiting the children
21990b57cec5SDimitry Andric if (std::abs(NodeHeights[Op1] - NodeHeights[Child->getOperand(0)]) > 1)
22000b57cec5SDimitry Andric Imbalanced = true;
22010b57cec5SDimitry Andric
22020b57cec5SDimitry Andric NodeHeights[Child] = std::max(NodeHeights[Op1],
22030b57cec5SDimitry Andric NodeHeights[Child->getOperand(0)]) + 1;
22040b57cec5SDimitry Andric }
22050b57cec5SDimitry Andric }
22060b57cec5SDimitry Andric }
22070b57cec5SDimitry Andric
22080b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "--> Current height=" << NodeHeights[SDValue(N, 0)]
22090b57cec5SDimitry Andric << " weight=" << CurrentWeight
22100b57cec5SDimitry Andric << " imbalanced=" << Imbalanced << "\n");
22110b57cec5SDimitry Andric
22120b57cec5SDimitry Andric // Transform MUL(x, C * 2^Y) + SHL(z, Y) -> SHL(ADD(MUL(x, C), z), Y)
22130b57cec5SDimitry Andric // This factors out a shift in order to match memw(a<<Y+b).
22140b57cec5SDimitry Andric if (CanFactorize && (willShiftRightEliminate(Mul1.Value, MaxPowerOf2) ||
22150b57cec5SDimitry Andric willShiftRightEliminate(Mul2.Value, MaxPowerOf2))) {
22160b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "--> Found common factor for two MUL children!\n");
22170b57cec5SDimitry Andric int Weight = Mul1.Weight + Mul2.Weight;
22180b57cec5SDimitry Andric int Height = std::max(NodeHeights[Mul1.Value], NodeHeights[Mul2.Value]) + 1;
22190b57cec5SDimitry Andric SDValue Mul1Factored = factorOutPowerOf2(Mul1.Value, MaxPowerOf2);
22200b57cec5SDimitry Andric SDValue Mul2Factored = factorOutPowerOf2(Mul2.Value, MaxPowerOf2);
22210b57cec5SDimitry Andric SDValue Sum = CurDAG->getNode(ISD::ADD, SDLoc(N), Mul1.Value.getValueType(),
22220b57cec5SDimitry Andric Mul1Factored, Mul2Factored);
22230b57cec5SDimitry Andric SDValue Const = CurDAG->getConstant(MaxPowerOf2, SDLoc(N),
22240b57cec5SDimitry Andric Mul1.Value.getValueType());
22250b57cec5SDimitry Andric SDValue New = CurDAG->getNode(ISD::SHL, SDLoc(N), Mul1.Value.getValueType(),
22260b57cec5SDimitry Andric Sum, Const);
22270b57cec5SDimitry Andric NodeHeights[New] = Height;
22280b57cec5SDimitry Andric Leaves.push(WeightedLeaf(New, Weight, Mul1.InsertionOrder));
22290b57cec5SDimitry Andric } else if (Mul1.Value.getNode()) {
22300b57cec5SDimitry Andric // We failed to factorize two MULs, so now the Muls are left outside the
22310b57cec5SDimitry Andric // queue... add them back.
22320b57cec5SDimitry Andric Leaves.push(Mul1);
22330b57cec5SDimitry Andric if (Mul2.Value.getNode())
22340b57cec5SDimitry Andric Leaves.push(Mul2);
22350b57cec5SDimitry Andric CanFactorize = false;
22360b57cec5SDimitry Andric }
22370b57cec5SDimitry Andric
22380b57cec5SDimitry Andric // Combine GA + Constant -> GA+Offset, but only if GA is not used elsewhere
22390b57cec5SDimitry Andric // and the root node itself is not used more than twice. This reduces the
22400b57cec5SDimitry Andric // amount of additional constant extenders introduced by this optimization.
22410b57cec5SDimitry Andric bool CombinedGA = false;
22420b57cec5SDimitry Andric if (NOpcode == ISD::ADD && GA.Value.getNode() && Leaves.hasConst() &&
22430b57cec5SDimitry Andric GA.Value.hasOneUse() && N->use_size() < 3) {
22440b57cec5SDimitry Andric GlobalAddressSDNode *GANode =
22450b57cec5SDimitry Andric cast<GlobalAddressSDNode>(GA.Value.getOperand(0));
22460b57cec5SDimitry Andric ConstantSDNode *Offset = cast<ConstantSDNode>(Leaves.top().Value);
22470b57cec5SDimitry Andric
22480b57cec5SDimitry Andric if (getUsesInFunction(GANode->getGlobal()) == 1 && Offset->hasOneUse() &&
22490b57cec5SDimitry Andric getTargetLowering()->isOffsetFoldingLegal(GANode)) {
22500b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "--> Combining GA and offset ("
22510b57cec5SDimitry Andric << Offset->getSExtValue() << "): ");
22520b57cec5SDimitry Andric LLVM_DEBUG(GANode->dump(CurDAG));
22530b57cec5SDimitry Andric
22540b57cec5SDimitry Andric SDValue NewTGA =
22550b57cec5SDimitry Andric CurDAG->getTargetGlobalAddress(GANode->getGlobal(), SDLoc(GA.Value),
22560b57cec5SDimitry Andric GANode->getValueType(0),
22570b57cec5SDimitry Andric GANode->getOffset() + (uint64_t)Offset->getSExtValue());
22580b57cec5SDimitry Andric GA.Value = CurDAG->getNode(GA.Value.getOpcode(), SDLoc(GA.Value),
22590b57cec5SDimitry Andric GA.Value.getValueType(), NewTGA);
22600b57cec5SDimitry Andric GA.Weight += Leaves.top().Weight;
22610b57cec5SDimitry Andric
22620b57cec5SDimitry Andric NodeHeights[GA.Value] = getHeight(GA.Value.getNode());
22630b57cec5SDimitry Andric CombinedGA = true;
22640b57cec5SDimitry Andric
22650b57cec5SDimitry Andric Leaves.pop(); // Remove the offset constant from the queue
22660b57cec5SDimitry Andric }
22670b57cec5SDimitry Andric }
22680b57cec5SDimitry Andric
22690b57cec5SDimitry Andric if ((RebalanceOnlyForOptimizations && !CanFactorize && !CombinedGA) ||
22700b57cec5SDimitry Andric (RebalanceOnlyImbalancedTrees && !Imbalanced)) {
22710b57cec5SDimitry Andric RootWeights[N] = CurrentWeight;
22720b57cec5SDimitry Andric RootHeights[N] = NodeHeights[SDValue(N, 0)];
22730b57cec5SDimitry Andric
22740b57cec5SDimitry Andric return SDValue(N, 0);
22750b57cec5SDimitry Andric }
22760b57cec5SDimitry Andric
22770b57cec5SDimitry Andric // Combine GA + SHL(x, C<=31) so we will match Rx=add(#u8,asl(Rx,#U5))
22780b57cec5SDimitry Andric if (NOpcode == ISD::ADD && GA.Value.getNode()) {
22790b57cec5SDimitry Andric WeightedLeaf SHL = Leaves.findSHL(31);
22800b57cec5SDimitry Andric if (SHL.Value.getNode()) {
22810b57cec5SDimitry Andric int Height = std::max(NodeHeights[GA.Value], NodeHeights[SHL.Value]) + 1;
22820b57cec5SDimitry Andric GA.Value = CurDAG->getNode(ISD::ADD, SDLoc(GA.Value),
22830b57cec5SDimitry Andric GA.Value.getValueType(),
22840b57cec5SDimitry Andric GA.Value, SHL.Value);
22850b57cec5SDimitry Andric GA.Weight = SHL.Weight; // Specifically ignore the GA weight here
22860b57cec5SDimitry Andric NodeHeights[GA.Value] = Height;
22870b57cec5SDimitry Andric }
22880b57cec5SDimitry Andric }
22890b57cec5SDimitry Andric
22900b57cec5SDimitry Andric if (GA.Value.getNode())
22910b57cec5SDimitry Andric Leaves.push(GA);
22920b57cec5SDimitry Andric
22930b57cec5SDimitry Andric // If this is the top level and we haven't factored out a shift, we should try
22940b57cec5SDimitry Andric // to move a constant to the bottom to match addressing modes like memw(rX+C)
22950b57cec5SDimitry Andric if (TopLevel && !CanFactorize && Leaves.hasConst()) {
22960b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "--> Pushing constant to tip of tree.");
22970b57cec5SDimitry Andric Leaves.pushToBottom(Leaves.pop());
22980b57cec5SDimitry Andric }
22990b57cec5SDimitry Andric
23000b57cec5SDimitry Andric const DataLayout &DL = CurDAG->getDataLayout();
23010b57cec5SDimitry Andric const TargetLowering &TLI = *getTargetLowering();
23020b57cec5SDimitry Andric
23030b57cec5SDimitry Andric // Rebuild the tree using Huffman's algorithm
23040b57cec5SDimitry Andric while (Leaves.size() > 1) {
23050b57cec5SDimitry Andric WeightedLeaf L0 = Leaves.pop();
23060b57cec5SDimitry Andric
23070b57cec5SDimitry Andric // See whether we can grab a MUL to form an add(Rx,mpyi(Ry,#u6)),
23080b57cec5SDimitry Andric // otherwise just get the next leaf
23090b57cec5SDimitry Andric WeightedLeaf L1 = Leaves.findMULbyConst();
23100b57cec5SDimitry Andric if (!L1.Value.getNode())
23110b57cec5SDimitry Andric L1 = Leaves.pop();
23120b57cec5SDimitry Andric
23130b57cec5SDimitry Andric assert(L0.Weight <= L1.Weight && "Priority queue is broken!");
23140b57cec5SDimitry Andric
23150b57cec5SDimitry Andric SDValue V0 = L0.Value;
23160b57cec5SDimitry Andric int V0Weight = L0.Weight;
23170b57cec5SDimitry Andric SDValue V1 = L1.Value;
23180b57cec5SDimitry Andric int V1Weight = L1.Weight;
23190b57cec5SDimitry Andric
23200b57cec5SDimitry Andric // Make sure that none of these nodes have been RAUW'd
23210b57cec5SDimitry Andric if ((RootWeights.count(V0.getNode()) && RootWeights[V0.getNode()] == -2) ||
23220b57cec5SDimitry Andric (RootWeights.count(V1.getNode()) && RootWeights[V1.getNode()] == -2)) {
23230b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "--> Subtree was RAUWd. Restarting...\n");
23240b57cec5SDimitry Andric return balanceSubTree(N, TopLevel);
23250b57cec5SDimitry Andric }
23260b57cec5SDimitry Andric
23270b57cec5SDimitry Andric ConstantSDNode *V0C = dyn_cast<ConstantSDNode>(V0);
23280b57cec5SDimitry Andric ConstantSDNode *V1C = dyn_cast<ConstantSDNode>(V1);
23290b57cec5SDimitry Andric EVT VT = N->getValueType(0);
23300b57cec5SDimitry Andric SDValue NewNode;
23310b57cec5SDimitry Andric
23320b57cec5SDimitry Andric if (V0C && !V1C) {
23330b57cec5SDimitry Andric std::swap(V0, V1);
23340b57cec5SDimitry Andric std::swap(V0C, V1C);
23350b57cec5SDimitry Andric }
23360b57cec5SDimitry Andric
23370b57cec5SDimitry Andric // Calculate height of this node
23380b57cec5SDimitry Andric assert(NodeHeights.count(V0) && NodeHeights.count(V1) &&
23390b57cec5SDimitry Andric "Children must have been visited before re-combining them!");
23400b57cec5SDimitry Andric int Height = std::max(NodeHeights[V0], NodeHeights[V1]) + 1;
23410b57cec5SDimitry Andric
23420b57cec5SDimitry Andric // Rebuild this node (and restore SHL from MUL if needed)
23430b57cec5SDimitry Andric if (V1C && NOpcode == ISD::MUL && V1C->getAPIntValue().isPowerOf2())
23440b57cec5SDimitry Andric NewNode = CurDAG->getNode(
23450b57cec5SDimitry Andric ISD::SHL, SDLoc(V0), VT, V0,
23460b57cec5SDimitry Andric CurDAG->getConstant(
23470b57cec5SDimitry Andric V1C->getAPIntValue().logBase2(), SDLoc(N),
23480b57cec5SDimitry Andric TLI.getScalarShiftAmountTy(DL, V0.getValueType())));
23490b57cec5SDimitry Andric else
23500b57cec5SDimitry Andric NewNode = CurDAG->getNode(NOpcode, SDLoc(N), VT, V0, V1);
23510b57cec5SDimitry Andric
23520b57cec5SDimitry Andric NodeHeights[NewNode] = Height;
23530b57cec5SDimitry Andric
23540b57cec5SDimitry Andric int Weight = V0Weight + V1Weight;
23550b57cec5SDimitry Andric Leaves.push(WeightedLeaf(NewNode, Weight, L0.InsertionOrder));
23560b57cec5SDimitry Andric
23570b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "--> Built new node (Weight=" << Weight
23580b57cec5SDimitry Andric << ",Height=" << Height << "):\n");
23590b57cec5SDimitry Andric LLVM_DEBUG(NewNode.dump());
23600b57cec5SDimitry Andric }
23610b57cec5SDimitry Andric
23620b57cec5SDimitry Andric assert(Leaves.size() == 1);
23630b57cec5SDimitry Andric SDValue NewRoot = Leaves.top().Value;
23640b57cec5SDimitry Andric
23650b57cec5SDimitry Andric assert(NodeHeights.count(NewRoot));
23660b57cec5SDimitry Andric int Height = NodeHeights[NewRoot];
23670b57cec5SDimitry Andric
23680b57cec5SDimitry Andric // Restore SHL if we earlier converted it to a MUL
23690b57cec5SDimitry Andric if (NewRoot.getOpcode() == ISD::MUL) {
23700b57cec5SDimitry Andric ConstantSDNode *V1C = dyn_cast<ConstantSDNode>(NewRoot.getOperand(1));
23710b57cec5SDimitry Andric if (V1C && V1C->getAPIntValue().isPowerOf2()) {
23720b57cec5SDimitry Andric EVT VT = NewRoot.getValueType();
23730b57cec5SDimitry Andric SDValue V0 = NewRoot.getOperand(0);
23740b57cec5SDimitry Andric NewRoot = CurDAG->getNode(
23750b57cec5SDimitry Andric ISD::SHL, SDLoc(NewRoot), VT, V0,
23760b57cec5SDimitry Andric CurDAG->getConstant(
23770b57cec5SDimitry Andric V1C->getAPIntValue().logBase2(), SDLoc(NewRoot),
23780b57cec5SDimitry Andric TLI.getScalarShiftAmountTy(DL, V0.getValueType())));
23790b57cec5SDimitry Andric }
23800b57cec5SDimitry Andric }
23810b57cec5SDimitry Andric
23820b57cec5SDimitry Andric if (N != NewRoot.getNode()) {
23830b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "--> Root is now: ");
23840b57cec5SDimitry Andric LLVM_DEBUG(NewRoot.dump());
23850b57cec5SDimitry Andric
23860b57cec5SDimitry Andric // Replace all uses of old root by new root
23870b57cec5SDimitry Andric CurDAG->ReplaceAllUsesWith(N, NewRoot.getNode());
23880b57cec5SDimitry Andric // Mark that we have RAUW'd N
23890b57cec5SDimitry Andric RootWeights[N] = -2;
23900b57cec5SDimitry Andric } else {
23910b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "--> Root unchanged.\n");
23920b57cec5SDimitry Andric }
23930b57cec5SDimitry Andric
23940b57cec5SDimitry Andric RootWeights[NewRoot.getNode()] = Leaves.top().Weight;
23950b57cec5SDimitry Andric RootHeights[NewRoot.getNode()] = Height;
23960b57cec5SDimitry Andric
23970b57cec5SDimitry Andric return NewRoot;
23980b57cec5SDimitry Andric }
23990b57cec5SDimitry Andric
rebalanceAddressTrees()24000b57cec5SDimitry Andric void HexagonDAGToDAGISel::rebalanceAddressTrees() {
2401349cc55cSDimitry Andric for (SDNode &Node : llvm::make_early_inc_range(CurDAG->allnodes())) {
2402349cc55cSDimitry Andric SDNode *N = &Node;
24030b57cec5SDimitry Andric if (N->getOpcode() != ISD::LOAD && N->getOpcode() != ISD::STORE)
24040b57cec5SDimitry Andric continue;
24050b57cec5SDimitry Andric
24060b57cec5SDimitry Andric SDValue BasePtr = cast<MemSDNode>(N)->getBasePtr();
24070b57cec5SDimitry Andric if (BasePtr.getOpcode() != ISD::ADD)
24080b57cec5SDimitry Andric continue;
24090b57cec5SDimitry Andric
24100b57cec5SDimitry Andric // We've already processed this node
24110b57cec5SDimitry Andric if (RootWeights.count(BasePtr.getNode()))
24120b57cec5SDimitry Andric continue;
24130b57cec5SDimitry Andric
24140b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "** Rebalancing address calculation in node: ");
24150b57cec5SDimitry Andric LLVM_DEBUG(N->dump(CurDAG));
24160b57cec5SDimitry Andric
24170b57cec5SDimitry Andric // FindRoots
24180b57cec5SDimitry Andric SmallVector<SDNode *, 4> Worklist;
24190b57cec5SDimitry Andric
24200b57cec5SDimitry Andric Worklist.push_back(BasePtr.getOperand(0).getNode());
24210b57cec5SDimitry Andric Worklist.push_back(BasePtr.getOperand(1).getNode());
24220b57cec5SDimitry Andric
24230b57cec5SDimitry Andric while (!Worklist.empty()) {
24240b57cec5SDimitry Andric SDNode *N = Worklist.pop_back_val();
24250b57cec5SDimitry Andric unsigned Opcode = N->getOpcode();
24260b57cec5SDimitry Andric
24270b57cec5SDimitry Andric if (!isOpcodeHandled(N))
24280b57cec5SDimitry Andric continue;
24290b57cec5SDimitry Andric
24300b57cec5SDimitry Andric Worklist.push_back(N->getOperand(0).getNode());
24310b57cec5SDimitry Andric Worklist.push_back(N->getOperand(1).getNode());
24320b57cec5SDimitry Andric
24330b57cec5SDimitry Andric // Not a root if it has only one use and same opcode as its parent
24340b57cec5SDimitry Andric if (N->hasOneUse() && Opcode == N->use_begin()->getOpcode())
24350b57cec5SDimitry Andric continue;
24360b57cec5SDimitry Andric
24370b57cec5SDimitry Andric // This root node has already been processed
24380b57cec5SDimitry Andric if (RootWeights.count(N))
24390b57cec5SDimitry Andric continue;
24400b57cec5SDimitry Andric
24410b57cec5SDimitry Andric RootWeights[N] = -1;
24420b57cec5SDimitry Andric }
24430b57cec5SDimitry Andric
24440b57cec5SDimitry Andric // Balance node itself
24450b57cec5SDimitry Andric RootWeights[BasePtr.getNode()] = -1;
24460b57cec5SDimitry Andric SDValue NewBasePtr = balanceSubTree(BasePtr.getNode(), /*TopLevel=*/ true);
24470b57cec5SDimitry Andric
24480b57cec5SDimitry Andric if (N->getOpcode() == ISD::LOAD)
24490b57cec5SDimitry Andric N = CurDAG->UpdateNodeOperands(N, N->getOperand(0),
24500b57cec5SDimitry Andric NewBasePtr, N->getOperand(2));
24510b57cec5SDimitry Andric else
24520b57cec5SDimitry Andric N = CurDAG->UpdateNodeOperands(N, N->getOperand(0), N->getOperand(1),
24530b57cec5SDimitry Andric NewBasePtr, N->getOperand(3));
24540b57cec5SDimitry Andric
24550b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "--> Final node: ");
24560b57cec5SDimitry Andric LLVM_DEBUG(N->dump(CurDAG));
24570b57cec5SDimitry Andric }
24580b57cec5SDimitry Andric
24590b57cec5SDimitry Andric CurDAG->RemoveDeadNodes();
24600b57cec5SDimitry Andric GAUsesInFunction.clear();
24610b57cec5SDimitry Andric RootHeights.clear();
24620b57cec5SDimitry Andric RootWeights.clear();
24630b57cec5SDimitry Andric }
2464