xref: /freebsd/contrib/llvm-project/llvm/lib/Target/X86/X86ISelLowering.h (revision 5ffd83dbcc34f10e07f6d3e968ae6365869615f4)
10b57cec5SDimitry Andric //===-- X86ISelLowering.h - X86 DAG Lowering Interface ----------*- C++ -*-===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric //
90b57cec5SDimitry Andric // This file defines the interfaces that X86 uses to lower LLVM code into a
100b57cec5SDimitry Andric // selection DAG.
110b57cec5SDimitry Andric //
120b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
130b57cec5SDimitry Andric 
140b57cec5SDimitry Andric #ifndef LLVM_LIB_TARGET_X86_X86ISELLOWERING_H
150b57cec5SDimitry Andric #define LLVM_LIB_TARGET_X86_X86ISELLOWERING_H
160b57cec5SDimitry Andric 
170b57cec5SDimitry Andric #include "llvm/CodeGen/TargetLowering.h"
180b57cec5SDimitry Andric 
190b57cec5SDimitry Andric namespace llvm {
200b57cec5SDimitry Andric   class X86Subtarget;
210b57cec5SDimitry Andric   class X86TargetMachine;
220b57cec5SDimitry Andric 
230b57cec5SDimitry Andric   namespace X86ISD {
240b57cec5SDimitry Andric     // X86 Specific DAG Nodes
250b57cec5SDimitry Andric   enum NodeType : unsigned {
260b57cec5SDimitry Andric     // Start the numbering where the builtin ops leave off.
270b57cec5SDimitry Andric     FIRST_NUMBER = ISD::BUILTIN_OP_END,
280b57cec5SDimitry Andric 
290b57cec5SDimitry Andric     /// Bit scan forward.
300b57cec5SDimitry Andric     BSF,
310b57cec5SDimitry Andric     /// Bit scan reverse.
320b57cec5SDimitry Andric     BSR,
330b57cec5SDimitry Andric 
34*5ffd83dbSDimitry Andric     /// X86 funnel/double shift i16 instructions. These correspond to
35*5ffd83dbSDimitry Andric     /// X86::SHLDW and X86::SHRDW instructions which have different amt
36*5ffd83dbSDimitry Andric     /// modulo rules to generic funnel shifts.
37*5ffd83dbSDimitry Andric     /// NOTE: The operand order matches ISD::FSHL/FSHR not SHLD/SHRD.
38*5ffd83dbSDimitry Andric     FSHL,
39*5ffd83dbSDimitry Andric     FSHR,
400b57cec5SDimitry Andric 
410b57cec5SDimitry Andric     /// Bitwise logical AND of floating point values. This corresponds
420b57cec5SDimitry Andric     /// to X86::ANDPS or X86::ANDPD.
430b57cec5SDimitry Andric     FAND,
440b57cec5SDimitry Andric 
450b57cec5SDimitry Andric     /// Bitwise logical OR of floating point values. This corresponds
460b57cec5SDimitry Andric     /// to X86::ORPS or X86::ORPD.
470b57cec5SDimitry Andric     FOR,
480b57cec5SDimitry Andric 
490b57cec5SDimitry Andric     /// Bitwise logical XOR of floating point values. This corresponds
500b57cec5SDimitry Andric     /// to X86::XORPS or X86::XORPD.
510b57cec5SDimitry Andric     FXOR,
520b57cec5SDimitry Andric 
530b57cec5SDimitry Andric     ///  Bitwise logical ANDNOT of floating point values. This
540b57cec5SDimitry Andric     /// corresponds to X86::ANDNPS or X86::ANDNPD.
550b57cec5SDimitry Andric     FANDN,
560b57cec5SDimitry Andric 
570b57cec5SDimitry Andric     /// These operations represent an abstract X86 call
580b57cec5SDimitry Andric     /// instruction, which includes a bunch of information.  In particular the
590b57cec5SDimitry Andric     /// operands of these node are:
600b57cec5SDimitry Andric     ///
610b57cec5SDimitry Andric     ///     #0 - The incoming token chain
620b57cec5SDimitry Andric     ///     #1 - The callee
630b57cec5SDimitry Andric     ///     #2 - The number of arg bytes the caller pushes on the stack.
640b57cec5SDimitry Andric     ///     #3 - The number of arg bytes the callee pops off the stack.
650b57cec5SDimitry Andric     ///     #4 - The value to pass in AL/AX/EAX (optional)
660b57cec5SDimitry Andric     ///     #5 - The value to pass in DL/DX/EDX (optional)
670b57cec5SDimitry Andric     ///
680b57cec5SDimitry Andric     /// The result values of these nodes are:
690b57cec5SDimitry Andric     ///
700b57cec5SDimitry Andric     ///     #0 - The outgoing token chain
710b57cec5SDimitry Andric     ///     #1 - The first register result value (optional)
720b57cec5SDimitry Andric     ///     #2 - The second register result value (optional)
730b57cec5SDimitry Andric     ///
740b57cec5SDimitry Andric     CALL,
750b57cec5SDimitry Andric 
760b57cec5SDimitry Andric     /// Same as call except it adds the NoTrack prefix.
770b57cec5SDimitry Andric     NT_CALL,
780b57cec5SDimitry Andric 
790b57cec5SDimitry Andric     /// X86 compare and logical compare instructions.
80*5ffd83dbSDimitry Andric     CMP,
81*5ffd83dbSDimitry Andric     FCMP,
82*5ffd83dbSDimitry Andric     COMI,
83*5ffd83dbSDimitry Andric     UCOMI,
840b57cec5SDimitry Andric 
850b57cec5SDimitry Andric     /// X86 bit-test instructions.
860b57cec5SDimitry Andric     BT,
870b57cec5SDimitry Andric 
880b57cec5SDimitry Andric     /// X86 SetCC. Operand 0 is condition code, and operand 1 is the EFLAGS
890b57cec5SDimitry Andric     /// operand, usually produced by a CMP instruction.
900b57cec5SDimitry Andric     SETCC,
910b57cec5SDimitry Andric 
920b57cec5SDimitry Andric     /// X86 Select
930b57cec5SDimitry Andric     SELECTS,
940b57cec5SDimitry Andric 
950b57cec5SDimitry Andric     // Same as SETCC except it's materialized with a sbb and the value is all
960b57cec5SDimitry Andric     // one's or all zero's.
970b57cec5SDimitry Andric     SETCC_CARRY, // R = carry_bit ? ~0 : 0
980b57cec5SDimitry Andric 
990b57cec5SDimitry Andric     /// X86 FP SETCC, implemented with CMP{cc}SS/CMP{cc}SD.
1000b57cec5SDimitry Andric     /// Operands are two FP values to compare; result is a mask of
1010b57cec5SDimitry Andric     /// 0s or 1s.  Generally DTRT for C/C++ with NaNs.
1020b57cec5SDimitry Andric     FSETCC,
1030b57cec5SDimitry Andric 
1040b57cec5SDimitry Andric     /// X86 FP SETCC, similar to above, but with output as an i1 mask and
1050b57cec5SDimitry Andric     /// and a version with SAE.
106*5ffd83dbSDimitry Andric     FSETCCM,
107*5ffd83dbSDimitry Andric     FSETCCM_SAE,
1080b57cec5SDimitry Andric 
1090b57cec5SDimitry Andric     /// X86 conditional moves. Operand 0 and operand 1 are the two values
1100b57cec5SDimitry Andric     /// to select from. Operand 2 is the condition code, and operand 3 is the
1110b57cec5SDimitry Andric     /// flag operand produced by a CMP or TEST instruction.
1120b57cec5SDimitry Andric     CMOV,
1130b57cec5SDimitry Andric 
1140b57cec5SDimitry Andric     /// X86 conditional branches. Operand 0 is the chain operand, operand 1
1150b57cec5SDimitry Andric     /// is the block to branch if condition is true, operand 2 is the
1160b57cec5SDimitry Andric     /// condition code, and operand 3 is the flag operand produced by a CMP
1170b57cec5SDimitry Andric     /// or TEST instruction.
1180b57cec5SDimitry Andric     BRCOND,
1190b57cec5SDimitry Andric 
1200b57cec5SDimitry Andric     /// BRIND node with NoTrack prefix. Operand 0 is the chain operand and
1210b57cec5SDimitry Andric     /// operand 1 is the target address.
1220b57cec5SDimitry Andric     NT_BRIND,
1230b57cec5SDimitry Andric 
1240b57cec5SDimitry Andric     /// Return with a flag operand. Operand 0 is the chain operand, operand
1250b57cec5SDimitry Andric     /// 1 is the number of bytes of stack to pop.
1260b57cec5SDimitry Andric     RET_FLAG,
1270b57cec5SDimitry Andric 
1280b57cec5SDimitry Andric     /// Return from interrupt. Operand 0 is the number of bytes to pop.
1290b57cec5SDimitry Andric     IRET,
1300b57cec5SDimitry Andric 
1310b57cec5SDimitry Andric     /// Repeat fill, corresponds to X86::REP_STOSx.
1320b57cec5SDimitry Andric     REP_STOS,
1330b57cec5SDimitry Andric 
1340b57cec5SDimitry Andric     /// Repeat move, corresponds to X86::REP_MOVSx.
1350b57cec5SDimitry Andric     REP_MOVS,
1360b57cec5SDimitry Andric 
1370b57cec5SDimitry Andric     /// On Darwin, this node represents the result of the popl
1380b57cec5SDimitry Andric     /// at function entry, used for PIC code.
1390b57cec5SDimitry Andric     GlobalBaseReg,
1400b57cec5SDimitry Andric 
1410b57cec5SDimitry Andric     /// A wrapper node for TargetConstantPool, TargetJumpTable,
1420b57cec5SDimitry Andric     /// TargetExternalSymbol, TargetGlobalAddress, TargetGlobalTLSAddress,
1430b57cec5SDimitry Andric     /// MCSymbol and TargetBlockAddress.
1440b57cec5SDimitry Andric     Wrapper,
1450b57cec5SDimitry Andric 
1460b57cec5SDimitry Andric     /// Special wrapper used under X86-64 PIC mode for RIP
1470b57cec5SDimitry Andric     /// relative displacements.
1480b57cec5SDimitry Andric     WrapperRIP,
1490b57cec5SDimitry Andric 
1508bcb0991SDimitry Andric     /// Copies a 64-bit value from an MMX vector to the low word
1518bcb0991SDimitry Andric     /// of an XMM vector, with the high word zero filled.
1528bcb0991SDimitry Andric     MOVQ2DQ,
1538bcb0991SDimitry Andric 
1540b57cec5SDimitry Andric     /// Copies a 64-bit value from the low word of an XMM vector
1550b57cec5SDimitry Andric     /// to an MMX vector.
1560b57cec5SDimitry Andric     MOVDQ2Q,
1570b57cec5SDimitry Andric 
1580b57cec5SDimitry Andric     /// Copies a 32-bit value from the low word of a MMX
1590b57cec5SDimitry Andric     /// vector to a GPR.
1600b57cec5SDimitry Andric     MMX_MOVD2W,
1610b57cec5SDimitry Andric 
1620b57cec5SDimitry Andric     /// Copies a GPR into the low 32-bit word of a MMX vector
1630b57cec5SDimitry Andric     /// and zero out the high word.
1640b57cec5SDimitry Andric     MMX_MOVW2D,
1650b57cec5SDimitry Andric 
1660b57cec5SDimitry Andric     /// Extract an 8-bit value from a vector and zero extend it to
1670b57cec5SDimitry Andric     /// i32, corresponds to X86::PEXTRB.
1680b57cec5SDimitry Andric     PEXTRB,
1690b57cec5SDimitry Andric 
1700b57cec5SDimitry Andric     /// Extract a 16-bit value from a vector and zero extend it to
1710b57cec5SDimitry Andric     /// i32, corresponds to X86::PEXTRW.
1720b57cec5SDimitry Andric     PEXTRW,
1730b57cec5SDimitry Andric 
1740b57cec5SDimitry Andric     /// Insert any element of a 4 x float vector into any element
1750b57cec5SDimitry Andric     /// of a destination 4 x floatvector.
1760b57cec5SDimitry Andric     INSERTPS,
1770b57cec5SDimitry Andric 
1780b57cec5SDimitry Andric     /// Insert the lower 8-bits of a 32-bit value to a vector,
1790b57cec5SDimitry Andric     /// corresponds to X86::PINSRB.
1800b57cec5SDimitry Andric     PINSRB,
1810b57cec5SDimitry Andric 
1820b57cec5SDimitry Andric     /// Insert the lower 16-bits of a 32-bit value to a vector,
1830b57cec5SDimitry Andric     /// corresponds to X86::PINSRW.
1840b57cec5SDimitry Andric     PINSRW,
1850b57cec5SDimitry Andric 
1860b57cec5SDimitry Andric     /// Shuffle 16 8-bit values within a vector.
1870b57cec5SDimitry Andric     PSHUFB,
1880b57cec5SDimitry Andric 
1890b57cec5SDimitry Andric     /// Compute Sum of Absolute Differences.
1900b57cec5SDimitry Andric     PSADBW,
1910b57cec5SDimitry Andric     /// Compute Double Block Packed Sum-Absolute-Differences
1920b57cec5SDimitry Andric     DBPSADBW,
1930b57cec5SDimitry Andric 
1940b57cec5SDimitry Andric     /// Bitwise Logical AND NOT of Packed FP values.
1950b57cec5SDimitry Andric     ANDNP,
1960b57cec5SDimitry Andric 
1970b57cec5SDimitry Andric     /// Blend where the selector is an immediate.
1980b57cec5SDimitry Andric     BLENDI,
1990b57cec5SDimitry Andric 
2000b57cec5SDimitry Andric     /// Dynamic (non-constant condition) vector blend where only the sign bits
2010b57cec5SDimitry Andric     /// of the condition elements are used. This is used to enforce that the
2020b57cec5SDimitry Andric     /// condition mask is not valid for generic VSELECT optimizations. This
2030b57cec5SDimitry Andric     /// is also used to implement the intrinsics.
2040b57cec5SDimitry Andric     /// Operands are in VSELECT order: MASK, TRUE, FALSE
2050b57cec5SDimitry Andric     BLENDV,
2060b57cec5SDimitry Andric 
2070b57cec5SDimitry Andric     /// Combined add and sub on an FP vector.
2080b57cec5SDimitry Andric     ADDSUB,
2090b57cec5SDimitry Andric 
2100b57cec5SDimitry Andric     //  FP vector ops with rounding mode.
211*5ffd83dbSDimitry Andric     FADD_RND,
212*5ffd83dbSDimitry Andric     FADDS,
213*5ffd83dbSDimitry Andric     FADDS_RND,
214*5ffd83dbSDimitry Andric     FSUB_RND,
215*5ffd83dbSDimitry Andric     FSUBS,
216*5ffd83dbSDimitry Andric     FSUBS_RND,
217*5ffd83dbSDimitry Andric     FMUL_RND,
218*5ffd83dbSDimitry Andric     FMULS,
219*5ffd83dbSDimitry Andric     FMULS_RND,
220*5ffd83dbSDimitry Andric     FDIV_RND,
221*5ffd83dbSDimitry Andric     FDIVS,
222*5ffd83dbSDimitry Andric     FDIVS_RND,
223*5ffd83dbSDimitry Andric     FMAX_SAE,
224*5ffd83dbSDimitry Andric     FMAXS_SAE,
225*5ffd83dbSDimitry Andric     FMIN_SAE,
226*5ffd83dbSDimitry Andric     FMINS_SAE,
227*5ffd83dbSDimitry Andric     FSQRT_RND,
228*5ffd83dbSDimitry Andric     FSQRTS,
229*5ffd83dbSDimitry Andric     FSQRTS_RND,
2300b57cec5SDimitry Andric 
2310b57cec5SDimitry Andric     // FP vector get exponent.
232*5ffd83dbSDimitry Andric     FGETEXP,
233*5ffd83dbSDimitry Andric     FGETEXP_SAE,
234*5ffd83dbSDimitry Andric     FGETEXPS,
235*5ffd83dbSDimitry Andric     FGETEXPS_SAE,
2360b57cec5SDimitry Andric     // Extract Normalized Mantissas.
237*5ffd83dbSDimitry Andric     VGETMANT,
238*5ffd83dbSDimitry Andric     VGETMANT_SAE,
239*5ffd83dbSDimitry Andric     VGETMANTS,
240*5ffd83dbSDimitry Andric     VGETMANTS_SAE,
2410b57cec5SDimitry Andric     // FP Scale.
242*5ffd83dbSDimitry Andric     SCALEF,
243*5ffd83dbSDimitry Andric     SCALEF_RND,
244*5ffd83dbSDimitry Andric     SCALEFS,
245*5ffd83dbSDimitry Andric     SCALEFS_RND,
2460b57cec5SDimitry Andric 
2470b57cec5SDimitry Andric     // Unsigned Integer average.
2480b57cec5SDimitry Andric     AVG,
2490b57cec5SDimitry Andric 
2500b57cec5SDimitry Andric     /// Integer horizontal add/sub.
2510b57cec5SDimitry Andric     HADD,
2520b57cec5SDimitry Andric     HSUB,
2530b57cec5SDimitry Andric 
2540b57cec5SDimitry Andric     /// Floating point horizontal add/sub.
2550b57cec5SDimitry Andric     FHADD,
2560b57cec5SDimitry Andric     FHSUB,
2570b57cec5SDimitry Andric 
2580b57cec5SDimitry Andric     // Detect Conflicts Within a Vector
2590b57cec5SDimitry Andric     CONFLICT,
2600b57cec5SDimitry Andric 
2610b57cec5SDimitry Andric     /// Floating point max and min.
262*5ffd83dbSDimitry Andric     FMAX,
263*5ffd83dbSDimitry Andric     FMIN,
2640b57cec5SDimitry Andric 
2650b57cec5SDimitry Andric     /// Commutative FMIN and FMAX.
266*5ffd83dbSDimitry Andric     FMAXC,
267*5ffd83dbSDimitry Andric     FMINC,
2680b57cec5SDimitry Andric 
2690b57cec5SDimitry Andric     /// Scalar intrinsic floating point max and min.
270*5ffd83dbSDimitry Andric     FMAXS,
271*5ffd83dbSDimitry Andric     FMINS,
2720b57cec5SDimitry Andric 
2730b57cec5SDimitry Andric     /// Floating point reciprocal-sqrt and reciprocal approximation.
2740b57cec5SDimitry Andric     /// Note that these typically require refinement
2750b57cec5SDimitry Andric     /// in order to obtain suitable precision.
276*5ffd83dbSDimitry Andric     FRSQRT,
277*5ffd83dbSDimitry Andric     FRCP,
2780b57cec5SDimitry Andric 
2790b57cec5SDimitry Andric     // AVX-512 reciprocal approximations with a little more precision.
280*5ffd83dbSDimitry Andric     RSQRT14,
281*5ffd83dbSDimitry Andric     RSQRT14S,
282*5ffd83dbSDimitry Andric     RCP14,
283*5ffd83dbSDimitry Andric     RCP14S,
2840b57cec5SDimitry Andric 
2850b57cec5SDimitry Andric     // Thread Local Storage.
2860b57cec5SDimitry Andric     TLSADDR,
2870b57cec5SDimitry Andric 
2880b57cec5SDimitry Andric     // Thread Local Storage. A call to get the start address
2890b57cec5SDimitry Andric     // of the TLS block for the current module.
2900b57cec5SDimitry Andric     TLSBASEADDR,
2910b57cec5SDimitry Andric 
2920b57cec5SDimitry Andric     // Thread Local Storage.  When calling to an OS provided
2930b57cec5SDimitry Andric     // thunk at the address from an earlier relocation.
2940b57cec5SDimitry Andric     TLSCALL,
2950b57cec5SDimitry Andric 
2960b57cec5SDimitry Andric     // Exception Handling helpers.
2970b57cec5SDimitry Andric     EH_RETURN,
2980b57cec5SDimitry Andric 
2990b57cec5SDimitry Andric     // SjLj exception handling setjmp.
3000b57cec5SDimitry Andric     EH_SJLJ_SETJMP,
3010b57cec5SDimitry Andric 
3020b57cec5SDimitry Andric     // SjLj exception handling longjmp.
3030b57cec5SDimitry Andric     EH_SJLJ_LONGJMP,
3040b57cec5SDimitry Andric 
3050b57cec5SDimitry Andric     // SjLj exception handling dispatch.
3060b57cec5SDimitry Andric     EH_SJLJ_SETUP_DISPATCH,
3070b57cec5SDimitry Andric 
3080b57cec5SDimitry Andric     /// Tail call return. See X86TargetLowering::LowerCall for
3090b57cec5SDimitry Andric     /// the list of operands.
3100b57cec5SDimitry Andric     TC_RETURN,
3110b57cec5SDimitry Andric 
3120b57cec5SDimitry Andric     // Vector move to low scalar and zero higher vector elements.
3130b57cec5SDimitry Andric     VZEXT_MOVL,
3140b57cec5SDimitry Andric 
3150b57cec5SDimitry Andric     // Vector integer truncate.
3160b57cec5SDimitry Andric     VTRUNC,
3170b57cec5SDimitry Andric     // Vector integer truncate with unsigned/signed saturation.
318*5ffd83dbSDimitry Andric     VTRUNCUS,
319*5ffd83dbSDimitry Andric     VTRUNCS,
3200b57cec5SDimitry Andric 
3210b57cec5SDimitry Andric     // Masked version of the above. Used when less than a 128-bit result is
3220b57cec5SDimitry Andric     // produced since the mask only applies to the lower elements and can't
3230b57cec5SDimitry Andric     // be represented by a select.
3240b57cec5SDimitry Andric     // SRC, PASSTHRU, MASK
325*5ffd83dbSDimitry Andric     VMTRUNC,
326*5ffd83dbSDimitry Andric     VMTRUNCUS,
327*5ffd83dbSDimitry Andric     VMTRUNCS,
3280b57cec5SDimitry Andric 
3290b57cec5SDimitry Andric     // Vector FP extend.
330*5ffd83dbSDimitry Andric     VFPEXT,
331*5ffd83dbSDimitry Andric     VFPEXT_SAE,
332*5ffd83dbSDimitry Andric     VFPEXTS,
333*5ffd83dbSDimitry Andric     VFPEXTS_SAE,
3340b57cec5SDimitry Andric 
3350b57cec5SDimitry Andric     // Vector FP round.
336*5ffd83dbSDimitry Andric     VFPROUND,
337*5ffd83dbSDimitry Andric     VFPROUND_RND,
338*5ffd83dbSDimitry Andric     VFPROUNDS,
339*5ffd83dbSDimitry Andric     VFPROUNDS_RND,
3400b57cec5SDimitry Andric 
3410b57cec5SDimitry Andric     // Masked version of above. Used for v2f64->v4f32.
3420b57cec5SDimitry Andric     // SRC, PASSTHRU, MASK
3430b57cec5SDimitry Andric     VMFPROUND,
3440b57cec5SDimitry Andric 
3450b57cec5SDimitry Andric     // 128-bit vector logical left / right shift
346*5ffd83dbSDimitry Andric     VSHLDQ,
347*5ffd83dbSDimitry Andric     VSRLDQ,
3480b57cec5SDimitry Andric 
3490b57cec5SDimitry Andric     // Vector shift elements
350*5ffd83dbSDimitry Andric     VSHL,
351*5ffd83dbSDimitry Andric     VSRL,
352*5ffd83dbSDimitry Andric     VSRA,
3530b57cec5SDimitry Andric 
3540b57cec5SDimitry Andric     // Vector variable shift
355*5ffd83dbSDimitry Andric     VSHLV,
356*5ffd83dbSDimitry Andric     VSRLV,
357*5ffd83dbSDimitry Andric     VSRAV,
3580b57cec5SDimitry Andric 
3590b57cec5SDimitry Andric     // Vector shift elements by immediate
360*5ffd83dbSDimitry Andric     VSHLI,
361*5ffd83dbSDimitry Andric     VSRLI,
362*5ffd83dbSDimitry Andric     VSRAI,
3630b57cec5SDimitry Andric 
3640b57cec5SDimitry Andric     // Shifts of mask registers.
365*5ffd83dbSDimitry Andric     KSHIFTL,
366*5ffd83dbSDimitry Andric     KSHIFTR,
3670b57cec5SDimitry Andric 
3680b57cec5SDimitry Andric     // Bit rotate by immediate
369*5ffd83dbSDimitry Andric     VROTLI,
370*5ffd83dbSDimitry Andric     VROTRI,
3710b57cec5SDimitry Andric 
3720b57cec5SDimitry Andric     // Vector packed double/float comparison.
3730b57cec5SDimitry Andric     CMPP,
3740b57cec5SDimitry Andric 
3750b57cec5SDimitry Andric     // Vector integer comparisons.
376*5ffd83dbSDimitry Andric     PCMPEQ,
377*5ffd83dbSDimitry Andric     PCMPGT,
3780b57cec5SDimitry Andric 
3790b57cec5SDimitry Andric     // v8i16 Horizontal minimum and position.
3800b57cec5SDimitry Andric     PHMINPOS,
3810b57cec5SDimitry Andric 
3820b57cec5SDimitry Andric     MULTISHIFT,
3830b57cec5SDimitry Andric 
3840b57cec5SDimitry Andric     /// Vector comparison generating mask bits for fp and
3850b57cec5SDimitry Andric     /// integer signed and unsigned data types.
3860b57cec5SDimitry Andric     CMPM,
3870b57cec5SDimitry Andric     // Vector comparison with SAE for FP values
3880b57cec5SDimitry Andric     CMPM_SAE,
3890b57cec5SDimitry Andric 
3900b57cec5SDimitry Andric     // Arithmetic operations with FLAGS results.
391*5ffd83dbSDimitry Andric     ADD,
392*5ffd83dbSDimitry Andric     SUB,
393*5ffd83dbSDimitry Andric     ADC,
394*5ffd83dbSDimitry Andric     SBB,
395*5ffd83dbSDimitry Andric     SMUL,
396*5ffd83dbSDimitry Andric     UMUL,
397*5ffd83dbSDimitry Andric     OR,
398*5ffd83dbSDimitry Andric     XOR,
399*5ffd83dbSDimitry Andric     AND,
4000b57cec5SDimitry Andric 
4010b57cec5SDimitry Andric     // Bit field extract.
4020b57cec5SDimitry Andric     BEXTR,
4030b57cec5SDimitry Andric 
4040b57cec5SDimitry Andric     // Zero High Bits Starting with Specified Bit Position.
4050b57cec5SDimitry Andric     BZHI,
4060b57cec5SDimitry Andric 
407*5ffd83dbSDimitry Andric     // Parallel extract and deposit.
408*5ffd83dbSDimitry Andric     PDEP,
409*5ffd83dbSDimitry Andric     PEXT,
410*5ffd83dbSDimitry Andric 
4110b57cec5SDimitry Andric     // X86-specific multiply by immediate.
4120b57cec5SDimitry Andric     MUL_IMM,
4130b57cec5SDimitry Andric 
4140b57cec5SDimitry Andric     // Vector sign bit extraction.
4150b57cec5SDimitry Andric     MOVMSK,
4160b57cec5SDimitry Andric 
4170b57cec5SDimitry Andric     // Vector bitwise comparisons.
4180b57cec5SDimitry Andric     PTEST,
4190b57cec5SDimitry Andric 
4200b57cec5SDimitry Andric     // Vector packed fp sign bitwise comparisons.
4210b57cec5SDimitry Andric     TESTP,
4220b57cec5SDimitry Andric 
4230b57cec5SDimitry Andric     // OR/AND test for masks.
4240b57cec5SDimitry Andric     KORTEST,
4250b57cec5SDimitry Andric     KTEST,
4260b57cec5SDimitry Andric 
4270b57cec5SDimitry Andric     // ADD for masks.
4280b57cec5SDimitry Andric     KADD,
4290b57cec5SDimitry Andric 
4300b57cec5SDimitry Andric     // Several flavors of instructions with vector shuffle behaviors.
4310b57cec5SDimitry Andric     // Saturated signed/unnsigned packing.
4320b57cec5SDimitry Andric     PACKSS,
4330b57cec5SDimitry Andric     PACKUS,
4340b57cec5SDimitry Andric     // Intra-lane alignr.
4350b57cec5SDimitry Andric     PALIGNR,
4360b57cec5SDimitry Andric     // AVX512 inter-lane alignr.
4370b57cec5SDimitry Andric     VALIGN,
4380b57cec5SDimitry Andric     PSHUFD,
4390b57cec5SDimitry Andric     PSHUFHW,
4400b57cec5SDimitry Andric     PSHUFLW,
4410b57cec5SDimitry Andric     SHUFP,
4420b57cec5SDimitry Andric     // VBMI2 Concat & Shift.
4430b57cec5SDimitry Andric     VSHLD,
4440b57cec5SDimitry Andric     VSHRD,
4450b57cec5SDimitry Andric     VSHLDV,
4460b57cec5SDimitry Andric     VSHRDV,
4470b57cec5SDimitry Andric     // Shuffle Packed Values at 128-bit granularity.
4480b57cec5SDimitry Andric     SHUF128,
4490b57cec5SDimitry Andric     MOVDDUP,
4500b57cec5SDimitry Andric     MOVSHDUP,
4510b57cec5SDimitry Andric     MOVSLDUP,
4520b57cec5SDimitry Andric     MOVLHPS,
4530b57cec5SDimitry Andric     MOVHLPS,
4540b57cec5SDimitry Andric     MOVSD,
4550b57cec5SDimitry Andric     MOVSS,
4560b57cec5SDimitry Andric     UNPCKL,
4570b57cec5SDimitry Andric     UNPCKH,
4580b57cec5SDimitry Andric     VPERMILPV,
4590b57cec5SDimitry Andric     VPERMILPI,
4600b57cec5SDimitry Andric     VPERMI,
4610b57cec5SDimitry Andric     VPERM2X128,
4620b57cec5SDimitry Andric 
4630b57cec5SDimitry Andric     // Variable Permute (VPERM).
4640b57cec5SDimitry Andric     // Res = VPERMV MaskV, V0
4650b57cec5SDimitry Andric     VPERMV,
4660b57cec5SDimitry Andric 
4670b57cec5SDimitry Andric     // 3-op Variable Permute (VPERMT2).
4680b57cec5SDimitry Andric     // Res = VPERMV3 V0, MaskV, V1
4690b57cec5SDimitry Andric     VPERMV3,
4700b57cec5SDimitry Andric 
4710b57cec5SDimitry Andric     // Bitwise ternary logic.
4720b57cec5SDimitry Andric     VPTERNLOG,
4730b57cec5SDimitry Andric     // Fix Up Special Packed Float32/64 values.
474*5ffd83dbSDimitry Andric     VFIXUPIMM,
475*5ffd83dbSDimitry Andric     VFIXUPIMM_SAE,
476*5ffd83dbSDimitry Andric     VFIXUPIMMS,
477*5ffd83dbSDimitry Andric     VFIXUPIMMS_SAE,
4780b57cec5SDimitry Andric     // Range Restriction Calculation For Packed Pairs of Float32/64 values.
479*5ffd83dbSDimitry Andric     VRANGE,
480*5ffd83dbSDimitry Andric     VRANGE_SAE,
481*5ffd83dbSDimitry Andric     VRANGES,
482*5ffd83dbSDimitry Andric     VRANGES_SAE,
4830b57cec5SDimitry Andric     // Reduce - Perform Reduction Transformation on scalar\packed FP.
484*5ffd83dbSDimitry Andric     VREDUCE,
485*5ffd83dbSDimitry Andric     VREDUCE_SAE,
486*5ffd83dbSDimitry Andric     VREDUCES,
487*5ffd83dbSDimitry Andric     VREDUCES_SAE,
4880b57cec5SDimitry Andric     // RndScale - Round FP Values To Include A Given Number Of Fraction Bits.
4890b57cec5SDimitry Andric     // Also used by the legacy (V)ROUND intrinsics where we mask out the
4900b57cec5SDimitry Andric     // scaling part of the immediate.
491*5ffd83dbSDimitry Andric     VRNDSCALE,
492*5ffd83dbSDimitry Andric     VRNDSCALE_SAE,
493*5ffd83dbSDimitry Andric     VRNDSCALES,
494*5ffd83dbSDimitry Andric     VRNDSCALES_SAE,
4950b57cec5SDimitry Andric     // Tests Types Of a FP Values for packed types.
4960b57cec5SDimitry Andric     VFPCLASS,
4970b57cec5SDimitry Andric     // Tests Types Of a FP Values for scalar types.
4980b57cec5SDimitry Andric     VFPCLASSS,
4990b57cec5SDimitry Andric 
5000b57cec5SDimitry Andric     // Broadcast (splat) scalar or element 0 of a vector. If the operand is
5010b57cec5SDimitry Andric     // a vector, this node may change the vector length as part of the splat.
5020b57cec5SDimitry Andric     VBROADCAST,
5030b57cec5SDimitry Andric     // Broadcast mask to vector.
5040b57cec5SDimitry Andric     VBROADCASTM,
5050b57cec5SDimitry Andric     // Broadcast subvector to vector.
5060b57cec5SDimitry Andric     SUBV_BROADCAST,
5070b57cec5SDimitry Andric 
5080b57cec5SDimitry Andric     /// SSE4A Extraction and Insertion.
509*5ffd83dbSDimitry Andric     EXTRQI,
510*5ffd83dbSDimitry Andric     INSERTQI,
5110b57cec5SDimitry Andric 
5120b57cec5SDimitry Andric     // XOP arithmetic/logical shifts.
513*5ffd83dbSDimitry Andric     VPSHA,
514*5ffd83dbSDimitry Andric     VPSHL,
5150b57cec5SDimitry Andric     // XOP signed/unsigned integer comparisons.
516*5ffd83dbSDimitry Andric     VPCOM,
517*5ffd83dbSDimitry Andric     VPCOMU,
5180b57cec5SDimitry Andric     // XOP packed permute bytes.
5190b57cec5SDimitry Andric     VPPERM,
5200b57cec5SDimitry Andric     // XOP two source permutation.
5210b57cec5SDimitry Andric     VPERMIL2,
5220b57cec5SDimitry Andric 
5230b57cec5SDimitry Andric     // Vector multiply packed unsigned doubleword integers.
5240b57cec5SDimitry Andric     PMULUDQ,
5250b57cec5SDimitry Andric     // Vector multiply packed signed doubleword integers.
5260b57cec5SDimitry Andric     PMULDQ,
5270b57cec5SDimitry Andric     // Vector Multiply Packed UnsignedIntegers with Round and Scale.
5280b57cec5SDimitry Andric     MULHRS,
5290b57cec5SDimitry Andric 
5300b57cec5SDimitry Andric     // Multiply and Add Packed Integers.
531*5ffd83dbSDimitry Andric     VPMADDUBSW,
532*5ffd83dbSDimitry Andric     VPMADDWD,
5330b57cec5SDimitry Andric 
5340b57cec5SDimitry Andric     // AVX512IFMA multiply and add.
5350b57cec5SDimitry Andric     // NOTE: These are different than the instruction and perform
5360b57cec5SDimitry Andric     // op0 x op1 + op2.
537*5ffd83dbSDimitry Andric     VPMADD52L,
538*5ffd83dbSDimitry Andric     VPMADD52H,
5390b57cec5SDimitry Andric 
5400b57cec5SDimitry Andric     // VNNI
5410b57cec5SDimitry Andric     VPDPBUSD,
5420b57cec5SDimitry Andric     VPDPBUSDS,
5430b57cec5SDimitry Andric     VPDPWSSD,
5440b57cec5SDimitry Andric     VPDPWSSDS,
5450b57cec5SDimitry Andric 
5460b57cec5SDimitry Andric     // FMA nodes.
5470b57cec5SDimitry Andric     // We use the target independent ISD::FMA for the non-inverted case.
5480b57cec5SDimitry Andric     FNMADD,
5490b57cec5SDimitry Andric     FMSUB,
5500b57cec5SDimitry Andric     FNMSUB,
5510b57cec5SDimitry Andric     FMADDSUB,
5520b57cec5SDimitry Andric     FMSUBADD,
5530b57cec5SDimitry Andric 
5540b57cec5SDimitry Andric     // FMA with rounding mode.
5550b57cec5SDimitry Andric     FMADD_RND,
5560b57cec5SDimitry Andric     FNMADD_RND,
5570b57cec5SDimitry Andric     FMSUB_RND,
5580b57cec5SDimitry Andric     FNMSUB_RND,
5590b57cec5SDimitry Andric     FMADDSUB_RND,
5600b57cec5SDimitry Andric     FMSUBADD_RND,
5610b57cec5SDimitry Andric 
5620b57cec5SDimitry Andric     // Compress and expand.
5630b57cec5SDimitry Andric     COMPRESS,
5640b57cec5SDimitry Andric     EXPAND,
5650b57cec5SDimitry Andric 
5660b57cec5SDimitry Andric     // Bits shuffle
5670b57cec5SDimitry Andric     VPSHUFBITQMB,
5680b57cec5SDimitry Andric 
5690b57cec5SDimitry Andric     // Convert Unsigned/Integer to Floating-Point Value with rounding mode.
570*5ffd83dbSDimitry Andric     SINT_TO_FP_RND,
571*5ffd83dbSDimitry Andric     UINT_TO_FP_RND,
572*5ffd83dbSDimitry Andric     SCALAR_SINT_TO_FP,
573*5ffd83dbSDimitry Andric     SCALAR_UINT_TO_FP,
574*5ffd83dbSDimitry Andric     SCALAR_SINT_TO_FP_RND,
575*5ffd83dbSDimitry Andric     SCALAR_UINT_TO_FP_RND,
5760b57cec5SDimitry Andric 
5770b57cec5SDimitry Andric     // Vector float/double to signed/unsigned integer.
578*5ffd83dbSDimitry Andric     CVTP2SI,
579*5ffd83dbSDimitry Andric     CVTP2UI,
580*5ffd83dbSDimitry Andric     CVTP2SI_RND,
581*5ffd83dbSDimitry Andric     CVTP2UI_RND,
5820b57cec5SDimitry Andric     // Scalar float/double to signed/unsigned integer.
583*5ffd83dbSDimitry Andric     CVTS2SI,
584*5ffd83dbSDimitry Andric     CVTS2UI,
585*5ffd83dbSDimitry Andric     CVTS2SI_RND,
586*5ffd83dbSDimitry Andric     CVTS2UI_RND,
5870b57cec5SDimitry Andric 
5880b57cec5SDimitry Andric     // Vector float/double to signed/unsigned integer with truncation.
589*5ffd83dbSDimitry Andric     CVTTP2SI,
590*5ffd83dbSDimitry Andric     CVTTP2UI,
591*5ffd83dbSDimitry Andric     CVTTP2SI_SAE,
592*5ffd83dbSDimitry Andric     CVTTP2UI_SAE,
5930b57cec5SDimitry Andric     // Scalar float/double to signed/unsigned integer with truncation.
594*5ffd83dbSDimitry Andric     CVTTS2SI,
595*5ffd83dbSDimitry Andric     CVTTS2UI,
596*5ffd83dbSDimitry Andric     CVTTS2SI_SAE,
597*5ffd83dbSDimitry Andric     CVTTS2UI_SAE,
5980b57cec5SDimitry Andric 
5990b57cec5SDimitry Andric     // Vector signed/unsigned integer to float/double.
600*5ffd83dbSDimitry Andric     CVTSI2P,
601*5ffd83dbSDimitry Andric     CVTUI2P,
6020b57cec5SDimitry Andric 
6030b57cec5SDimitry Andric     // Masked versions of above. Used for v2f64->v4f32.
6040b57cec5SDimitry Andric     // SRC, PASSTHRU, MASK
605*5ffd83dbSDimitry Andric     MCVTP2SI,
606*5ffd83dbSDimitry Andric     MCVTP2UI,
607*5ffd83dbSDimitry Andric     MCVTTP2SI,
608*5ffd83dbSDimitry Andric     MCVTTP2UI,
609*5ffd83dbSDimitry Andric     MCVTSI2P,
610*5ffd83dbSDimitry Andric     MCVTUI2P,
6110b57cec5SDimitry Andric 
6120b57cec5SDimitry Andric     // Vector float to bfloat16.
6130b57cec5SDimitry Andric     // Convert TWO packed single data to one packed BF16 data
6140b57cec5SDimitry Andric     CVTNE2PS2BF16,
6150b57cec5SDimitry Andric     // Convert packed single data to packed BF16 data
6160b57cec5SDimitry Andric     CVTNEPS2BF16,
6170b57cec5SDimitry Andric     // Masked version of above.
6180b57cec5SDimitry Andric     // SRC, PASSTHRU, MASK
6190b57cec5SDimitry Andric     MCVTNEPS2BF16,
6200b57cec5SDimitry Andric 
6210b57cec5SDimitry Andric     // Dot product of BF16 pairs to accumulated into
6220b57cec5SDimitry Andric     // packed single precision.
6230b57cec5SDimitry Andric     DPBF16PS,
6240b57cec5SDimitry Andric 
6250b57cec5SDimitry Andric     // Save xmm argument registers to the stack, according to %al. An operator
6260b57cec5SDimitry Andric     // is needed so that this can be expanded with control flow.
6270b57cec5SDimitry Andric     VASTART_SAVE_XMM_REGS,
6280b57cec5SDimitry Andric 
6290b57cec5SDimitry Andric     // Windows's _chkstk call to do stack probing.
6300b57cec5SDimitry Andric     WIN_ALLOCA,
6310b57cec5SDimitry Andric 
6320b57cec5SDimitry Andric     // For allocating variable amounts of stack space when using
6330b57cec5SDimitry Andric     // segmented stacks. Check if the current stacklet has enough space, and
6340b57cec5SDimitry Andric     // falls back to heap allocation if not.
6350b57cec5SDimitry Andric     SEG_ALLOCA,
6360b57cec5SDimitry Andric 
637*5ffd83dbSDimitry Andric     // For allocating stack space when using stack clash protector.
638*5ffd83dbSDimitry Andric     // Allocation is performed by block, and each block is probed.
639*5ffd83dbSDimitry Andric     PROBED_ALLOCA,
640*5ffd83dbSDimitry Andric 
6410b57cec5SDimitry Andric     // Memory barriers.
6420b57cec5SDimitry Andric     MEMBARRIER,
6430b57cec5SDimitry Andric     MFENCE,
6440b57cec5SDimitry Andric 
6450b57cec5SDimitry Andric     // Get a random integer and indicate whether it is valid in CF.
6460b57cec5SDimitry Andric     RDRAND,
6470b57cec5SDimitry Andric 
6480b57cec5SDimitry Andric     // Get a NIST SP800-90B & C compliant random integer and
6490b57cec5SDimitry Andric     // indicate whether it is valid in CF.
6500b57cec5SDimitry Andric     RDSEED,
6510b57cec5SDimitry Andric 
6520b57cec5SDimitry Andric     // Protection keys
6530b57cec5SDimitry Andric     // RDPKRU - Operand 0 is chain. Operand 1 is value for ECX.
6540b57cec5SDimitry Andric     // WRPKRU - Operand 0 is chain. Operand 1 is value for EDX. Operand 2 is
6550b57cec5SDimitry Andric     // value for ECX.
656*5ffd83dbSDimitry Andric     RDPKRU,
657*5ffd83dbSDimitry Andric     WRPKRU,
6580b57cec5SDimitry Andric 
6590b57cec5SDimitry Andric     // SSE42 string comparisons.
6600b57cec5SDimitry Andric     // These nodes produce 3 results, index, mask, and flags. X86ISelDAGToDAG
6610b57cec5SDimitry Andric     // will emit one or two instructions based on which results are used. If
6620b57cec5SDimitry Andric     // flags and index/mask this allows us to use a single instruction since
6630b57cec5SDimitry Andric     // we won't have to pick and opcode for flags. Instead we can rely on the
6640b57cec5SDimitry Andric     // DAG to CSE everything and decide at isel.
6650b57cec5SDimitry Andric     PCMPISTR,
6660b57cec5SDimitry Andric     PCMPESTR,
6670b57cec5SDimitry Andric 
6680b57cec5SDimitry Andric     // Test if in transactional execution.
6690b57cec5SDimitry Andric     XTEST,
6700b57cec5SDimitry Andric 
6710b57cec5SDimitry Andric     // ERI instructions.
672*5ffd83dbSDimitry Andric     RSQRT28,
673*5ffd83dbSDimitry Andric     RSQRT28_SAE,
674*5ffd83dbSDimitry Andric     RSQRT28S,
675*5ffd83dbSDimitry Andric     RSQRT28S_SAE,
676*5ffd83dbSDimitry Andric     RCP28,
677*5ffd83dbSDimitry Andric     RCP28_SAE,
678*5ffd83dbSDimitry Andric     RCP28S,
679*5ffd83dbSDimitry Andric     RCP28S_SAE,
680*5ffd83dbSDimitry Andric     EXP2,
681*5ffd83dbSDimitry Andric     EXP2_SAE,
6820b57cec5SDimitry Andric 
6830b57cec5SDimitry Andric     // Conversions between float and half-float.
684*5ffd83dbSDimitry Andric     CVTPS2PH,
685*5ffd83dbSDimitry Andric     CVTPH2PS,
686*5ffd83dbSDimitry Andric     CVTPH2PS_SAE,
6870b57cec5SDimitry Andric 
6880b57cec5SDimitry Andric     // Masked version of above.
6890b57cec5SDimitry Andric     // SRC, RND, PASSTHRU, MASK
6900b57cec5SDimitry Andric     MCVTPS2PH,
6910b57cec5SDimitry Andric 
6920b57cec5SDimitry Andric     // Galois Field Arithmetic Instructions
693*5ffd83dbSDimitry Andric     GF2P8AFFINEINVQB,
694*5ffd83dbSDimitry Andric     GF2P8AFFINEQB,
695*5ffd83dbSDimitry Andric     GF2P8MULB,
6960b57cec5SDimitry Andric 
6970b57cec5SDimitry Andric     // LWP insert record.
6980b57cec5SDimitry Andric     LWPINS,
6990b57cec5SDimitry Andric 
7000b57cec5SDimitry Andric     // User level wait
701*5ffd83dbSDimitry Andric     UMWAIT,
702*5ffd83dbSDimitry Andric     TPAUSE,
7030b57cec5SDimitry Andric 
7040b57cec5SDimitry Andric     // Enqueue Stores Instructions
705*5ffd83dbSDimitry Andric     ENQCMD,
706*5ffd83dbSDimitry Andric     ENQCMDS,
7070b57cec5SDimitry Andric 
7080b57cec5SDimitry Andric     // For avx512-vp2intersect
7090b57cec5SDimitry Andric     VP2INTERSECT,
7100b57cec5SDimitry Andric 
711480093f4SDimitry Andric     /// X86 strict FP compare instructions.
712480093f4SDimitry Andric     STRICT_FCMP = ISD::FIRST_TARGET_STRICTFP_OPCODE,
713480093f4SDimitry Andric     STRICT_FCMPS,
714480093f4SDimitry Andric 
715480093f4SDimitry Andric     // Vector packed double/float comparison.
716480093f4SDimitry Andric     STRICT_CMPP,
717480093f4SDimitry Andric 
718480093f4SDimitry Andric     /// Vector comparison generating mask bits for fp and
719480093f4SDimitry Andric     /// integer signed and unsigned data types.
720480093f4SDimitry Andric     STRICT_CMPM,
721480093f4SDimitry Andric 
722480093f4SDimitry Andric     // Vector float/double to signed/unsigned integer with truncation.
723*5ffd83dbSDimitry Andric     STRICT_CVTTP2SI,
724*5ffd83dbSDimitry Andric     STRICT_CVTTP2UI,
725480093f4SDimitry Andric 
726480093f4SDimitry Andric     // Vector FP extend.
727480093f4SDimitry Andric     STRICT_VFPEXT,
728480093f4SDimitry Andric 
729480093f4SDimitry Andric     // Vector FP round.
730480093f4SDimitry Andric     STRICT_VFPROUND,
731480093f4SDimitry Andric 
732480093f4SDimitry Andric     // RndScale - Round FP Values To Include A Given Number Of Fraction Bits.
733480093f4SDimitry Andric     // Also used by the legacy (V)ROUND intrinsics where we mask out the
734480093f4SDimitry Andric     // scaling part of the immediate.
735480093f4SDimitry Andric     STRICT_VRNDSCALE,
736480093f4SDimitry Andric 
737480093f4SDimitry Andric     // Vector signed/unsigned integer to float/double.
738*5ffd83dbSDimitry Andric     STRICT_CVTSI2P,
739*5ffd83dbSDimitry Andric     STRICT_CVTUI2P,
740*5ffd83dbSDimitry Andric 
741*5ffd83dbSDimitry Andric     // Strict FMA nodes.
742*5ffd83dbSDimitry Andric     STRICT_FNMADD,
743*5ffd83dbSDimitry Andric     STRICT_FMSUB,
744*5ffd83dbSDimitry Andric     STRICT_FNMSUB,
745*5ffd83dbSDimitry Andric 
746*5ffd83dbSDimitry Andric     // Conversions between float and half-float.
747*5ffd83dbSDimitry Andric     STRICT_CVTPS2PH,
748*5ffd83dbSDimitry Andric     STRICT_CVTPH2PS,
749480093f4SDimitry Andric 
7500b57cec5SDimitry Andric     // Compare and swap.
7510b57cec5SDimitry Andric     LCMPXCHG_DAG = ISD::FIRST_TARGET_MEMORY_OPCODE,
7520b57cec5SDimitry Andric     LCMPXCHG8_DAG,
7530b57cec5SDimitry Andric     LCMPXCHG16_DAG,
7540b57cec5SDimitry Andric     LCMPXCHG8_SAVE_EBX_DAG,
7550b57cec5SDimitry Andric     LCMPXCHG16_SAVE_RBX_DAG,
7560b57cec5SDimitry Andric 
7570b57cec5SDimitry Andric     /// LOCK-prefixed arithmetic read-modify-write instructions.
7580b57cec5SDimitry Andric     /// EFLAGS, OUTCHAIN = LADD(INCHAIN, PTR, RHS)
759*5ffd83dbSDimitry Andric     LADD,
760*5ffd83dbSDimitry Andric     LSUB,
761*5ffd83dbSDimitry Andric     LOR,
762*5ffd83dbSDimitry Andric     LXOR,
763*5ffd83dbSDimitry Andric     LAND,
7640b57cec5SDimitry Andric 
7650b57cec5SDimitry Andric     // Load, scalar_to_vector, and zero extend.
7660b57cec5SDimitry Andric     VZEXT_LOAD,
7670b57cec5SDimitry Andric 
7680b57cec5SDimitry Andric     // extract_vector_elt, store.
7690b57cec5SDimitry Andric     VEXTRACT_STORE,
7700b57cec5SDimitry Andric 
7718bcb0991SDimitry Andric     // scalar broadcast from memory
7728bcb0991SDimitry Andric     VBROADCAST_LOAD,
7738bcb0991SDimitry Andric 
7740b57cec5SDimitry Andric     // Store FP control world into i16 memory.
7750b57cec5SDimitry Andric     FNSTCW16m,
7760b57cec5SDimitry Andric 
7770b57cec5SDimitry Andric     /// This instruction implements FP_TO_SINT with the
7780b57cec5SDimitry Andric     /// integer destination in memory and a FP reg source.  This corresponds
7790b57cec5SDimitry Andric     /// to the X86::FIST*m instructions and the rounding mode change stuff. It
7800b57cec5SDimitry Andric     /// has two inputs (token chain and address) and two outputs (int value
7810b57cec5SDimitry Andric     /// and token chain). Memory VT specifies the type to store to.
7820b57cec5SDimitry Andric     FP_TO_INT_IN_MEM,
7830b57cec5SDimitry Andric 
7840b57cec5SDimitry Andric     /// This instruction implements SINT_TO_FP with the
7850b57cec5SDimitry Andric     /// integer source in memory and FP reg result.  This corresponds to the
7860b57cec5SDimitry Andric     /// X86::FILD*m instructions. It has two inputs (token chain and address)
787*5ffd83dbSDimitry Andric     /// and two outputs (FP value and token chain). The integer source type is
788*5ffd83dbSDimitry Andric     /// specified by the memory VT.
7890b57cec5SDimitry Andric     FILD,
7900b57cec5SDimitry Andric 
7910b57cec5SDimitry Andric     /// This instruction implements a fp->int store from FP stack
7920b57cec5SDimitry Andric     /// slots. This corresponds to the fist instruction. It takes a
7930b57cec5SDimitry Andric     /// chain operand, value to store, address, and glue. The memory VT
7940b57cec5SDimitry Andric     /// specifies the type to store as.
7950b57cec5SDimitry Andric     FIST,
7960b57cec5SDimitry Andric 
7970b57cec5SDimitry Andric     /// This instruction implements an extending load to FP stack slots.
7980b57cec5SDimitry Andric     /// This corresponds to the X86::FLD32m / X86::FLD64m. It takes a chain
7990b57cec5SDimitry Andric     /// operand, and ptr to load from. The memory VT specifies the type to
8000b57cec5SDimitry Andric     /// load from.
8010b57cec5SDimitry Andric     FLD,
8020b57cec5SDimitry Andric 
8030b57cec5SDimitry Andric     /// This instruction implements a truncating store from FP stack
8040b57cec5SDimitry Andric     /// slots. This corresponds to the X86::FST32m / X86::FST64m. It takes a
8050b57cec5SDimitry Andric     /// chain operand, value to store, address, and glue. The memory VT
8060b57cec5SDimitry Andric     /// specifies the type to store as.
8070b57cec5SDimitry Andric     FST,
8080b57cec5SDimitry Andric 
8090b57cec5SDimitry Andric     /// This instruction grabs the address of the next argument
8100b57cec5SDimitry Andric     /// from a va_list. (reads and modifies the va_list in memory)
8110b57cec5SDimitry Andric     VAARG_64,
8120b57cec5SDimitry Andric 
8130b57cec5SDimitry Andric     // Vector truncating store with unsigned/signed saturation
814*5ffd83dbSDimitry Andric     VTRUNCSTOREUS,
815*5ffd83dbSDimitry Andric     VTRUNCSTORES,
8160b57cec5SDimitry Andric     // Vector truncating masked store with unsigned/signed saturation
817*5ffd83dbSDimitry Andric     VMTRUNCSTOREUS,
818*5ffd83dbSDimitry Andric     VMTRUNCSTORES,
8190b57cec5SDimitry Andric 
8200b57cec5SDimitry Andric     // X86 specific gather and scatter
821*5ffd83dbSDimitry Andric     MGATHER,
822*5ffd83dbSDimitry Andric     MSCATTER,
8230b57cec5SDimitry Andric 
8240b57cec5SDimitry Andric     // WARNING: Do not add anything in the end unless you want the node to
8250b57cec5SDimitry Andric     // have memop! In fact, starting from FIRST_TARGET_MEMORY_OPCODE all
8260b57cec5SDimitry Andric     // opcodes will be thought as target memory ops!
8270b57cec5SDimitry Andric   };
8280b57cec5SDimitry Andric   } // end namespace X86ISD
8290b57cec5SDimitry Andric 
8300b57cec5SDimitry Andric   /// Define some predicates that are used for node matching.
8310b57cec5SDimitry Andric   namespace X86 {
8320b57cec5SDimitry Andric     /// Returns true if Elt is a constant zero or floating point constant +0.0.
8330b57cec5SDimitry Andric     bool isZeroNode(SDValue Elt);
8340b57cec5SDimitry Andric 
8350b57cec5SDimitry Andric     /// Returns true of the given offset can be
8360b57cec5SDimitry Andric     /// fit into displacement field of the instruction.
8370b57cec5SDimitry Andric     bool isOffsetSuitableForCodeModel(int64_t Offset, CodeModel::Model M,
8380b57cec5SDimitry Andric                                       bool hasSymbolicDisplacement = true);
8390b57cec5SDimitry Andric 
8400b57cec5SDimitry Andric     /// Determines whether the callee is required to pop its
8410b57cec5SDimitry Andric     /// own arguments. Callee pop is necessary to support tail calls.
8420b57cec5SDimitry Andric     bool isCalleePop(CallingConv::ID CallingConv,
8430b57cec5SDimitry Andric                      bool is64Bit, bool IsVarArg, bool GuaranteeTCO);
8440b57cec5SDimitry Andric 
8458bcb0991SDimitry Andric     /// If Op is a constant whose elements are all the same constant or
8468bcb0991SDimitry Andric     /// undefined, return true and return the constant value in \p SplatVal.
847*5ffd83dbSDimitry Andric     /// If we have undef bits that don't cover an entire element, we treat these
848*5ffd83dbSDimitry Andric     /// as zero if AllowPartialUndefs is set, else we fail and return false.
849*5ffd83dbSDimitry Andric     bool isConstantSplat(SDValue Op, APInt &SplatVal,
850*5ffd83dbSDimitry Andric                          bool AllowPartialUndefs = true);
8510b57cec5SDimitry Andric   } // end namespace X86
8520b57cec5SDimitry Andric 
8530b57cec5SDimitry Andric   //===--------------------------------------------------------------------===//
8540b57cec5SDimitry Andric   //  X86 Implementation of the TargetLowering interface
8550b57cec5SDimitry Andric   class X86TargetLowering final : public TargetLowering {
8560b57cec5SDimitry Andric   public:
8570b57cec5SDimitry Andric     explicit X86TargetLowering(const X86TargetMachine &TM,
8580b57cec5SDimitry Andric                                const X86Subtarget &STI);
8590b57cec5SDimitry Andric 
8600b57cec5SDimitry Andric     unsigned getJumpTableEncoding() const override;
8610b57cec5SDimitry Andric     bool useSoftFloat() const override;
8620b57cec5SDimitry Andric 
8630b57cec5SDimitry Andric     void markLibCallAttributes(MachineFunction *MF, unsigned CC,
8640b57cec5SDimitry Andric                                ArgListTy &Args) const override;
8650b57cec5SDimitry Andric 
8660b57cec5SDimitry Andric     MVT getScalarShiftAmountTy(const DataLayout &, EVT VT) const override {
8670b57cec5SDimitry Andric       return MVT::i8;
8680b57cec5SDimitry Andric     }
8690b57cec5SDimitry Andric 
8700b57cec5SDimitry Andric     const MCExpr *
8710b57cec5SDimitry Andric     LowerCustomJumpTableEntry(const MachineJumpTableInfo *MJTI,
8720b57cec5SDimitry Andric                               const MachineBasicBlock *MBB, unsigned uid,
8730b57cec5SDimitry Andric                               MCContext &Ctx) const override;
8740b57cec5SDimitry Andric 
8750b57cec5SDimitry Andric     /// Returns relocation base for the given PIC jumptable.
8760b57cec5SDimitry Andric     SDValue getPICJumpTableRelocBase(SDValue Table,
8770b57cec5SDimitry Andric                                      SelectionDAG &DAG) const override;
8780b57cec5SDimitry Andric     const MCExpr *
8790b57cec5SDimitry Andric     getPICJumpTableRelocBaseExpr(const MachineFunction *MF,
8800b57cec5SDimitry Andric                                  unsigned JTI, MCContext &Ctx) const override;
8810b57cec5SDimitry Andric 
8820b57cec5SDimitry Andric     /// Return the desired alignment for ByVal aggregate
8830b57cec5SDimitry Andric     /// function arguments in the caller parameter area. For X86, aggregates
8840b57cec5SDimitry Andric     /// that contains are placed at 16-byte boundaries while the rest are at
8850b57cec5SDimitry Andric     /// 4-byte boundaries.
8860b57cec5SDimitry Andric     unsigned getByValTypeAlignment(Type *Ty,
8870b57cec5SDimitry Andric                                    const DataLayout &DL) const override;
8880b57cec5SDimitry Andric 
889*5ffd83dbSDimitry Andric     EVT getOptimalMemOpType(const MemOp &Op,
8900b57cec5SDimitry Andric                             const AttributeList &FuncAttributes) const override;
8910b57cec5SDimitry Andric 
8920b57cec5SDimitry Andric     /// Returns true if it's safe to use load / store of the
8930b57cec5SDimitry Andric     /// specified type to expand memcpy / memset inline. This is mostly true
8940b57cec5SDimitry Andric     /// for all types except for some special cases. For example, on X86
8950b57cec5SDimitry Andric     /// targets without SSE2 f64 load / store are done with fldl / fstpl which
8960b57cec5SDimitry Andric     /// also does type conversion. Note the specified type doesn't have to be
8970b57cec5SDimitry Andric     /// legal as the hook is used before type legalization.
8980b57cec5SDimitry Andric     bool isSafeMemOpType(MVT VT) const override;
8990b57cec5SDimitry Andric 
9000b57cec5SDimitry Andric     /// Returns true if the target allows unaligned memory accesses of the
9010b57cec5SDimitry Andric     /// specified type. Returns whether it is "fast" in the last argument.
9020b57cec5SDimitry Andric     bool allowsMisalignedMemoryAccesses(EVT VT, unsigned AS, unsigned Align,
9030b57cec5SDimitry Andric                                         MachineMemOperand::Flags Flags,
9040b57cec5SDimitry Andric                                         bool *Fast) const override;
9050b57cec5SDimitry Andric 
9060b57cec5SDimitry Andric     /// Provide custom lowering hooks for some operations.
9070b57cec5SDimitry Andric     ///
9080b57cec5SDimitry Andric     SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override;
9090b57cec5SDimitry Andric 
9100b57cec5SDimitry Andric     /// Places new result values for the node in Results (their number
9110b57cec5SDimitry Andric     /// and types must exactly match those of the original return values of
9120b57cec5SDimitry Andric     /// the node), or leaves Results empty, which indicates that the node is not
9130b57cec5SDimitry Andric     /// to be custom lowered after all.
9140b57cec5SDimitry Andric     void LowerOperationWrapper(SDNode *N,
9150b57cec5SDimitry Andric                                SmallVectorImpl<SDValue> &Results,
9160b57cec5SDimitry Andric                                SelectionDAG &DAG) const override;
9170b57cec5SDimitry Andric 
9180b57cec5SDimitry Andric     /// Replace the results of node with an illegal result
9190b57cec5SDimitry Andric     /// type with new values built out of custom code.
9200b57cec5SDimitry Andric     ///
9210b57cec5SDimitry Andric     void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue>&Results,
9220b57cec5SDimitry Andric                             SelectionDAG &DAG) const override;
9230b57cec5SDimitry Andric 
9240b57cec5SDimitry Andric     SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override;
9250b57cec5SDimitry Andric 
9260b57cec5SDimitry Andric     /// Return true if the target has native support for
9270b57cec5SDimitry Andric     /// the specified value type and it is 'desirable' to use the type for the
9280b57cec5SDimitry Andric     /// given node type. e.g. On x86 i16 is legal, but undesirable since i16
9290b57cec5SDimitry Andric     /// instruction encodings are longer and some i16 instructions are slow.
9300b57cec5SDimitry Andric     bool isTypeDesirableForOp(unsigned Opc, EVT VT) const override;
9310b57cec5SDimitry Andric 
9320b57cec5SDimitry Andric     /// Return true if the target has native support for the
9330b57cec5SDimitry Andric     /// specified value type and it is 'desirable' to use the type. e.g. On x86
9340b57cec5SDimitry Andric     /// i16 is legal, but undesirable since i16 instruction encodings are longer
9350b57cec5SDimitry Andric     /// and some i16 instructions are slow.
9360b57cec5SDimitry Andric     bool IsDesirableToPromoteOp(SDValue Op, EVT &PVT) const override;
9370b57cec5SDimitry Andric 
938*5ffd83dbSDimitry Andric     /// Return the newly negated expression if the cost is not expensive and
939*5ffd83dbSDimitry Andric     /// set the cost in \p Cost to indicate that if it is cheaper or neutral to
940*5ffd83dbSDimitry Andric     /// do the negation.
9418bcb0991SDimitry Andric     SDValue getNegatedExpression(SDValue Op, SelectionDAG &DAG,
9428bcb0991SDimitry Andric                                  bool LegalOperations, bool ForCodeSize,
943*5ffd83dbSDimitry Andric                                  NegatibleCost &Cost,
9448bcb0991SDimitry Andric                                  unsigned Depth) const override;
9458bcb0991SDimitry Andric 
9460b57cec5SDimitry Andric     MachineBasicBlock *
9470b57cec5SDimitry Andric     EmitInstrWithCustomInserter(MachineInstr &MI,
9480b57cec5SDimitry Andric                                 MachineBasicBlock *MBB) const override;
9490b57cec5SDimitry Andric 
9500b57cec5SDimitry Andric     /// This method returns the name of a target specific DAG node.
9510b57cec5SDimitry Andric     const char *getTargetNodeName(unsigned Opcode) const override;
9520b57cec5SDimitry Andric 
9530b57cec5SDimitry Andric     /// Do not merge vector stores after legalization because that may conflict
9540b57cec5SDimitry Andric     /// with x86-specific store splitting optimizations.
9550b57cec5SDimitry Andric     bool mergeStoresAfterLegalization(EVT MemVT) const override {
9560b57cec5SDimitry Andric       return !MemVT.isVector();
9570b57cec5SDimitry Andric     }
9580b57cec5SDimitry Andric 
9590b57cec5SDimitry Andric     bool canMergeStoresTo(unsigned AddressSpace, EVT MemVT,
9600b57cec5SDimitry Andric                           const SelectionDAG &DAG) const override;
9610b57cec5SDimitry Andric 
9620b57cec5SDimitry Andric     bool isCheapToSpeculateCttz() const override;
9630b57cec5SDimitry Andric 
9640b57cec5SDimitry Andric     bool isCheapToSpeculateCtlz() const override;
9650b57cec5SDimitry Andric 
9660b57cec5SDimitry Andric     bool isCtlzFast() const override;
9670b57cec5SDimitry Andric 
9680b57cec5SDimitry Andric     bool hasBitPreservingFPLogic(EVT VT) const override {
9690b57cec5SDimitry Andric       return VT == MVT::f32 || VT == MVT::f64 || VT.isVector();
9700b57cec5SDimitry Andric     }
9710b57cec5SDimitry Andric 
9720b57cec5SDimitry Andric     bool isMultiStoresCheaperThanBitsMerge(EVT LTy, EVT HTy) const override {
9730b57cec5SDimitry Andric       // If the pair to store is a mixture of float and int values, we will
9740b57cec5SDimitry Andric       // save two bitwise instructions and one float-to-int instruction and
9750b57cec5SDimitry Andric       // increase one store instruction. There is potentially a more
9760b57cec5SDimitry Andric       // significant benefit because it avoids the float->int domain switch
9770b57cec5SDimitry Andric       // for input value. So It is more likely a win.
9780b57cec5SDimitry Andric       if ((LTy.isFloatingPoint() && HTy.isInteger()) ||
9790b57cec5SDimitry Andric           (LTy.isInteger() && HTy.isFloatingPoint()))
9800b57cec5SDimitry Andric         return true;
9810b57cec5SDimitry Andric       // If the pair only contains int values, we will save two bitwise
9820b57cec5SDimitry Andric       // instructions and increase one store instruction (costing one more
9830b57cec5SDimitry Andric       // store buffer). Since the benefit is more blurred so we leave
9840b57cec5SDimitry Andric       // such pair out until we get testcase to prove it is a win.
9850b57cec5SDimitry Andric       return false;
9860b57cec5SDimitry Andric     }
9870b57cec5SDimitry Andric 
9880b57cec5SDimitry Andric     bool isMaskAndCmp0FoldingBeneficial(const Instruction &AndI) const override;
9890b57cec5SDimitry Andric 
9900b57cec5SDimitry Andric     bool hasAndNotCompare(SDValue Y) const override;
9910b57cec5SDimitry Andric 
9920b57cec5SDimitry Andric     bool hasAndNot(SDValue Y) const override;
9930b57cec5SDimitry Andric 
9948bcb0991SDimitry Andric     bool hasBitTest(SDValue X, SDValue Y) const override;
9958bcb0991SDimitry Andric 
9968bcb0991SDimitry Andric     bool shouldProduceAndByConstByHoistingConstFromShiftsLHSOfAnd(
9978bcb0991SDimitry Andric         SDValue X, ConstantSDNode *XC, ConstantSDNode *CC, SDValue Y,
9988bcb0991SDimitry Andric         unsigned OldShiftOpcode, unsigned NewShiftOpcode,
9998bcb0991SDimitry Andric         SelectionDAG &DAG) const override;
10008bcb0991SDimitry Andric 
10010b57cec5SDimitry Andric     bool shouldFoldConstantShiftPairToMask(const SDNode *N,
10020b57cec5SDimitry Andric                                            CombineLevel Level) const override;
10030b57cec5SDimitry Andric 
10040b57cec5SDimitry Andric     bool shouldFoldMaskToVariableShiftPair(SDValue Y) const override;
10050b57cec5SDimitry Andric 
10060b57cec5SDimitry Andric     bool
10070b57cec5SDimitry Andric     shouldTransformSignedTruncationCheck(EVT XVT,
10080b57cec5SDimitry Andric                                          unsigned KeptBits) const override {
10090b57cec5SDimitry Andric       // For vectors, we don't have a preference..
10100b57cec5SDimitry Andric       if (XVT.isVector())
10110b57cec5SDimitry Andric         return false;
10120b57cec5SDimitry Andric 
10130b57cec5SDimitry Andric       auto VTIsOk = [](EVT VT) -> bool {
10140b57cec5SDimitry Andric         return VT == MVT::i8 || VT == MVT::i16 || VT == MVT::i32 ||
10150b57cec5SDimitry Andric                VT == MVT::i64;
10160b57cec5SDimitry Andric       };
10170b57cec5SDimitry Andric 
10180b57cec5SDimitry Andric       // We are ok with KeptBitsVT being byte/word/dword, what MOVS supports.
10190b57cec5SDimitry Andric       // XVT will be larger than KeptBitsVT.
10200b57cec5SDimitry Andric       MVT KeptBitsVT = MVT::getIntegerVT(KeptBits);
10210b57cec5SDimitry Andric       return VTIsOk(XVT) && VTIsOk(KeptBitsVT);
10220b57cec5SDimitry Andric     }
10230b57cec5SDimitry Andric 
10240b57cec5SDimitry Andric     bool shouldExpandShift(SelectionDAG &DAG, SDNode *N) const override;
10250b57cec5SDimitry Andric 
10260b57cec5SDimitry Andric     bool shouldSplatInsEltVarIndex(EVT VT) const override;
10270b57cec5SDimitry Andric 
10280b57cec5SDimitry Andric     bool convertSetCCLogicToBitwiseLogic(EVT VT) const override {
10290b57cec5SDimitry Andric       return VT.isScalarInteger();
10300b57cec5SDimitry Andric     }
10310b57cec5SDimitry Andric 
10320b57cec5SDimitry Andric     /// Vector-sized comparisons are fast using PCMPEQ + PMOVMSK or PTEST.
10330b57cec5SDimitry Andric     MVT hasFastEqualityCompare(unsigned NumBits) const override;
10340b57cec5SDimitry Andric 
10350b57cec5SDimitry Andric     /// Return the value type to use for ISD::SETCC.
10360b57cec5SDimitry Andric     EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Context,
10370b57cec5SDimitry Andric                            EVT VT) const override;
10380b57cec5SDimitry Andric 
1039*5ffd83dbSDimitry Andric     bool targetShrinkDemandedConstant(SDValue Op, const APInt &DemandedBits,
1040*5ffd83dbSDimitry Andric                                       const APInt &DemandedElts,
10410b57cec5SDimitry Andric                                       TargetLoweringOpt &TLO) const override;
10420b57cec5SDimitry Andric 
10430b57cec5SDimitry Andric     /// Determine which of the bits specified in Mask are known to be either
10440b57cec5SDimitry Andric     /// zero or one and return them in the KnownZero/KnownOne bitsets.
10450b57cec5SDimitry Andric     void computeKnownBitsForTargetNode(const SDValue Op,
10460b57cec5SDimitry Andric                                        KnownBits &Known,
10470b57cec5SDimitry Andric                                        const APInt &DemandedElts,
10480b57cec5SDimitry Andric                                        const SelectionDAG &DAG,
10490b57cec5SDimitry Andric                                        unsigned Depth = 0) const override;
10500b57cec5SDimitry Andric 
10510b57cec5SDimitry Andric     /// Determine the number of bits in the operation that are sign bits.
10520b57cec5SDimitry Andric     unsigned ComputeNumSignBitsForTargetNode(SDValue Op,
10530b57cec5SDimitry Andric                                              const APInt &DemandedElts,
10540b57cec5SDimitry Andric                                              const SelectionDAG &DAG,
10550b57cec5SDimitry Andric                                              unsigned Depth) const override;
10560b57cec5SDimitry Andric 
10570b57cec5SDimitry Andric     bool SimplifyDemandedVectorEltsForTargetNode(SDValue Op,
10580b57cec5SDimitry Andric                                                  const APInt &DemandedElts,
10590b57cec5SDimitry Andric                                                  APInt &KnownUndef,
10600b57cec5SDimitry Andric                                                  APInt &KnownZero,
10610b57cec5SDimitry Andric                                                  TargetLoweringOpt &TLO,
10620b57cec5SDimitry Andric                                                  unsigned Depth) const override;
10630b57cec5SDimitry Andric 
1064*5ffd83dbSDimitry Andric     bool SimplifyDemandedVectorEltsForTargetShuffle(SDValue Op,
1065*5ffd83dbSDimitry Andric                                                     const APInt &DemandedElts,
1066*5ffd83dbSDimitry Andric                                                     unsigned MaskIndex,
1067*5ffd83dbSDimitry Andric                                                     TargetLoweringOpt &TLO,
1068*5ffd83dbSDimitry Andric                                                     unsigned Depth) const;
1069*5ffd83dbSDimitry Andric 
10700b57cec5SDimitry Andric     bool SimplifyDemandedBitsForTargetNode(SDValue Op,
10710b57cec5SDimitry Andric                                            const APInt &DemandedBits,
10720b57cec5SDimitry Andric                                            const APInt &DemandedElts,
10730b57cec5SDimitry Andric                                            KnownBits &Known,
10740b57cec5SDimitry Andric                                            TargetLoweringOpt &TLO,
10750b57cec5SDimitry Andric                                            unsigned Depth) const override;
10760b57cec5SDimitry Andric 
10778bcb0991SDimitry Andric     SDValue SimplifyMultipleUseDemandedBitsForTargetNode(
10788bcb0991SDimitry Andric         SDValue Op, const APInt &DemandedBits, const APInt &DemandedElts,
10798bcb0991SDimitry Andric         SelectionDAG &DAG, unsigned Depth) const override;
10808bcb0991SDimitry Andric 
10810b57cec5SDimitry Andric     const Constant *getTargetConstantFromLoad(LoadSDNode *LD) const override;
10820b57cec5SDimitry Andric 
10830b57cec5SDimitry Andric     SDValue unwrapAddress(SDValue N) const override;
10840b57cec5SDimitry Andric 
10850b57cec5SDimitry Andric     SDValue getReturnAddressFrameIndex(SelectionDAG &DAG) const;
10860b57cec5SDimitry Andric 
10870b57cec5SDimitry Andric     bool ExpandInlineAsm(CallInst *CI) const override;
10880b57cec5SDimitry Andric 
10890b57cec5SDimitry Andric     ConstraintType getConstraintType(StringRef Constraint) const override;
10900b57cec5SDimitry Andric 
10910b57cec5SDimitry Andric     /// Examine constraint string and operand type and determine a weight value.
10920b57cec5SDimitry Andric     /// The operand object must already have been set up with the operand type.
10930b57cec5SDimitry Andric     ConstraintWeight
10940b57cec5SDimitry Andric       getSingleConstraintMatchWeight(AsmOperandInfo &info,
10950b57cec5SDimitry Andric                                      const char *constraint) const override;
10960b57cec5SDimitry Andric 
10970b57cec5SDimitry Andric     const char *LowerXConstraint(EVT ConstraintVT) const override;
10980b57cec5SDimitry Andric 
10990b57cec5SDimitry Andric     /// Lower the specified operand into the Ops vector. If it is invalid, don't
11000b57cec5SDimitry Andric     /// add anything to Ops. If hasMemory is true it means one of the asm
11010b57cec5SDimitry Andric     /// constraint of the inline asm instruction being processed is 'm'.
11020b57cec5SDimitry Andric     void LowerAsmOperandForConstraint(SDValue Op,
11030b57cec5SDimitry Andric                                       std::string &Constraint,
11040b57cec5SDimitry Andric                                       std::vector<SDValue> &Ops,
11050b57cec5SDimitry Andric                                       SelectionDAG &DAG) const override;
11060b57cec5SDimitry Andric 
11070b57cec5SDimitry Andric     unsigned
11080b57cec5SDimitry Andric     getInlineAsmMemConstraint(StringRef ConstraintCode) const override {
1109480093f4SDimitry Andric       if (ConstraintCode == "o")
11100b57cec5SDimitry Andric         return InlineAsm::Constraint_o;
11110b57cec5SDimitry Andric       else if (ConstraintCode == "v")
11120b57cec5SDimitry Andric         return InlineAsm::Constraint_v;
11130b57cec5SDimitry Andric       else if (ConstraintCode == "X")
11140b57cec5SDimitry Andric         return InlineAsm::Constraint_X;
11150b57cec5SDimitry Andric       return TargetLowering::getInlineAsmMemConstraint(ConstraintCode);
11160b57cec5SDimitry Andric     }
11170b57cec5SDimitry Andric 
11180b57cec5SDimitry Andric     /// Handle Lowering flag assembly outputs.
11190b57cec5SDimitry Andric     SDValue LowerAsmOutputForConstraint(SDValue &Chain, SDValue &Flag, SDLoc DL,
11200b57cec5SDimitry Andric                                         const AsmOperandInfo &Constraint,
11210b57cec5SDimitry Andric                                         SelectionDAG &DAG) const override;
11220b57cec5SDimitry Andric 
11230b57cec5SDimitry Andric     /// Given a physical register constraint
11240b57cec5SDimitry Andric     /// (e.g. {edx}), return the register number and the register class for the
11250b57cec5SDimitry Andric     /// register.  This should only be used for C_Register constraints.  On
11260b57cec5SDimitry Andric     /// error, this returns a register number of 0.
11270b57cec5SDimitry Andric     std::pair<unsigned, const TargetRegisterClass *>
11280b57cec5SDimitry Andric     getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI,
11290b57cec5SDimitry Andric                                  StringRef Constraint, MVT VT) const override;
11300b57cec5SDimitry Andric 
11310b57cec5SDimitry Andric     /// Return true if the addressing mode represented
11320b57cec5SDimitry Andric     /// by AM is legal for this target, for a load/store of the specified type.
11330b57cec5SDimitry Andric     bool isLegalAddressingMode(const DataLayout &DL, const AddrMode &AM,
11340b57cec5SDimitry Andric                                Type *Ty, unsigned AS,
11350b57cec5SDimitry Andric                                Instruction *I = nullptr) const override;
11360b57cec5SDimitry Andric 
11370b57cec5SDimitry Andric     /// Return true if the specified immediate is legal
11380b57cec5SDimitry Andric     /// icmp immediate, that is the target has icmp instructions which can
11390b57cec5SDimitry Andric     /// compare a register against the immediate without having to materialize
11400b57cec5SDimitry Andric     /// the immediate into a register.
11410b57cec5SDimitry Andric     bool isLegalICmpImmediate(int64_t Imm) const override;
11420b57cec5SDimitry Andric 
11430b57cec5SDimitry Andric     /// Return true if the specified immediate is legal
11440b57cec5SDimitry Andric     /// add immediate, that is the target has add instructions which can
11450b57cec5SDimitry Andric     /// add a register and the immediate without having to materialize
11460b57cec5SDimitry Andric     /// the immediate into a register.
11470b57cec5SDimitry Andric     bool isLegalAddImmediate(int64_t Imm) const override;
11480b57cec5SDimitry Andric 
11490b57cec5SDimitry Andric     bool isLegalStoreImmediate(int64_t Imm) const override;
11500b57cec5SDimitry Andric 
11510b57cec5SDimitry Andric     /// Return the cost of the scaling factor used in the addressing
11520b57cec5SDimitry Andric     /// mode represented by AM for this target, for a load/store
11530b57cec5SDimitry Andric     /// of the specified type.
11540b57cec5SDimitry Andric     /// If the AM is supported, the return value must be >= 0.
11550b57cec5SDimitry Andric     /// If the AM is not supported, it returns a negative value.
11560b57cec5SDimitry Andric     int getScalingFactorCost(const DataLayout &DL, const AddrMode &AM, Type *Ty,
11570b57cec5SDimitry Andric                              unsigned AS) const override;
11580b57cec5SDimitry Andric 
1159*5ffd83dbSDimitry Andric     /// This is used to enable splatted operand transforms for vector shifts
1160*5ffd83dbSDimitry Andric     /// and vector funnel shifts.
11610b57cec5SDimitry Andric     bool isVectorShiftByScalarCheap(Type *Ty) const override;
11620b57cec5SDimitry Andric 
11630b57cec5SDimitry Andric     /// Add x86-specific opcodes to the default list.
11640b57cec5SDimitry Andric     bool isBinOp(unsigned Opcode) const override;
11650b57cec5SDimitry Andric 
11660b57cec5SDimitry Andric     /// Returns true if the opcode is a commutative binary operation.
11670b57cec5SDimitry Andric     bool isCommutativeBinOp(unsigned Opcode) const override;
11680b57cec5SDimitry Andric 
11690b57cec5SDimitry Andric     /// Return true if it's free to truncate a value of
11700b57cec5SDimitry Andric     /// type Ty1 to type Ty2. e.g. On x86 it's free to truncate a i32 value in
11710b57cec5SDimitry Andric     /// register EAX to i16 by referencing its sub-register AX.
11720b57cec5SDimitry Andric     bool isTruncateFree(Type *Ty1, Type *Ty2) const override;
11730b57cec5SDimitry Andric     bool isTruncateFree(EVT VT1, EVT VT2) const override;
11740b57cec5SDimitry Andric 
11750b57cec5SDimitry Andric     bool allowTruncateForTailCall(Type *Ty1, Type *Ty2) const override;
11760b57cec5SDimitry Andric 
11770b57cec5SDimitry Andric     /// Return true if any actual instruction that defines a
11780b57cec5SDimitry Andric     /// value of type Ty1 implicit zero-extends the value to Ty2 in the result
11790b57cec5SDimitry Andric     /// register. This does not necessarily include registers defined in
11800b57cec5SDimitry Andric     /// unknown ways, such as incoming arguments, or copies from unknown
11810b57cec5SDimitry Andric     /// virtual registers. Also, if isTruncateFree(Ty2, Ty1) is true, this
11820b57cec5SDimitry Andric     /// does not necessarily apply to truncate instructions. e.g. on x86-64,
11830b57cec5SDimitry Andric     /// all instructions that define 32-bit values implicit zero-extend the
11840b57cec5SDimitry Andric     /// result out to 64 bits.
11850b57cec5SDimitry Andric     bool isZExtFree(Type *Ty1, Type *Ty2) const override;
11860b57cec5SDimitry Andric     bool isZExtFree(EVT VT1, EVT VT2) const override;
11870b57cec5SDimitry Andric     bool isZExtFree(SDValue Val, EVT VT2) const override;
11880b57cec5SDimitry Andric 
1189*5ffd83dbSDimitry Andric     bool shouldSinkOperands(Instruction *I,
1190*5ffd83dbSDimitry Andric                             SmallVectorImpl<Use *> &Ops) const override;
1191*5ffd83dbSDimitry Andric     bool shouldConvertPhiType(Type *From, Type *To) const override;
1192*5ffd83dbSDimitry Andric 
11930b57cec5SDimitry Andric     /// Return true if folding a vector load into ExtVal (a sign, zero, or any
11940b57cec5SDimitry Andric     /// extend node) is profitable.
11950b57cec5SDimitry Andric     bool isVectorLoadExtDesirable(SDValue) const override;
11960b57cec5SDimitry Andric 
11970b57cec5SDimitry Andric     /// Return true if an FMA operation is faster than a pair of fmul and fadd
11980b57cec5SDimitry Andric     /// instructions. fmuladd intrinsics will be expanded to FMAs when this
11990b57cec5SDimitry Andric     /// method returns true, otherwise fmuladd is expanded to fmul + fadd.
1200480093f4SDimitry Andric     bool isFMAFasterThanFMulAndFAdd(const MachineFunction &MF,
1201480093f4SDimitry Andric                                     EVT VT) const override;
12020b57cec5SDimitry Andric 
12030b57cec5SDimitry Andric     /// Return true if it's profitable to narrow
12040b57cec5SDimitry Andric     /// operations of type VT1 to VT2. e.g. on x86, it's profitable to narrow
12050b57cec5SDimitry Andric     /// from i32 to i8 but not from i32 to i16.
12060b57cec5SDimitry Andric     bool isNarrowingProfitable(EVT VT1, EVT VT2) const override;
12070b57cec5SDimitry Andric 
12080b57cec5SDimitry Andric     /// Given an intrinsic, checks if on the target the intrinsic will need to map
12090b57cec5SDimitry Andric     /// to a MemIntrinsicNode (touches memory). If this is the case, it returns
12100b57cec5SDimitry Andric     /// true and stores the intrinsic information into the IntrinsicInfo that was
12110b57cec5SDimitry Andric     /// passed to the function.
12120b57cec5SDimitry Andric     bool getTgtMemIntrinsic(IntrinsicInfo &Info, const CallInst &I,
12130b57cec5SDimitry Andric                             MachineFunction &MF,
12140b57cec5SDimitry Andric                             unsigned Intrinsic) const override;
12150b57cec5SDimitry Andric 
12160b57cec5SDimitry Andric     /// Returns true if the target can instruction select the
12170b57cec5SDimitry Andric     /// specified FP immediate natively. If false, the legalizer will
12180b57cec5SDimitry Andric     /// materialize the FP immediate as a load from a constant pool.
12190b57cec5SDimitry Andric     bool isFPImmLegal(const APFloat &Imm, EVT VT,
12200b57cec5SDimitry Andric                       bool ForCodeSize) const override;
12210b57cec5SDimitry Andric 
12220b57cec5SDimitry Andric     /// Targets can use this to indicate that they only support *some*
12230b57cec5SDimitry Andric     /// VECTOR_SHUFFLE operations, those with specific masks. By default, if a
12240b57cec5SDimitry Andric     /// target supports the VECTOR_SHUFFLE node, all mask values are assumed to
12250b57cec5SDimitry Andric     /// be legal.
12260b57cec5SDimitry Andric     bool isShuffleMaskLegal(ArrayRef<int> Mask, EVT VT) const override;
12270b57cec5SDimitry Andric 
12280b57cec5SDimitry Andric     /// Similar to isShuffleMaskLegal. Targets can use this to indicate if there
12290b57cec5SDimitry Andric     /// is a suitable VECTOR_SHUFFLE that can be used to replace a VAND with a
12300b57cec5SDimitry Andric     /// constant pool entry.
12310b57cec5SDimitry Andric     bool isVectorClearMaskLegal(ArrayRef<int> Mask, EVT VT) const override;
12320b57cec5SDimitry Andric 
12330b57cec5SDimitry Andric     /// Returns true if lowering to a jump table is allowed.
12340b57cec5SDimitry Andric     bool areJTsAllowed(const Function *Fn) const override;
12350b57cec5SDimitry Andric 
12360b57cec5SDimitry Andric     /// If true, then instruction selection should
12370b57cec5SDimitry Andric     /// seek to shrink the FP constant of the specified type to a smaller type
12380b57cec5SDimitry Andric     /// in order to save space and / or reduce runtime.
12390b57cec5SDimitry Andric     bool ShouldShrinkFPConstant(EVT VT) const override {
12400b57cec5SDimitry Andric       // Don't shrink FP constpool if SSE2 is available since cvtss2sd is more
12410b57cec5SDimitry Andric       // expensive than a straight movsd. On the other hand, it's important to
12420b57cec5SDimitry Andric       // shrink long double fp constant since fldt is very slow.
12430b57cec5SDimitry Andric       return !X86ScalarSSEf64 || VT == MVT::f80;
12440b57cec5SDimitry Andric     }
12450b57cec5SDimitry Andric 
12460b57cec5SDimitry Andric     /// Return true if we believe it is correct and profitable to reduce the
12470b57cec5SDimitry Andric     /// load node to a smaller type.
12480b57cec5SDimitry Andric     bool shouldReduceLoadWidth(SDNode *Load, ISD::LoadExtType ExtTy,
12490b57cec5SDimitry Andric                                EVT NewVT) const override;
12500b57cec5SDimitry Andric 
12510b57cec5SDimitry Andric     /// Return true if the specified scalar FP type is computed in an SSE
12520b57cec5SDimitry Andric     /// register, not on the X87 floating point stack.
12530b57cec5SDimitry Andric     bool isScalarFPTypeInSSEReg(EVT VT) const {
12540b57cec5SDimitry Andric       return (VT == MVT::f64 && X86ScalarSSEf64) || // f64 is when SSE2
12550b57cec5SDimitry Andric              (VT == MVT::f32 && X86ScalarSSEf32);   // f32 is when SSE1
12560b57cec5SDimitry Andric     }
12570b57cec5SDimitry Andric 
12580b57cec5SDimitry Andric     /// Returns true if it is beneficial to convert a load of a constant
12590b57cec5SDimitry Andric     /// to just the constant itself.
12600b57cec5SDimitry Andric     bool shouldConvertConstantLoadToIntImm(const APInt &Imm,
12610b57cec5SDimitry Andric                                            Type *Ty) const override;
12620b57cec5SDimitry Andric 
12638bcb0991SDimitry Andric     bool reduceSelectOfFPConstantLoads(EVT CmpOpVT) const override;
12640b57cec5SDimitry Andric 
12650b57cec5SDimitry Andric     bool convertSelectOfConstantsToMath(EVT VT) const override;
12660b57cec5SDimitry Andric 
12678bcb0991SDimitry Andric     bool decomposeMulByConstant(LLVMContext &Context, EVT VT,
12688bcb0991SDimitry Andric                                 SDValue C) const override;
12690b57cec5SDimitry Andric 
12700b57cec5SDimitry Andric     /// Return true if EXTRACT_SUBVECTOR is cheap for this result type
12710b57cec5SDimitry Andric     /// with this index.
12720b57cec5SDimitry Andric     bool isExtractSubvectorCheap(EVT ResVT, EVT SrcVT,
12730b57cec5SDimitry Andric                                  unsigned Index) const override;
12740b57cec5SDimitry Andric 
12750b57cec5SDimitry Andric     /// Scalar ops always have equal or better analysis/performance/power than
12760b57cec5SDimitry Andric     /// the vector equivalent, so this always makes sense if the scalar op is
12770b57cec5SDimitry Andric     /// supported.
12780b57cec5SDimitry Andric     bool shouldScalarizeBinop(SDValue) const override;
12790b57cec5SDimitry Andric 
12800b57cec5SDimitry Andric     /// Extract of a scalar FP value from index 0 of a vector is free.
12810b57cec5SDimitry Andric     bool isExtractVecEltCheap(EVT VT, unsigned Index) const override {
12820b57cec5SDimitry Andric       EVT EltVT = VT.getScalarType();
12830b57cec5SDimitry Andric       return (EltVT == MVT::f32 || EltVT == MVT::f64) && Index == 0;
12840b57cec5SDimitry Andric     }
12850b57cec5SDimitry Andric 
12860b57cec5SDimitry Andric     /// Overflow nodes should get combined/lowered to optimal instructions
12870b57cec5SDimitry Andric     /// (they should allow eliminating explicit compares by getting flags from
12880b57cec5SDimitry Andric     /// math ops).
1289*5ffd83dbSDimitry Andric     bool shouldFormOverflowOp(unsigned Opcode, EVT VT,
1290*5ffd83dbSDimitry Andric                               bool MathUsed) const override;
12910b57cec5SDimitry Andric 
12920b57cec5SDimitry Andric     bool storeOfVectorConstantIsCheap(EVT MemVT, unsigned NumElem,
12930b57cec5SDimitry Andric                                       unsigned AddrSpace) const override {
12940b57cec5SDimitry Andric       // If we can replace more than 2 scalar stores, there will be a reduction
12950b57cec5SDimitry Andric       // in instructions even after we add a vector constant load.
12960b57cec5SDimitry Andric       return NumElem > 2;
12970b57cec5SDimitry Andric     }
12980b57cec5SDimitry Andric 
12990b57cec5SDimitry Andric     bool isLoadBitCastBeneficial(EVT LoadVT, EVT BitcastVT,
13000b57cec5SDimitry Andric                                  const SelectionDAG &DAG,
13010b57cec5SDimitry Andric                                  const MachineMemOperand &MMO) const override;
13020b57cec5SDimitry Andric 
13030b57cec5SDimitry Andric     /// Intel processors have a unified instruction and data cache
13040b57cec5SDimitry Andric     const char * getClearCacheBuiltinName() const override {
13050b57cec5SDimitry Andric       return nullptr; // nothing to do, move along.
13060b57cec5SDimitry Andric     }
13070b57cec5SDimitry Andric 
1308480093f4SDimitry Andric     Register getRegisterByName(const char* RegName, LLT VT,
13098bcb0991SDimitry Andric                                const MachineFunction &MF) const override;
13100b57cec5SDimitry Andric 
13110b57cec5SDimitry Andric     /// If a physical register, this returns the register that receives the
13120b57cec5SDimitry Andric     /// exception address on entry to an EH pad.
1313*5ffd83dbSDimitry Andric     Register
13140b57cec5SDimitry Andric     getExceptionPointerRegister(const Constant *PersonalityFn) const override;
13150b57cec5SDimitry Andric 
13160b57cec5SDimitry Andric     /// If a physical register, this returns the register that receives the
13170b57cec5SDimitry Andric     /// exception typeid on entry to a landing pad.
1318*5ffd83dbSDimitry Andric     Register
13190b57cec5SDimitry Andric     getExceptionSelectorRegister(const Constant *PersonalityFn) const override;
13200b57cec5SDimitry Andric 
13210b57cec5SDimitry Andric     virtual bool needsFixedCatchObjects() const override;
13220b57cec5SDimitry Andric 
13230b57cec5SDimitry Andric     /// This method returns a target specific FastISel object,
13240b57cec5SDimitry Andric     /// or null if the target does not support "fast" ISel.
13250b57cec5SDimitry Andric     FastISel *createFastISel(FunctionLoweringInfo &funcInfo,
13260b57cec5SDimitry Andric                              const TargetLibraryInfo *libInfo) const override;
13270b57cec5SDimitry Andric 
13280b57cec5SDimitry Andric     /// If the target has a standard location for the stack protector cookie,
13290b57cec5SDimitry Andric     /// returns the address of that location. Otherwise, returns nullptr.
13300b57cec5SDimitry Andric     Value *getIRStackGuard(IRBuilder<> &IRB) const override;
13310b57cec5SDimitry Andric 
13320b57cec5SDimitry Andric     bool useLoadStackGuardNode() const override;
13330b57cec5SDimitry Andric     bool useStackGuardXorFP() const override;
13340b57cec5SDimitry Andric     void insertSSPDeclarations(Module &M) const override;
13350b57cec5SDimitry Andric     Value *getSDagStackGuard(const Module &M) const override;
13360b57cec5SDimitry Andric     Function *getSSPStackGuardCheck(const Module &M) const override;
13370b57cec5SDimitry Andric     SDValue emitStackGuardXorFP(SelectionDAG &DAG, SDValue Val,
13380b57cec5SDimitry Andric                                 const SDLoc &DL) const override;
13390b57cec5SDimitry Andric 
13400b57cec5SDimitry Andric 
13410b57cec5SDimitry Andric     /// Return true if the target stores SafeStack pointer at a fixed offset in
13420b57cec5SDimitry Andric     /// some non-standard address space, and populates the address space and
13430b57cec5SDimitry Andric     /// offset as appropriate.
13440b57cec5SDimitry Andric     Value *getSafeStackPointerLocation(IRBuilder<> &IRB) const override;
13450b57cec5SDimitry Andric 
1346*5ffd83dbSDimitry Andric     std::pair<SDValue, SDValue> BuildFILD(EVT DstVT, EVT SrcVT, const SDLoc &DL,
1347*5ffd83dbSDimitry Andric                                           SDValue Chain, SDValue Pointer,
1348*5ffd83dbSDimitry Andric                                           MachinePointerInfo PtrInfo,
1349*5ffd83dbSDimitry Andric                                           Align Alignment,
13500b57cec5SDimitry Andric                                           SelectionDAG &DAG) const;
13510b57cec5SDimitry Andric 
13520b57cec5SDimitry Andric     bool isNoopAddrSpaceCast(unsigned SrcAS, unsigned DestAS) const override;
13530b57cec5SDimitry Andric 
13540b57cec5SDimitry Andric     /// Customize the preferred legalization strategy for certain types.
13550b57cec5SDimitry Andric     LegalizeTypeAction getPreferredVectorAction(MVT VT) const override;
13560b57cec5SDimitry Andric 
1357*5ffd83dbSDimitry Andric     bool softPromoteHalfType() const override { return true; }
1358*5ffd83dbSDimitry Andric 
13590b57cec5SDimitry Andric     MVT getRegisterTypeForCallingConv(LLVMContext &Context, CallingConv::ID CC,
13600b57cec5SDimitry Andric                                       EVT VT) const override;
13610b57cec5SDimitry Andric 
13620b57cec5SDimitry Andric     unsigned getNumRegistersForCallingConv(LLVMContext &Context,
13630b57cec5SDimitry Andric                                            CallingConv::ID CC,
13640b57cec5SDimitry Andric                                            EVT VT) const override;
13650b57cec5SDimitry Andric 
13668bcb0991SDimitry Andric     unsigned getVectorTypeBreakdownForCallingConv(
13678bcb0991SDimitry Andric         LLVMContext &Context, CallingConv::ID CC, EVT VT, EVT &IntermediateVT,
13688bcb0991SDimitry Andric         unsigned &NumIntermediates, MVT &RegisterVT) const override;
13698bcb0991SDimitry Andric 
13700b57cec5SDimitry Andric     bool isIntDivCheap(EVT VT, AttributeList Attr) const override;
13710b57cec5SDimitry Andric 
13720b57cec5SDimitry Andric     bool supportSwiftError() const override;
13730b57cec5SDimitry Andric 
1374*5ffd83dbSDimitry Andric     bool hasStackProbeSymbol(MachineFunction &MF) const override;
1375*5ffd83dbSDimitry Andric     bool hasInlineStackProbe(MachineFunction &MF) const override;
13760b57cec5SDimitry Andric     StringRef getStackProbeSymbolName(MachineFunction &MF) const override;
13770b57cec5SDimitry Andric 
13788bcb0991SDimitry Andric     unsigned getStackProbeSize(MachineFunction &MF) const;
13798bcb0991SDimitry Andric 
13800b57cec5SDimitry Andric     bool hasVectorBlend() const override { return true; }
13810b57cec5SDimitry Andric 
13820b57cec5SDimitry Andric     unsigned getMaxSupportedInterleaveFactor() const override { return 4; }
13830b57cec5SDimitry Andric 
13840b57cec5SDimitry Andric     /// Lower interleaved load(s) into target specific
13850b57cec5SDimitry Andric     /// instructions/intrinsics.
13860b57cec5SDimitry Andric     bool lowerInterleavedLoad(LoadInst *LI,
13870b57cec5SDimitry Andric                               ArrayRef<ShuffleVectorInst *> Shuffles,
13880b57cec5SDimitry Andric                               ArrayRef<unsigned> Indices,
13890b57cec5SDimitry Andric                               unsigned Factor) const override;
13900b57cec5SDimitry Andric 
13910b57cec5SDimitry Andric     /// Lower interleaved store(s) into target specific
13920b57cec5SDimitry Andric     /// instructions/intrinsics.
13930b57cec5SDimitry Andric     bool lowerInterleavedStore(StoreInst *SI, ShuffleVectorInst *SVI,
13940b57cec5SDimitry Andric                                unsigned Factor) const override;
13950b57cec5SDimitry Andric 
13960b57cec5SDimitry Andric     SDValue expandIndirectJTBranch(const SDLoc& dl, SDValue Value,
13970b57cec5SDimitry Andric                                    SDValue Addr, SelectionDAG &DAG)
13980b57cec5SDimitry Andric                                    const override;
13990b57cec5SDimitry Andric 
14000b57cec5SDimitry Andric   protected:
14010b57cec5SDimitry Andric     std::pair<const TargetRegisterClass *, uint8_t>
14020b57cec5SDimitry Andric     findRepresentativeClass(const TargetRegisterInfo *TRI,
14030b57cec5SDimitry Andric                             MVT VT) const override;
14040b57cec5SDimitry Andric 
14050b57cec5SDimitry Andric   private:
14060b57cec5SDimitry Andric     /// Keep a reference to the X86Subtarget around so that we can
14070b57cec5SDimitry Andric     /// make the right decision when generating code for different targets.
14080b57cec5SDimitry Andric     const X86Subtarget &Subtarget;
14090b57cec5SDimitry Andric 
14100b57cec5SDimitry Andric     /// Select between SSE or x87 floating point ops.
14110b57cec5SDimitry Andric     /// When SSE is available, use it for f32 operations.
14120b57cec5SDimitry Andric     /// When SSE2 is available, use it for f64 operations.
14130b57cec5SDimitry Andric     bool X86ScalarSSEf32;
14140b57cec5SDimitry Andric     bool X86ScalarSSEf64;
14150b57cec5SDimitry Andric 
14160b57cec5SDimitry Andric     /// A list of legal FP immediates.
14170b57cec5SDimitry Andric     std::vector<APFloat> LegalFPImmediates;
14180b57cec5SDimitry Andric 
14190b57cec5SDimitry Andric     /// Indicate that this x86 target can instruction
14200b57cec5SDimitry Andric     /// select the specified FP immediate natively.
14210b57cec5SDimitry Andric     void addLegalFPImmediate(const APFloat& Imm) {
14220b57cec5SDimitry Andric       LegalFPImmediates.push_back(Imm);
14230b57cec5SDimitry Andric     }
14240b57cec5SDimitry Andric 
14250b57cec5SDimitry Andric     SDValue LowerCallResult(SDValue Chain, SDValue InFlag,
14260b57cec5SDimitry Andric                             CallingConv::ID CallConv, bool isVarArg,
14270b57cec5SDimitry Andric                             const SmallVectorImpl<ISD::InputArg> &Ins,
14280b57cec5SDimitry Andric                             const SDLoc &dl, SelectionDAG &DAG,
14290b57cec5SDimitry Andric                             SmallVectorImpl<SDValue> &InVals,
14300b57cec5SDimitry Andric                             uint32_t *RegMask) const;
14310b57cec5SDimitry Andric     SDValue LowerMemArgument(SDValue Chain, CallingConv::ID CallConv,
14320b57cec5SDimitry Andric                              const SmallVectorImpl<ISD::InputArg> &ArgInfo,
14330b57cec5SDimitry Andric                              const SDLoc &dl, SelectionDAG &DAG,
14340b57cec5SDimitry Andric                              const CCValAssign &VA, MachineFrameInfo &MFI,
14350b57cec5SDimitry Andric                              unsigned i) const;
14360b57cec5SDimitry Andric     SDValue LowerMemOpCallTo(SDValue Chain, SDValue StackPtr, SDValue Arg,
14370b57cec5SDimitry Andric                              const SDLoc &dl, SelectionDAG &DAG,
14380b57cec5SDimitry Andric                              const CCValAssign &VA,
1439*5ffd83dbSDimitry Andric                              ISD::ArgFlagsTy Flags, bool isByval) const;
14400b57cec5SDimitry Andric 
14410b57cec5SDimitry Andric     // Call lowering helpers.
14420b57cec5SDimitry Andric 
14430b57cec5SDimitry Andric     /// Check whether the call is eligible for tail call optimization. Targets
14440b57cec5SDimitry Andric     /// that want to do tail call optimization should implement this function.
14450b57cec5SDimitry Andric     bool IsEligibleForTailCallOptimization(SDValue Callee,
14460b57cec5SDimitry Andric                                            CallingConv::ID CalleeCC,
14470b57cec5SDimitry Andric                                            bool isVarArg,
14480b57cec5SDimitry Andric                                            bool isCalleeStructRet,
14490b57cec5SDimitry Andric                                            bool isCallerStructRet,
14500b57cec5SDimitry Andric                                            Type *RetTy,
14510b57cec5SDimitry Andric                                     const SmallVectorImpl<ISD::OutputArg> &Outs,
14520b57cec5SDimitry Andric                                     const SmallVectorImpl<SDValue> &OutVals,
14530b57cec5SDimitry Andric                                     const SmallVectorImpl<ISD::InputArg> &Ins,
14540b57cec5SDimitry Andric                                            SelectionDAG& DAG) const;
14550b57cec5SDimitry Andric     SDValue EmitTailCallLoadRetAddr(SelectionDAG &DAG, SDValue &OutRetAddr,
14560b57cec5SDimitry Andric                                     SDValue Chain, bool IsTailCall,
14570b57cec5SDimitry Andric                                     bool Is64Bit, int FPDiff,
14580b57cec5SDimitry Andric                                     const SDLoc &dl) const;
14590b57cec5SDimitry Andric 
14600b57cec5SDimitry Andric     unsigned GetAlignedArgumentStackSize(unsigned StackSize,
14610b57cec5SDimitry Andric                                          SelectionDAG &DAG) const;
14620b57cec5SDimitry Andric 
14630b57cec5SDimitry Andric     unsigned getAddressSpace(void) const;
14640b57cec5SDimitry Andric 
1465*5ffd83dbSDimitry Andric     SDValue FP_TO_INTHelper(SDValue Op, SelectionDAG &DAG, bool IsSigned,
1466480093f4SDimitry Andric                             SDValue &Chain) const;
1467*5ffd83dbSDimitry Andric     SDValue LRINT_LLRINTHelper(SDNode *N, SelectionDAG &DAG) const;
14680b57cec5SDimitry Andric 
14690b57cec5SDimitry Andric     SDValue LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) const;
14700b57cec5SDimitry Andric     SDValue LowerVSELECT(SDValue Op, SelectionDAG &DAG) const;
14710b57cec5SDimitry Andric     SDValue LowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const;
14720b57cec5SDimitry Andric     SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const;
14730b57cec5SDimitry Andric 
14740b57cec5SDimitry Andric     unsigned getGlobalWrapperKind(const GlobalValue *GV = nullptr,
14750b57cec5SDimitry Andric                                   const unsigned char OpFlags = 0) const;
14760b57cec5SDimitry Andric     SDValue LowerConstantPool(SDValue Op, SelectionDAG &DAG) const;
14770b57cec5SDimitry Andric     SDValue LowerBlockAddress(SDValue Op, SelectionDAG &DAG) const;
14780b57cec5SDimitry Andric     SDValue LowerGlobalAddress(SDValue Op, SelectionDAG &DAG) const;
14790b57cec5SDimitry Andric     SDValue LowerGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) const;
14800b57cec5SDimitry Andric     SDValue LowerExternalSymbol(SDValue Op, SelectionDAG &DAG) const;
14810b57cec5SDimitry Andric 
14820b57cec5SDimitry Andric     /// Creates target global address or external symbol nodes for calls or
14830b57cec5SDimitry Andric     /// other uses.
14840b57cec5SDimitry Andric     SDValue LowerGlobalOrExternal(SDValue Op, SelectionDAG &DAG,
14850b57cec5SDimitry Andric                                   bool ForCall) const;
14860b57cec5SDimitry Andric 
14870b57cec5SDimitry Andric     SDValue LowerSINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
14880b57cec5SDimitry Andric     SDValue LowerUINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
14890b57cec5SDimitry Andric     SDValue LowerTRUNCATE(SDValue Op, SelectionDAG &DAG) const;
14900b57cec5SDimitry Andric     SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG) const;
1491*5ffd83dbSDimitry Andric     SDValue LowerLRINT_LLRINT(SDValue Op, SelectionDAG &DAG) const;
14920b57cec5SDimitry Andric     SDValue LowerSETCC(SDValue Op, SelectionDAG &DAG) const;
14930b57cec5SDimitry Andric     SDValue LowerSETCCCARRY(SDValue Op, SelectionDAG &DAG) const;
14940b57cec5SDimitry Andric     SDValue LowerSELECT(SDValue Op, SelectionDAG &DAG) const;
14950b57cec5SDimitry Andric     SDValue LowerBRCOND(SDValue Op, SelectionDAG &DAG) const;
14960b57cec5SDimitry Andric     SDValue LowerJumpTable(SDValue Op, SelectionDAG &DAG) const;
14970b57cec5SDimitry Andric     SDValue LowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const;
14980b57cec5SDimitry Andric     SDValue LowerVASTART(SDValue Op, SelectionDAG &DAG) const;
14990b57cec5SDimitry Andric     SDValue LowerVAARG(SDValue Op, SelectionDAG &DAG) const;
15000b57cec5SDimitry Andric     SDValue LowerRETURNADDR(SDValue Op, SelectionDAG &DAG) const;
15010b57cec5SDimitry Andric     SDValue LowerADDROFRETURNADDR(SDValue Op, SelectionDAG &DAG) const;
15020b57cec5SDimitry Andric     SDValue LowerFRAMEADDR(SDValue Op, SelectionDAG &DAG) const;
15030b57cec5SDimitry Andric     SDValue LowerFRAME_TO_ARGS_OFFSET(SDValue Op, SelectionDAG &DAG) const;
15040b57cec5SDimitry Andric     SDValue LowerEH_RETURN(SDValue Op, SelectionDAG &DAG) const;
15050b57cec5SDimitry Andric     SDValue lowerEH_SJLJ_SETJMP(SDValue Op, SelectionDAG &DAG) const;
15060b57cec5SDimitry Andric     SDValue lowerEH_SJLJ_LONGJMP(SDValue Op, SelectionDAG &DAG) const;
15070b57cec5SDimitry Andric     SDValue lowerEH_SJLJ_SETUP_DISPATCH(SDValue Op, SelectionDAG &DAG) const;
15080b57cec5SDimitry Andric     SDValue LowerINIT_TRAMPOLINE(SDValue Op, SelectionDAG &DAG) const;
15090b57cec5SDimitry Andric     SDValue LowerFLT_ROUNDS_(SDValue Op, SelectionDAG &DAG) const;
15100b57cec5SDimitry Andric     SDValue LowerWin64_i128OP(SDValue Op, SelectionDAG &DAG) const;
1511480093f4SDimitry Andric     SDValue LowerGC_TRANSITION(SDValue Op, SelectionDAG &DAG) const;
15120b57cec5SDimitry Andric     SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG) const;
15138bcb0991SDimitry Andric     SDValue lowerFaddFsub(SDValue Op, SelectionDAG &DAG) const;
15148bcb0991SDimitry Andric     SDValue LowerFP_EXTEND(SDValue Op, SelectionDAG &DAG) const;
15158bcb0991SDimitry Andric     SDValue LowerFP_ROUND(SDValue Op, SelectionDAG &DAG) const;
15168bcb0991SDimitry Andric 
15178bcb0991SDimitry Andric     SDValue LowerF128Call(SDValue Op, SelectionDAG &DAG,
15188bcb0991SDimitry Andric                           RTLIB::Libcall Call) const;
15190b57cec5SDimitry Andric 
15200b57cec5SDimitry Andric     SDValue
15210b57cec5SDimitry Andric     LowerFormalArguments(SDValue Chain, CallingConv::ID CallConv, bool isVarArg,
15220b57cec5SDimitry Andric                          const SmallVectorImpl<ISD::InputArg> &Ins,
15230b57cec5SDimitry Andric                          const SDLoc &dl, SelectionDAG &DAG,
15240b57cec5SDimitry Andric                          SmallVectorImpl<SDValue> &InVals) const override;
15250b57cec5SDimitry Andric     SDValue LowerCall(CallLoweringInfo &CLI,
15260b57cec5SDimitry Andric                       SmallVectorImpl<SDValue> &InVals) const override;
15270b57cec5SDimitry Andric 
15280b57cec5SDimitry Andric     SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool isVarArg,
15290b57cec5SDimitry Andric                         const SmallVectorImpl<ISD::OutputArg> &Outs,
15300b57cec5SDimitry Andric                         const SmallVectorImpl<SDValue> &OutVals,
15310b57cec5SDimitry Andric                         const SDLoc &dl, SelectionDAG &DAG) const override;
15320b57cec5SDimitry Andric 
15330b57cec5SDimitry Andric     bool supportSplitCSR(MachineFunction *MF) const override {
15340b57cec5SDimitry Andric       return MF->getFunction().getCallingConv() == CallingConv::CXX_FAST_TLS &&
15350b57cec5SDimitry Andric           MF->getFunction().hasFnAttribute(Attribute::NoUnwind);
15360b57cec5SDimitry Andric     }
15370b57cec5SDimitry Andric     void initializeSplitCSR(MachineBasicBlock *Entry) const override;
15380b57cec5SDimitry Andric     void insertCopiesSplitCSR(
15390b57cec5SDimitry Andric       MachineBasicBlock *Entry,
15400b57cec5SDimitry Andric       const SmallVectorImpl<MachineBasicBlock *> &Exits) const override;
15410b57cec5SDimitry Andric 
15420b57cec5SDimitry Andric     bool isUsedByReturnOnly(SDNode *N, SDValue &Chain) const override;
15430b57cec5SDimitry Andric 
15440b57cec5SDimitry Andric     bool mayBeEmittedAsTailCall(const CallInst *CI) const override;
15450b57cec5SDimitry Andric 
15460b57cec5SDimitry Andric     EVT getTypeForExtReturn(LLVMContext &Context, EVT VT,
15470b57cec5SDimitry Andric                             ISD::NodeType ExtendKind) const override;
15480b57cec5SDimitry Andric 
15490b57cec5SDimitry Andric     bool CanLowerReturn(CallingConv::ID CallConv, MachineFunction &MF,
15500b57cec5SDimitry Andric                         bool isVarArg,
15510b57cec5SDimitry Andric                         const SmallVectorImpl<ISD::OutputArg> &Outs,
15520b57cec5SDimitry Andric                         LLVMContext &Context) const override;
15530b57cec5SDimitry Andric 
15540b57cec5SDimitry Andric     const MCPhysReg *getScratchRegisters(CallingConv::ID CC) const override;
15550b57cec5SDimitry Andric 
15560b57cec5SDimitry Andric     TargetLoweringBase::AtomicExpansionKind
1557*5ffd83dbSDimitry Andric     shouldExpandAtomicLoadInIR(LoadInst *LI) const override;
15580b57cec5SDimitry Andric     bool shouldExpandAtomicStoreInIR(StoreInst *SI) const override;
15590b57cec5SDimitry Andric     TargetLoweringBase::AtomicExpansionKind
15600b57cec5SDimitry Andric     shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override;
15610b57cec5SDimitry Andric 
15620b57cec5SDimitry Andric     LoadInst *
15630b57cec5SDimitry Andric     lowerIdempotentRMWIntoFencedLoad(AtomicRMWInst *AI) const override;
15640b57cec5SDimitry Andric 
15658bcb0991SDimitry Andric     bool lowerAtomicStoreAsStoreSDNode(const StoreInst &SI) const override;
15668bcb0991SDimitry Andric     bool lowerAtomicLoadAsLoadSDNode(const LoadInst &LI) const override;
15678bcb0991SDimitry Andric 
15680b57cec5SDimitry Andric     bool needsCmpXchgNb(Type *MemType) const;
15690b57cec5SDimitry Andric 
15700b57cec5SDimitry Andric     void SetupEntryBlockForSjLj(MachineInstr &MI, MachineBasicBlock *MBB,
15710b57cec5SDimitry Andric                                 MachineBasicBlock *DispatchBB, int FI) const;
15720b57cec5SDimitry Andric 
15730b57cec5SDimitry Andric     // Utility function to emit the low-level va_arg code for X86-64.
15740b57cec5SDimitry Andric     MachineBasicBlock *
15750b57cec5SDimitry Andric     EmitVAARG64WithCustomInserter(MachineInstr &MI,
15760b57cec5SDimitry Andric                                   MachineBasicBlock *MBB) const;
15770b57cec5SDimitry Andric 
15780b57cec5SDimitry Andric     /// Utility function to emit the xmm reg save portion of va_start.
15790b57cec5SDimitry Andric     MachineBasicBlock *
15800b57cec5SDimitry Andric     EmitVAStartSaveXMMRegsWithCustomInserter(MachineInstr &BInstr,
15810b57cec5SDimitry Andric                                              MachineBasicBlock *BB) const;
15820b57cec5SDimitry Andric 
15830b57cec5SDimitry Andric     MachineBasicBlock *EmitLoweredCascadedSelect(MachineInstr &MI1,
15840b57cec5SDimitry Andric                                                  MachineInstr &MI2,
15850b57cec5SDimitry Andric                                                  MachineBasicBlock *BB) const;
15860b57cec5SDimitry Andric 
15870b57cec5SDimitry Andric     MachineBasicBlock *EmitLoweredSelect(MachineInstr &I,
15880b57cec5SDimitry Andric                                          MachineBasicBlock *BB) const;
15890b57cec5SDimitry Andric 
15900b57cec5SDimitry Andric     MachineBasicBlock *EmitLoweredCatchRet(MachineInstr &MI,
15910b57cec5SDimitry Andric                                            MachineBasicBlock *BB) const;
15920b57cec5SDimitry Andric 
1593*5ffd83dbSDimitry Andric     MachineBasicBlock *EmitLoweredSegAlloca(MachineInstr &MI,
15940b57cec5SDimitry Andric                                             MachineBasicBlock *BB) const;
15950b57cec5SDimitry Andric 
1596*5ffd83dbSDimitry Andric     MachineBasicBlock *EmitLoweredProbedAlloca(MachineInstr &MI,
15970b57cec5SDimitry Andric                                                MachineBasicBlock *BB) const;
15980b57cec5SDimitry Andric 
15990b57cec5SDimitry Andric     MachineBasicBlock *EmitLoweredTLSAddr(MachineInstr &MI,
16000b57cec5SDimitry Andric                                           MachineBasicBlock *BB) const;
16010b57cec5SDimitry Andric 
16020b57cec5SDimitry Andric     MachineBasicBlock *EmitLoweredTLSCall(MachineInstr &MI,
16030b57cec5SDimitry Andric                                           MachineBasicBlock *BB) const;
16040b57cec5SDimitry Andric 
16050946e70aSDimitry Andric     MachineBasicBlock *EmitLoweredIndirectThunk(MachineInstr &MI,
16060b57cec5SDimitry Andric                                                 MachineBasicBlock *BB) const;
16070b57cec5SDimitry Andric 
16080b57cec5SDimitry Andric     MachineBasicBlock *emitEHSjLjSetJmp(MachineInstr &MI,
16090b57cec5SDimitry Andric                                         MachineBasicBlock *MBB) const;
16100b57cec5SDimitry Andric 
16110b57cec5SDimitry Andric     void emitSetJmpShadowStackFix(MachineInstr &MI,
16120b57cec5SDimitry Andric                                   MachineBasicBlock *MBB) const;
16130b57cec5SDimitry Andric 
16140b57cec5SDimitry Andric     MachineBasicBlock *emitEHSjLjLongJmp(MachineInstr &MI,
16150b57cec5SDimitry Andric                                          MachineBasicBlock *MBB) const;
16160b57cec5SDimitry Andric 
16170b57cec5SDimitry Andric     MachineBasicBlock *emitLongJmpShadowStackFix(MachineInstr &MI,
16180b57cec5SDimitry Andric                                                  MachineBasicBlock *MBB) const;
16190b57cec5SDimitry Andric 
16200b57cec5SDimitry Andric     MachineBasicBlock *EmitSjLjDispatchBlock(MachineInstr &MI,
16210b57cec5SDimitry Andric                                              MachineBasicBlock *MBB) const;
16220b57cec5SDimitry Andric 
16230b57cec5SDimitry Andric     /// Emit flags for the given setcc condition and operands. Also returns the
16240b57cec5SDimitry Andric     /// corresponding X86 condition code constant in X86CC.
1625480093f4SDimitry Andric     SDValue emitFlagsForSetcc(SDValue Op0, SDValue Op1, ISD::CondCode CC,
1626480093f4SDimitry Andric                               const SDLoc &dl, SelectionDAG &DAG,
1627*5ffd83dbSDimitry Andric                               SDValue &X86CC) const;
16280b57cec5SDimitry Andric 
16290b57cec5SDimitry Andric     /// Check if replacement of SQRT with RSQRT should be disabled.
1630*5ffd83dbSDimitry Andric     bool isFsqrtCheap(SDValue Op, SelectionDAG &DAG) const override;
16310b57cec5SDimitry Andric 
16320b57cec5SDimitry Andric     /// Use rsqrt* to speed up sqrt calculations.
1633*5ffd83dbSDimitry Andric     SDValue getSqrtEstimate(SDValue Op, SelectionDAG &DAG, int Enabled,
16340b57cec5SDimitry Andric                             int &RefinementSteps, bool &UseOneConstNR,
16350b57cec5SDimitry Andric                             bool Reciprocal) const override;
16360b57cec5SDimitry Andric 
16370b57cec5SDimitry Andric     /// Use rcp* to speed up fdiv calculations.
1638*5ffd83dbSDimitry Andric     SDValue getRecipEstimate(SDValue Op, SelectionDAG &DAG, int Enabled,
16390b57cec5SDimitry Andric                              int &RefinementSteps) const override;
16400b57cec5SDimitry Andric 
16410b57cec5SDimitry Andric     /// Reassociate floating point divisions into multiply by reciprocal.
16420b57cec5SDimitry Andric     unsigned combineRepeatedFPDivisors() const override;
16438bcb0991SDimitry Andric 
16448bcb0991SDimitry Andric     SDValue BuildSDIVPow2(SDNode *N, const APInt &Divisor, SelectionDAG &DAG,
16458bcb0991SDimitry Andric                           SmallVectorImpl<SDNode *> &Created) const override;
16460b57cec5SDimitry Andric   };
16470b57cec5SDimitry Andric 
16480b57cec5SDimitry Andric   namespace X86 {
16490b57cec5SDimitry Andric     FastISel *createFastISel(FunctionLoweringInfo &funcInfo,
16500b57cec5SDimitry Andric                              const TargetLibraryInfo *libInfo);
16510b57cec5SDimitry Andric   } // end namespace X86
16520b57cec5SDimitry Andric 
16530b57cec5SDimitry Andric   // X86 specific Gather/Scatter nodes.
16540b57cec5SDimitry Andric   // The class has the same order of operands as MaskedGatherScatterSDNode for
16550b57cec5SDimitry Andric   // convenience.
1656*5ffd83dbSDimitry Andric   class X86MaskedGatherScatterSDNode : public MemIntrinsicSDNode {
16570b57cec5SDimitry Andric   public:
1658*5ffd83dbSDimitry Andric     // This is a intended as a utility and should never be directly created.
1659*5ffd83dbSDimitry Andric     X86MaskedGatherScatterSDNode() = delete;
1660*5ffd83dbSDimitry Andric     ~X86MaskedGatherScatterSDNode() = delete;
16610b57cec5SDimitry Andric 
16620b57cec5SDimitry Andric     const SDValue &getBasePtr() const { return getOperand(3); }
16630b57cec5SDimitry Andric     const SDValue &getIndex()   const { return getOperand(4); }
16640b57cec5SDimitry Andric     const SDValue &getMask()    const { return getOperand(2); }
16650b57cec5SDimitry Andric     const SDValue &getScale()   const { return getOperand(5); }
16660b57cec5SDimitry Andric 
16670b57cec5SDimitry Andric     static bool classof(const SDNode *N) {
16680b57cec5SDimitry Andric       return N->getOpcode() == X86ISD::MGATHER ||
16690b57cec5SDimitry Andric              N->getOpcode() == X86ISD::MSCATTER;
16700b57cec5SDimitry Andric     }
16710b57cec5SDimitry Andric   };
16720b57cec5SDimitry Andric 
16730b57cec5SDimitry Andric   class X86MaskedGatherSDNode : public X86MaskedGatherScatterSDNode {
16740b57cec5SDimitry Andric   public:
16750b57cec5SDimitry Andric     const SDValue &getPassThru() const { return getOperand(1); }
16760b57cec5SDimitry Andric 
16770b57cec5SDimitry Andric     static bool classof(const SDNode *N) {
16780b57cec5SDimitry Andric       return N->getOpcode() == X86ISD::MGATHER;
16790b57cec5SDimitry Andric     }
16800b57cec5SDimitry Andric   };
16810b57cec5SDimitry Andric 
16820b57cec5SDimitry Andric   class X86MaskedScatterSDNode : public X86MaskedGatherScatterSDNode {
16830b57cec5SDimitry Andric   public:
16840b57cec5SDimitry Andric     const SDValue &getValue() const { return getOperand(1); }
16850b57cec5SDimitry Andric 
16860b57cec5SDimitry Andric     static bool classof(const SDNode *N) {
16870b57cec5SDimitry Andric       return N->getOpcode() == X86ISD::MSCATTER;
16880b57cec5SDimitry Andric     }
16890b57cec5SDimitry Andric   };
16900b57cec5SDimitry Andric 
16910b57cec5SDimitry Andric   /// Generate unpacklo/unpackhi shuffle mask.
1692*5ffd83dbSDimitry Andric   void createUnpackShuffleMask(MVT VT, SmallVectorImpl<int> &Mask, bool Lo,
1693*5ffd83dbSDimitry Andric                                bool Unary);
16940b57cec5SDimitry Andric 
1695*5ffd83dbSDimitry Andric   /// Similar to unpacklo/unpackhi, but without the 128-bit lane limitation
1696*5ffd83dbSDimitry Andric   /// imposed by AVX and specific to the unary pattern. Example:
1697*5ffd83dbSDimitry Andric   /// v8iX Lo --> <0, 0, 1, 1, 2, 2, 3, 3>
1698*5ffd83dbSDimitry Andric   /// v8iX Hi --> <4, 4, 5, 5, 6, 6, 7, 7>
1699*5ffd83dbSDimitry Andric   void createSplat2ShuffleMask(MVT VT, SmallVectorImpl<int> &Mask, bool Lo);
17000b57cec5SDimitry Andric 
17010b57cec5SDimitry Andric } // end namespace llvm
17020b57cec5SDimitry Andric 
17030b57cec5SDimitry Andric #endif // LLVM_LIB_TARGET_X86_X86ISELLOWERING_H
1704