Target/X86/X86ISelLowering.h

0b57cec5SDimitry Andric//===-- X86ISelLowering.h - X86 DAG Lowering Interface ----------*- C++ -*-===//
0b57cec5SDimitry Andric//
0b57cec5SDimitry Andric// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
0b57cec5SDimitry Andric// See https://llvm.org/LICENSE.txt for license information.
0b57cec5SDimitry Andric// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
0b57cec5SDimitry Andric//
0b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
0b57cec5SDimitry Andric//
0b57cec5SDimitry Andric// This file defines the interfaces that X86 uses to lower LLVM code into a
0b57cec5SDimitry Andric// selection DAG.
0b57cec5SDimitry Andric//
0b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric#ifndef LLVM_LIB_TARGET_X86_X86ISELLOWERING_H
0b57cec5SDimitry Andric#define LLVM_LIB_TARGET_X86_X86ISELLOWERING_H
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric#include "llvm/CodeGen/TargetLowering.h"
0b57cec5SDimitry Andric
0b57cec5SDimitry Andricnamespace llvm {
0b57cec5SDimitry Andric  class X86Subtarget;
0b57cec5SDimitry Andric  class X86TargetMachine;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  namespace X86ISD {
0b57cec5SDimitry Andric    // X86 Specific DAG Nodes
0b57cec5SDimitry Andric  enum NodeType : unsigned {
0b57cec5SDimitry Andric    // Start the numbering where the builtin ops leave off.
0b57cec5SDimitry Andric    FIRST_NUMBER = ISD::BUILTIN_OP_END,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Bit scan forward.
0b57cec5SDimitry Andric    BSF,
0b57cec5SDimitry Andric    /// Bit scan reverse.
0b57cec5SDimitry Andric    BSR,
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric    /// X86 funnel/double shift i16 instructions. These correspond to
*5ffd83dbSDimitry Andric    /// X86::SHLDW and X86::SHRDW instructions which have different amt
*5ffd83dbSDimitry Andric    /// modulo rules to generic funnel shifts.
*5ffd83dbSDimitry Andric    /// NOTE: The operand order matches ISD::FSHL/FSHR not SHLD/SHRD.
*5ffd83dbSDimitry Andric    FSHL,
*5ffd83dbSDimitry Andric    FSHR,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Bitwise logical AND of floating point values. This corresponds
0b57cec5SDimitry Andric    /// to X86::ANDPS or X86::ANDPD.
0b57cec5SDimitry Andric    FAND,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Bitwise logical OR of floating point values. This corresponds
0b57cec5SDimitry Andric    /// to X86::ORPS or X86::ORPD.
0b57cec5SDimitry Andric    FOR,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Bitwise logical XOR of floating point values. This corresponds
0b57cec5SDimitry Andric    /// to X86::XORPS or X86::XORPD.
0b57cec5SDimitry Andric    FXOR,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Bitwise logical ANDNOT of floating point values. This
0b57cec5SDimitry Andric    /// corresponds to X86::ANDNPS or X86::ANDNPD.
0b57cec5SDimitry Andric    FANDN,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// These operations represent an abstract X86 call
0b57cec5SDimitry Andric    /// instruction, which includes a bunch of information.  In particular the
0b57cec5SDimitry Andric    /// operands of these nodes are:
0b57cec5SDimitry Andric    ///
0b57cec5SDimitry Andric    ///     #0 - The incoming token chain
0b57cec5SDimitry Andric    ///     #1 - The callee
0b57cec5SDimitry Andric    ///     #2 - The number of arg bytes the caller pushes on the stack.
0b57cec5SDimitry Andric    ///     #3 - The number of arg bytes the callee pops off the stack.
0b57cec5SDimitry Andric    ///     #4 - The value to pass in AL/AX/EAX (optional)
0b57cec5SDimitry Andric    ///     #5 - The value to pass in DL/DX/EDX (optional)
0b57cec5SDimitry Andric    ///
0b57cec5SDimitry Andric    /// The result values of these nodes are:
0b57cec5SDimitry Andric    ///
0b57cec5SDimitry Andric    ///     #0 - The outgoing token chain
0b57cec5SDimitry Andric    ///     #1 - The first register result value (optional)
0b57cec5SDimitry Andric    ///     #2 - The second register result value (optional)
0b57cec5SDimitry Andric    ///
0b57cec5SDimitry Andric    CALL,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Same as call except it adds the NoTrack prefix.
0b57cec5SDimitry Andric    NT_CALL,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// X86 compare and logical compare instructions.
*5ffd83dbSDimitry Andric    CMP,
*5ffd83dbSDimitry Andric    FCMP,
*5ffd83dbSDimitry Andric    COMI,
*5ffd83dbSDimitry Andric    UCOMI,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// X86 bit-test instructions.
0b57cec5SDimitry Andric    BT,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// X86 SetCC. Operand 0 is condition code, and operand 1 is the EFLAGS
0b57cec5SDimitry Andric    /// operand, usually produced by a CMP instruction.
0b57cec5SDimitry Andric    SETCC,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// X86 Select
0b57cec5SDimitry Andric    SELECTS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Same as SETCC except it's materialized with a sbb and the value is all
0b57cec5SDimitry Andric    // ones or all zeros.
0b57cec5SDimitry Andric    SETCC_CARRY, // R = carry_bit ? ~0 : 0
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// X86 FP SETCC, implemented with CMP{cc}SS/CMP{cc}SD.
0b57cec5SDimitry Andric    /// Operands are two FP values to compare; result is a mask of
0b57cec5SDimitry Andric    /// 0s or 1s.  Generally DTRT for C/C++ with NaNs.
0b57cec5SDimitry Andric    FSETCC,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// X86 FP SETCC, similar to above, but with output as an i1 mask and
0b57cec5SDimitry Andric    /// a version with SAE.
*5ffd83dbSDimitry Andric    FSETCCM,
*5ffd83dbSDimitry Andric    FSETCCM_SAE,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// X86 conditional moves. Operand 0 and operand 1 are the two values
0b57cec5SDimitry Andric    /// to select from. Operand 2 is the condition code, and operand 3 is the
0b57cec5SDimitry Andric    /// flag operand produced by a CMP or TEST instruction.
0b57cec5SDimitry Andric    CMOV,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// X86 conditional branches. Operand 0 is the chain operand, operand 1
0b57cec5SDimitry Andric    /// is the block to branch if condition is true, operand 2 is the
0b57cec5SDimitry Andric    /// condition code, and operand 3 is the flag operand produced by a CMP
0b57cec5SDimitry Andric    /// or TEST instruction.
0b57cec5SDimitry Andric    BRCOND,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// BRIND node with NoTrack prefix. Operand 0 is the chain operand and
0b57cec5SDimitry Andric    /// operand 1 is the target address.
0b57cec5SDimitry Andric    NT_BRIND,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return with a flag operand. Operand 0 is the chain operand, operand
0b57cec5SDimitry Andric    /// 1 is the number of bytes of stack to pop.
0b57cec5SDimitry Andric    RET_FLAG,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return from interrupt. Operand 0 is the number of bytes to pop.
0b57cec5SDimitry Andric    IRET,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Repeat fill, corresponds to X86::REP_STOSx.
0b57cec5SDimitry Andric    REP_STOS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Repeat move, corresponds to X86::REP_MOVSx.
0b57cec5SDimitry Andric    REP_MOVS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// On Darwin, this node represents the result of the popl
0b57cec5SDimitry Andric    /// at function entry, used for PIC code.
0b57cec5SDimitry Andric    GlobalBaseReg,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// A wrapper node for TargetConstantPool, TargetJumpTable,
0b57cec5SDimitry Andric    /// TargetExternalSymbol, TargetGlobalAddress, TargetGlobalTLSAddress,
0b57cec5SDimitry Andric    /// MCSymbol and TargetBlockAddress.
0b57cec5SDimitry Andric    Wrapper,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Special wrapper used under X86-64 PIC mode for RIP
0b57cec5SDimitry Andric    /// relative displacements.
0b57cec5SDimitry Andric    WrapperRIP,
0b57cec5SDimitry Andric
8bcb0991SDimitry Andric    /// Copies a 64-bit value from an MMX vector to the low word
8bcb0991SDimitry Andric    /// of an XMM vector, with the high word zero filled.
8bcb0991SDimitry Andric    MOVQ2DQ,
8bcb0991SDimitry Andric
0b57cec5SDimitry Andric    /// Copies a 64-bit value from the low word of an XMM vector
0b57cec5SDimitry Andric    /// to an MMX vector.
0b57cec5SDimitry Andric    MOVDQ2Q,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Copies a 32-bit value from the low word of an MMX
0b57cec5SDimitry Andric    /// vector to a GPR.
0b57cec5SDimitry Andric    MMX_MOVD2W,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Copies a GPR into the low 32-bit word of an MMX vector
0b57cec5SDimitry Andric    /// and zero out the high word.
0b57cec5SDimitry Andric    MMX_MOVW2D,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Extract an 8-bit value from a vector and zero extend it to
0b57cec5SDimitry Andric    /// i32, corresponds to X86::PEXTRB.
0b57cec5SDimitry Andric    PEXTRB,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Extract a 16-bit value from a vector and zero extend it to
0b57cec5SDimitry Andric    /// i32, corresponds to X86::PEXTRW.
0b57cec5SDimitry Andric    PEXTRW,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Insert any element of a 4 x float vector into any element
0b57cec5SDimitry Andric    /// of a destination 4 x float vector.
0b57cec5SDimitry Andric    INSERTPS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Insert the lower 8-bits of a 32-bit value to a vector,
0b57cec5SDimitry Andric    /// corresponds to X86::PINSRB.
0b57cec5SDimitry Andric    PINSRB,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Insert the lower 16-bits of a 32-bit value to a vector,
0b57cec5SDimitry Andric    /// corresponds to X86::PINSRW.
0b57cec5SDimitry Andric    PINSRW,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Shuffle 16 8-bit values within a vector.
0b57cec5SDimitry Andric    PSHUFB,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Compute Sum of Absolute Differences.
0b57cec5SDimitry Andric    PSADBW,
0b57cec5SDimitry Andric    /// Compute Double Block Packed Sum-Absolute-Differences
0b57cec5SDimitry Andric    DBPSADBW,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Bitwise Logical AND NOT of Packed FP values.
0b57cec5SDimitry Andric    ANDNP,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Blend where the selector is an immediate.
0b57cec5SDimitry Andric    BLENDI,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Dynamic (non-constant condition) vector blend where only the sign bits
0b57cec5SDimitry Andric    /// of the condition elements are used. This is used to enforce that the
0b57cec5SDimitry Andric    /// condition mask is not valid for generic VSELECT optimizations. This
0b57cec5SDimitry Andric    /// is also used to implement the intrinsics.
0b57cec5SDimitry Andric    /// Operands are in VSELECT order: MASK, TRUE, FALSE
0b57cec5SDimitry Andric    BLENDV,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Combined add and sub on an FP vector.
0b57cec5SDimitry Andric    ADDSUB,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    //  FP vector ops with rounding mode.
*5ffd83dbSDimitry Andric    FADD_RND,
*5ffd83dbSDimitry Andric    FADDS,
*5ffd83dbSDimitry Andric    FADDS_RND,
*5ffd83dbSDimitry Andric    FSUB_RND,
*5ffd83dbSDimitry Andric    FSUBS,
*5ffd83dbSDimitry Andric    FSUBS_RND,
*5ffd83dbSDimitry Andric    FMUL_RND,
*5ffd83dbSDimitry Andric    FMULS,
*5ffd83dbSDimitry Andric    FMULS_RND,
*5ffd83dbSDimitry Andric    FDIV_RND,
*5ffd83dbSDimitry Andric    FDIVS,
*5ffd83dbSDimitry Andric    FDIVS_RND,
*5ffd83dbSDimitry Andric    FMAX_SAE,
*5ffd83dbSDimitry Andric    FMAXS_SAE,
*5ffd83dbSDimitry Andric    FMIN_SAE,
*5ffd83dbSDimitry Andric    FMINS_SAE,
*5ffd83dbSDimitry Andric    FSQRT_RND,
*5ffd83dbSDimitry Andric    FSQRTS,
*5ffd83dbSDimitry Andric    FSQRTS_RND,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // FP vector get exponent.
*5ffd83dbSDimitry Andric    FGETEXP,
*5ffd83dbSDimitry Andric    FGETEXP_SAE,
*5ffd83dbSDimitry Andric    FGETEXPS,
*5ffd83dbSDimitry Andric    FGETEXPS_SAE,
0b57cec5SDimitry Andric    // Extract Normalized Mantissas.
*5ffd83dbSDimitry Andric    VGETMANT,
*5ffd83dbSDimitry Andric    VGETMANT_SAE,
*5ffd83dbSDimitry Andric    VGETMANTS,
*5ffd83dbSDimitry Andric    VGETMANTS_SAE,
0b57cec5SDimitry Andric    // FP Scale.
*5ffd83dbSDimitry Andric    SCALEF,
*5ffd83dbSDimitry Andric    SCALEF_RND,
*5ffd83dbSDimitry Andric    SCALEFS,
*5ffd83dbSDimitry Andric    SCALEFS_RND,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Unsigned Integer average.
0b57cec5SDimitry Andric    AVG,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Integer horizontal add/sub.
0b57cec5SDimitry Andric    HADD,
0b57cec5SDimitry Andric    HSUB,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Floating point horizontal add/sub.
0b57cec5SDimitry Andric    FHADD,
0b57cec5SDimitry Andric    FHSUB,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Detect Conflicts Within a Vector
0b57cec5SDimitry Andric    CONFLICT,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Floating point max and min.
*5ffd83dbSDimitry Andric    FMAX,
*5ffd83dbSDimitry Andric    FMIN,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Commutative FMIN and FMAX.
*5ffd83dbSDimitry Andric    FMAXC,
*5ffd83dbSDimitry Andric    FMINC,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Scalar intrinsic floating point max and min.
*5ffd83dbSDimitry Andric    FMAXS,
*5ffd83dbSDimitry Andric    FMINS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Floating point reciprocal-sqrt and reciprocal approximation.
0b57cec5SDimitry Andric    /// Note that these typically require refinement
0b57cec5SDimitry Andric    /// in order to obtain suitable precision.
*5ffd83dbSDimitry Andric    FRSQRT,
*5ffd83dbSDimitry Andric    FRCP,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // AVX-512 reciprocal approximations with a little more precision.
*5ffd83dbSDimitry Andric    RSQRT14,
*5ffd83dbSDimitry Andric    RSQRT14S,
*5ffd83dbSDimitry Andric    RCP14,
*5ffd83dbSDimitry Andric    RCP14S,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Thread Local Storage.
0b57cec5SDimitry Andric    TLSADDR,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Thread Local Storage. A call to get the start address
0b57cec5SDimitry Andric    // of the TLS block for the current module.
0b57cec5SDimitry Andric    TLSBASEADDR,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Thread Local Storage.  When calling to an OS provided
0b57cec5SDimitry Andric    // thunk at the address from an earlier relocation.
0b57cec5SDimitry Andric    TLSCALL,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Exception Handling helpers.
0b57cec5SDimitry Andric    EH_RETURN,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // SjLj exception handling setjmp.
0b57cec5SDimitry Andric    EH_SJLJ_SETJMP,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // SjLj exception handling longjmp.
0b57cec5SDimitry Andric    EH_SJLJ_LONGJMP,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // SjLj exception handling dispatch.
0b57cec5SDimitry Andric    EH_SJLJ_SETUP_DISPATCH,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Tail call return. See X86TargetLowering::LowerCall for
0b57cec5SDimitry Andric    /// the list of operands.
0b57cec5SDimitry Andric    TC_RETURN,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector move to low scalar and zero higher vector elements.
0b57cec5SDimitry Andric    VZEXT_MOVL,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector integer truncate.
0b57cec5SDimitry Andric    VTRUNC,
0b57cec5SDimitry Andric    // Vector integer truncate with unsigned/signed saturation.
*5ffd83dbSDimitry Andric    VTRUNCUS,
*5ffd83dbSDimitry Andric    VTRUNCS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Masked version of the above. Used when less than a 128-bit result is
0b57cec5SDimitry Andric    // produced since the mask only applies to the lower elements and can't
0b57cec5SDimitry Andric    // be represented by a select.
0b57cec5SDimitry Andric    // SRC, PASSTHRU, MASK
*5ffd83dbSDimitry Andric    VMTRUNC,
*5ffd83dbSDimitry Andric    VMTRUNCUS,
*5ffd83dbSDimitry Andric    VMTRUNCS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector FP extend.
*5ffd83dbSDimitry Andric    VFPEXT,
*5ffd83dbSDimitry Andric    VFPEXT_SAE,
*5ffd83dbSDimitry Andric    VFPEXTS,
*5ffd83dbSDimitry Andric    VFPEXTS_SAE,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector FP round.
*5ffd83dbSDimitry Andric    VFPROUND,
*5ffd83dbSDimitry Andric    VFPROUND_RND,
*5ffd83dbSDimitry Andric    VFPROUNDS,
*5ffd83dbSDimitry Andric    VFPROUNDS_RND,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Masked version of above. Used for v2f64->v4f32.
0b57cec5SDimitry Andric    // SRC, PASSTHRU, MASK
0b57cec5SDimitry Andric    VMFPROUND,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // 128-bit vector logical left / right shift
*5ffd83dbSDimitry Andric    VSHLDQ,
*5ffd83dbSDimitry Andric    VSRLDQ,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector shift elements
*5ffd83dbSDimitry Andric    VSHL,
*5ffd83dbSDimitry Andric    VSRL,
*5ffd83dbSDimitry Andric    VSRA,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector variable shift
*5ffd83dbSDimitry Andric    VSHLV,
*5ffd83dbSDimitry Andric    VSRLV,
*5ffd83dbSDimitry Andric    VSRAV,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector shift elements by immediate
*5ffd83dbSDimitry Andric    VSHLI,
*5ffd83dbSDimitry Andric    VSRLI,
*5ffd83dbSDimitry Andric    VSRAI,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Shifts of mask registers.
*5ffd83dbSDimitry Andric    KSHIFTL,
*5ffd83dbSDimitry Andric    KSHIFTR,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Bit rotate by immediate
*5ffd83dbSDimitry Andric    VROTLI,
*5ffd83dbSDimitry Andric    VROTRI,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector packed double/float comparison.
0b57cec5SDimitry Andric    CMPP,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector integer comparisons.
*5ffd83dbSDimitry Andric    PCMPEQ,
*5ffd83dbSDimitry Andric    PCMPGT,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // v8i16 Horizontal minimum and position.
0b57cec5SDimitry Andric    PHMINPOS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    MULTISHIFT,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Vector comparison generating mask bits for fp and
0b57cec5SDimitry Andric    /// integer signed and unsigned data types.
0b57cec5SDimitry Andric    CMPM,
0b57cec5SDimitry Andric    // Vector comparison with SAE for FP values
0b57cec5SDimitry Andric    CMPM_SAE,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Arithmetic operations with FLAGS results.
*5ffd83dbSDimitry Andric    ADD,
*5ffd83dbSDimitry Andric    SUB,
*5ffd83dbSDimitry Andric    ADC,
*5ffd83dbSDimitry Andric    SBB,
*5ffd83dbSDimitry Andric    SMUL,
*5ffd83dbSDimitry Andric    UMUL,
*5ffd83dbSDimitry Andric    OR,
*5ffd83dbSDimitry Andric    XOR,
*5ffd83dbSDimitry Andric    AND,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Bit field extract.
0b57cec5SDimitry Andric    BEXTR,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Zero High Bits Starting with Specified Bit Position.
0b57cec5SDimitry Andric    BZHI,
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric    // Parallel extract and deposit.
*5ffd83dbSDimitry Andric    PDEP,
*5ffd83dbSDimitry Andric    PEXT,
*5ffd83dbSDimitry Andric
0b57cec5SDimitry Andric    // X86-specific multiply by immediate.
0b57cec5SDimitry Andric    MUL_IMM,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector sign bit extraction.
0b57cec5SDimitry Andric    MOVMSK,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector bitwise comparisons.
0b57cec5SDimitry Andric    PTEST,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector packed fp sign bitwise comparisons.
0b57cec5SDimitry Andric    TESTP,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // OR/AND test for masks.
0b57cec5SDimitry Andric    KORTEST,
0b57cec5SDimitry Andric    KTEST,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // ADD for masks.
0b57cec5SDimitry Andric    KADD,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Several flavors of instructions with vector shuffle behaviors.
0b57cec5SDimitry Andric    // Saturated signed/unsigned packing.
0b57cec5SDimitry Andric    PACKSS,
0b57cec5SDimitry Andric    PACKUS,
0b57cec5SDimitry Andric    // Intra-lane alignr.
0b57cec5SDimitry Andric    PALIGNR,
0b57cec5SDimitry Andric    // AVX512 inter-lane alignr.
0b57cec5SDimitry Andric    VALIGN,
0b57cec5SDimitry Andric    PSHUFD,
0b57cec5SDimitry Andric    PSHUFHW,
0b57cec5SDimitry Andric    PSHUFLW,
0b57cec5SDimitry Andric    SHUFP,
0b57cec5SDimitry Andric    // VBMI2 Concat & Shift.
0b57cec5SDimitry Andric    VSHLD,
0b57cec5SDimitry Andric    VSHRD,
0b57cec5SDimitry Andric    VSHLDV,
0b57cec5SDimitry Andric    VSHRDV,
0b57cec5SDimitry Andric    // Shuffle Packed Values at 128-bit granularity.
0b57cec5SDimitry Andric    SHUF128,
0b57cec5SDimitry Andric    MOVDDUP,
0b57cec5SDimitry Andric    MOVSHDUP,
0b57cec5SDimitry Andric    MOVSLDUP,
0b57cec5SDimitry Andric    MOVLHPS,
0b57cec5SDimitry Andric    MOVHLPS,
0b57cec5SDimitry Andric    MOVSD,
0b57cec5SDimitry Andric    MOVSS,
0b57cec5SDimitry Andric    UNPCKL,
0b57cec5SDimitry Andric    UNPCKH,
0b57cec5SDimitry Andric    VPERMILPV,
0b57cec5SDimitry Andric    VPERMILPI,
0b57cec5SDimitry Andric    VPERMI,
0b57cec5SDimitry Andric    VPERM2X128,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Variable Permute (VPERM).
0b57cec5SDimitry Andric    // Res = VPERMV MaskV, V0
0b57cec5SDimitry Andric    VPERMV,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // 3-op Variable Permute (VPERMT2).
0b57cec5SDimitry Andric    // Res = VPERMV3 V0, MaskV, V1
0b57cec5SDimitry Andric    VPERMV3,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Bitwise ternary logic.
0b57cec5SDimitry Andric    VPTERNLOG,
0b57cec5SDimitry Andric    // Fix Up Special Packed Float32/64 values.
*5ffd83dbSDimitry Andric    VFIXUPIMM,
*5ffd83dbSDimitry Andric    VFIXUPIMM_SAE,
*5ffd83dbSDimitry Andric    VFIXUPIMMS,
*5ffd83dbSDimitry Andric    VFIXUPIMMS_SAE,
0b57cec5SDimitry Andric    // Range Restriction Calculation For Packed Pairs of Float32/64 values.
*5ffd83dbSDimitry Andric    VRANGE,
*5ffd83dbSDimitry Andric    VRANGE_SAE,
*5ffd83dbSDimitry Andric    VRANGES,
*5ffd83dbSDimitry Andric    VRANGES_SAE,
0b57cec5SDimitry Andric    // Reduce - Perform Reduction Transformation on scalar/packed FP.
*5ffd83dbSDimitry Andric    VREDUCE,
*5ffd83dbSDimitry Andric    VREDUCE_SAE,
*5ffd83dbSDimitry Andric    VREDUCES,
*5ffd83dbSDimitry Andric    VREDUCES_SAE,
0b57cec5SDimitry Andric    // RndScale - Round FP Values To Include A Given Number Of Fraction Bits.
0b57cec5SDimitry Andric    // Also used by the legacy (V)ROUND intrinsics where we mask out the
0b57cec5SDimitry Andric    // scaling part of the immediate.
*5ffd83dbSDimitry Andric    VRNDSCALE,
*5ffd83dbSDimitry Andric    VRNDSCALE_SAE,
*5ffd83dbSDimitry Andric    VRNDSCALES,
*5ffd83dbSDimitry Andric    VRNDSCALES_SAE,
0b57cec5SDimitry Andric    // Tests the types of FP values for packed types.
0b57cec5SDimitry Andric    VFPCLASS,
0b57cec5SDimitry Andric    // Tests the types of FP values for scalar types.
0b57cec5SDimitry Andric    VFPCLASSS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Broadcast (splat) scalar or element 0 of a vector. If the operand is
0b57cec5SDimitry Andric    // a vector, this node may change the vector length as part of the splat.
0b57cec5SDimitry Andric    VBROADCAST,
0b57cec5SDimitry Andric    // Broadcast mask to vector.
0b57cec5SDimitry Andric    VBROADCASTM,
0b57cec5SDimitry Andric    // Broadcast subvector to vector.
0b57cec5SDimitry Andric    SUBV_BROADCAST,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// SSE4A Extraction and Insertion.
*5ffd83dbSDimitry Andric    EXTRQI,
*5ffd83dbSDimitry Andric    INSERTQI,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // XOP arithmetic/logical shifts.
*5ffd83dbSDimitry Andric    VPSHA,
*5ffd83dbSDimitry Andric    VPSHL,
0b57cec5SDimitry Andric    // XOP signed/unsigned integer comparisons.
*5ffd83dbSDimitry Andric    VPCOM,
*5ffd83dbSDimitry Andric    VPCOMU,
0b57cec5SDimitry Andric    // XOP packed permute bytes.
0b57cec5SDimitry Andric    VPPERM,
0b57cec5SDimitry Andric    // XOP two source permutation.
0b57cec5SDimitry Andric    VPERMIL2,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector multiply packed unsigned doubleword integers.
0b57cec5SDimitry Andric    PMULUDQ,
0b57cec5SDimitry Andric    // Vector multiply packed signed doubleword integers.
0b57cec5SDimitry Andric    PMULDQ,
0b57cec5SDimitry Andric    // Vector Multiply Packed Unsigned Integers with Round and Scale.
0b57cec5SDimitry Andric    MULHRS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Multiply and Add Packed Integers.
*5ffd83dbSDimitry Andric    VPMADDUBSW,
*5ffd83dbSDimitry Andric    VPMADDWD,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // AVX512IFMA multiply and add.
0b57cec5SDimitry Andric    // NOTE: These are different than the instruction and perform
0b57cec5SDimitry Andric    // op0 x op1 + op2.
*5ffd83dbSDimitry Andric    VPMADD52L,
*5ffd83dbSDimitry Andric    VPMADD52H,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // VNNI
0b57cec5SDimitry Andric    VPDPBUSD,
0b57cec5SDimitry Andric    VPDPBUSDS,
0b57cec5SDimitry Andric    VPDPWSSD,
0b57cec5SDimitry Andric    VPDPWSSDS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // FMA nodes.
0b57cec5SDimitry Andric    // We use the target independent ISD::FMA for the non-inverted case.
0b57cec5SDimitry Andric    FNMADD,
0b57cec5SDimitry Andric    FMSUB,
0b57cec5SDimitry Andric    FNMSUB,
0b57cec5SDimitry Andric    FMADDSUB,
0b57cec5SDimitry Andric    FMSUBADD,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // FMA with rounding mode.
0b57cec5SDimitry Andric    FMADD_RND,
0b57cec5SDimitry Andric    FNMADD_RND,
0b57cec5SDimitry Andric    FMSUB_RND,
0b57cec5SDimitry Andric    FNMSUB_RND,
0b57cec5SDimitry Andric    FMADDSUB_RND,
0b57cec5SDimitry Andric    FMSUBADD_RND,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Compress and expand.
0b57cec5SDimitry Andric    COMPRESS,
0b57cec5SDimitry Andric    EXPAND,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Bits shuffle
0b57cec5SDimitry Andric    VPSHUFBITQMB,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Convert Signed/Unsigned Integer to Floating-Point with rounding mode.
*5ffd83dbSDimitry Andric    SINT_TO_FP_RND,
*5ffd83dbSDimitry Andric    UINT_TO_FP_RND,
*5ffd83dbSDimitry Andric    SCALAR_SINT_TO_FP,
*5ffd83dbSDimitry Andric    SCALAR_UINT_TO_FP,
*5ffd83dbSDimitry Andric    SCALAR_SINT_TO_FP_RND,
*5ffd83dbSDimitry Andric    SCALAR_UINT_TO_FP_RND,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector float/double to signed/unsigned integer.
*5ffd83dbSDimitry Andric    CVTP2SI,
*5ffd83dbSDimitry Andric    CVTP2UI,
*5ffd83dbSDimitry Andric    CVTP2SI_RND,
*5ffd83dbSDimitry Andric    CVTP2UI_RND,
0b57cec5SDimitry Andric    // Scalar float/double to signed/unsigned integer.
*5ffd83dbSDimitry Andric    CVTS2SI,
*5ffd83dbSDimitry Andric    CVTS2UI,
*5ffd83dbSDimitry Andric    CVTS2SI_RND,
*5ffd83dbSDimitry Andric    CVTS2UI_RND,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector float/double to signed/unsigned integer with truncation.
*5ffd83dbSDimitry Andric    CVTTP2SI,
*5ffd83dbSDimitry Andric    CVTTP2UI,
*5ffd83dbSDimitry Andric    CVTTP2SI_SAE,
*5ffd83dbSDimitry Andric    CVTTP2UI_SAE,
0b57cec5SDimitry Andric    // Scalar float/double to signed/unsigned integer with truncation.
*5ffd83dbSDimitry Andric    CVTTS2SI,
*5ffd83dbSDimitry Andric    CVTTS2UI,
*5ffd83dbSDimitry Andric    CVTTS2SI_SAE,
*5ffd83dbSDimitry Andric    CVTTS2UI_SAE,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector signed/unsigned integer to float/double.
*5ffd83dbSDimitry Andric    CVTSI2P,
*5ffd83dbSDimitry Andric    CVTUI2P,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Masked versions of above. Used for v2f64->v4f32.
0b57cec5SDimitry Andric    // SRC, PASSTHRU, MASK
*5ffd83dbSDimitry Andric    MCVTP2SI,
*5ffd83dbSDimitry Andric    MCVTP2UI,
*5ffd83dbSDimitry Andric    MCVTTP2SI,
*5ffd83dbSDimitry Andric    MCVTTP2UI,
*5ffd83dbSDimitry Andric    MCVTSI2P,
*5ffd83dbSDimitry Andric    MCVTUI2P,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector float to bfloat16.
0b57cec5SDimitry Andric    // Convert TWO packed single data to one packed BF16 data
0b57cec5SDimitry Andric    CVTNE2PS2BF16,
0b57cec5SDimitry Andric    // Convert packed single data to packed BF16 data
0b57cec5SDimitry Andric    CVTNEPS2BF16,
0b57cec5SDimitry Andric    // Masked version of above.
0b57cec5SDimitry Andric    // SRC, PASSTHRU, MASK
0b57cec5SDimitry Andric    MCVTNEPS2BF16,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Dot product of BF16 pairs accumulated into
0b57cec5SDimitry Andric    // packed single precision.
0b57cec5SDimitry Andric    DPBF16PS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Save xmm argument registers to the stack, according to %al. An operator
0b57cec5SDimitry Andric    // is needed so that this can be expanded with control flow.
0b57cec5SDimitry Andric    VASTART_SAVE_XMM_REGS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Windows's _chkstk call to do stack probing.
0b57cec5SDimitry Andric    WIN_ALLOCA,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // For allocating variable amounts of stack space when using
0b57cec5SDimitry Andric    // segmented stacks. Check if the current stacklet has enough space, and
0b57cec5SDimitry Andric    // fall back to heap allocation if not.
0b57cec5SDimitry Andric    SEG_ALLOCA,
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric    // For allocating stack space when using stack clash protector.
*5ffd83dbSDimitry Andric    // Allocation is performed by block, and each block is probed.
*5ffd83dbSDimitry Andric    PROBED_ALLOCA,
*5ffd83dbSDimitry Andric
0b57cec5SDimitry Andric    // Memory barriers.
0b57cec5SDimitry Andric    MEMBARRIER,
0b57cec5SDimitry Andric    MFENCE,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Get a random integer and indicate whether it is valid in CF.
0b57cec5SDimitry Andric    RDRAND,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Get a NIST SP800-90B & C compliant random integer and
0b57cec5SDimitry Andric    // indicate whether it is valid in CF.
0b57cec5SDimitry Andric    RDSEED,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Protection keys
0b57cec5SDimitry Andric    // RDPKRU - Operand 0 is chain. Operand 1 is value for ECX.
0b57cec5SDimitry Andric    // WRPKRU - Operand 0 is chain. Operand 1 is value for EDX. Operand 2 is
0b57cec5SDimitry Andric    // value for ECX.
*5ffd83dbSDimitry Andric    RDPKRU,
*5ffd83dbSDimitry Andric    WRPKRU,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // SSE42 string comparisons.
0b57cec5SDimitry Andric    // These nodes produce 3 results, index, mask, and flags. X86ISelDAGToDAG
0b57cec5SDimitry Andric    // will emit one or two instructions based on which results are used. If
0b57cec5SDimitry Andric    // flags and index/mask are both used, this allows us to use a single
0b57cec5SDimitry Andric    // instruction since we won't have to pick an opcode for flags. Instead we
0b57cec5SDimitry Andric    // can rely on the DAG to CSE everything and decide at isel.
0b57cec5SDimitry Andric    PCMPISTR,
0b57cec5SDimitry Andric    PCMPESTR,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Test if in transactional execution.
0b57cec5SDimitry Andric    XTEST,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // ERI instructions.
*5ffd83dbSDimitry Andric    RSQRT28,
*5ffd83dbSDimitry Andric    RSQRT28_SAE,
*5ffd83dbSDimitry Andric    RSQRT28S,
*5ffd83dbSDimitry Andric    RSQRT28S_SAE,
*5ffd83dbSDimitry Andric    RCP28,
*5ffd83dbSDimitry Andric    RCP28_SAE,
*5ffd83dbSDimitry Andric    RCP28S,
*5ffd83dbSDimitry Andric    RCP28S_SAE,
*5ffd83dbSDimitry Andric    EXP2,
*5ffd83dbSDimitry Andric    EXP2_SAE,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Conversions between float and half-float.
*5ffd83dbSDimitry Andric    CVTPS2PH,
*5ffd83dbSDimitry Andric    CVTPH2PS,
*5ffd83dbSDimitry Andric    CVTPH2PS_SAE,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Masked version of above.
0b57cec5SDimitry Andric    // SRC, RND, PASSTHRU, MASK
0b57cec5SDimitry Andric    MCVTPS2PH,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Galois Field Arithmetic Instructions
*5ffd83dbSDimitry Andric    GF2P8AFFINEINVQB,
*5ffd83dbSDimitry Andric    GF2P8AFFINEQB,
*5ffd83dbSDimitry Andric    GF2P8MULB,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // LWP insert record.
0b57cec5SDimitry Andric    LWPINS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // User level wait
*5ffd83dbSDimitry Andric    UMWAIT,
*5ffd83dbSDimitry Andric    TPAUSE,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Enqueue Stores Instructions
*5ffd83dbSDimitry Andric    ENQCMD,
*5ffd83dbSDimitry Andric    ENQCMDS,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // For avx512-vp2intersect
0b57cec5SDimitry Andric    VP2INTERSECT,
0b57cec5SDimitry Andric
480093f4SDimitry Andric    /// X86 strict FP compare instructions.
480093f4SDimitry Andric    STRICT_FCMP = ISD::FIRST_TARGET_STRICTFP_OPCODE,
480093f4SDimitry Andric    STRICT_FCMPS,
480093f4SDimitry Andric
480093f4SDimitry Andric    // Vector packed double/float comparison.
480093f4SDimitry Andric    STRICT_CMPP,
480093f4SDimitry Andric
480093f4SDimitry Andric    /// Vector comparison generating mask bits for fp and
480093f4SDimitry Andric    /// integer signed and unsigned data types.
480093f4SDimitry Andric    STRICT_CMPM,
480093f4SDimitry Andric
480093f4SDimitry Andric    // Vector float/double to signed/unsigned integer with truncation.
*5ffd83dbSDimitry Andric    STRICT_CVTTP2SI,
*5ffd83dbSDimitry Andric    STRICT_CVTTP2UI,
480093f4SDimitry Andric
480093f4SDimitry Andric    // Vector FP extend.
480093f4SDimitry Andric    STRICT_VFPEXT,
480093f4SDimitry Andric
480093f4SDimitry Andric    // Vector FP round.
480093f4SDimitry Andric    STRICT_VFPROUND,
480093f4SDimitry Andric
480093f4SDimitry Andric    // RndScale - Round FP Values To Include A Given Number Of Fraction Bits.
480093f4SDimitry Andric    // Also used by the legacy (V)ROUND intrinsics where we mask out the
480093f4SDimitry Andric    // scaling part of the immediate.
480093f4SDimitry Andric    STRICT_VRNDSCALE,
480093f4SDimitry Andric
480093f4SDimitry Andric    // Vector signed/unsigned integer to float/double.
*5ffd83dbSDimitry Andric    STRICT_CVTSI2P,
*5ffd83dbSDimitry Andric    STRICT_CVTUI2P,
*5ffd83dbSDimitry Andric
*5ffd83dbSDimitry Andric    // Strict FMA nodes.
*5ffd83dbSDimitry Andric    STRICT_FNMADD,
*5ffd83dbSDimitry Andric    STRICT_FMSUB,
*5ffd83dbSDimitry Andric    STRICT_FNMSUB,
*5ffd83dbSDimitry Andric
*5ffd83dbSDimitry Andric    // Conversions between float and half-float.
*5ffd83dbSDimitry Andric    STRICT_CVTPS2PH,
*5ffd83dbSDimitry Andric    STRICT_CVTPH2PS,
480093f4SDimitry Andric
0b57cec5SDimitry Andric    // Compare and swap.
0b57cec5SDimitry Andric    LCMPXCHG_DAG = ISD::FIRST_TARGET_MEMORY_OPCODE,
0b57cec5SDimitry Andric    LCMPXCHG8_DAG,
0b57cec5SDimitry Andric    LCMPXCHG16_DAG,
0b57cec5SDimitry Andric    LCMPXCHG8_SAVE_EBX_DAG,
0b57cec5SDimitry Andric    LCMPXCHG16_SAVE_RBX_DAG,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// LOCK-prefixed arithmetic read-modify-write instructions.
0b57cec5SDimitry Andric    /// EFLAGS, OUTCHAIN = LADD(INCHAIN, PTR, RHS)
*5ffd83dbSDimitry Andric    LADD,
*5ffd83dbSDimitry Andric    LSUB,
*5ffd83dbSDimitry Andric    LOR,
*5ffd83dbSDimitry Andric    LXOR,
*5ffd83dbSDimitry Andric    LAND,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Load, scalar_to_vector, and zero extend.
0b57cec5SDimitry Andric    VZEXT_LOAD,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // extract_vector_elt, store.
0b57cec5SDimitry Andric    VEXTRACT_STORE,
0b57cec5SDimitry Andric
8bcb0991SDimitry Andric    // scalar broadcast from memory
8bcb0991SDimitry Andric    VBROADCAST_LOAD,
8bcb0991SDimitry Andric
0b57cec5SDimitry Andric    // Store FP control word into i16 memory.
0b57cec5SDimitry Andric    FNSTCW16m,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// This instruction implements FP_TO_SINT with the
0b57cec5SDimitry Andric    /// integer destination in memory and a FP reg source.  This corresponds
0b57cec5SDimitry Andric    /// to the X86::FIST*m instructions and the rounding mode change stuff. It
0b57cec5SDimitry Andric    /// has two inputs (token chain and address) and two outputs (int value
0b57cec5SDimitry Andric    /// and token chain). Memory VT specifies the type to store to.
0b57cec5SDimitry Andric    FP_TO_INT_IN_MEM,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// This instruction implements SINT_TO_FP with the
0b57cec5SDimitry Andric    /// integer source in memory and FP reg result.  This corresponds to the
0b57cec5SDimitry Andric    /// X86::FILD*m instructions. It has two inputs (token chain and address)
*5ffd83dbSDimitry Andric    /// and two outputs (FP value and token chain). The integer source type is
*5ffd83dbSDimitry Andric    /// specified by the memory VT.
0b57cec5SDimitry Andric    FILD,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// This instruction implements a fp->int store from FP stack
0b57cec5SDimitry Andric    /// slots. This corresponds to the fist instruction. It takes a
0b57cec5SDimitry Andric    /// chain operand, value to store, address, and glue. The memory VT
0b57cec5SDimitry Andric    /// specifies the type to store as.
0b57cec5SDimitry Andric    FIST,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// This instruction implements an extending load to FP stack slots.
0b57cec5SDimitry Andric    /// This corresponds to the X86::FLD32m / X86::FLD64m. It takes a chain
0b57cec5SDimitry Andric    /// operand, and ptr to load from. The memory VT specifies the type to
0b57cec5SDimitry Andric    /// load from.
0b57cec5SDimitry Andric    FLD,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// This instruction implements a truncating store from FP stack
0b57cec5SDimitry Andric    /// slots. This corresponds to the X86::FST32m / X86::FST64m. It takes a
0b57cec5SDimitry Andric    /// chain operand, value to store, address, and glue. The memory VT
0b57cec5SDimitry Andric    /// specifies the type to store as.
0b57cec5SDimitry Andric    FST,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// This instruction grabs the address of the next argument
0b57cec5SDimitry Andric    /// from a va_list. (reads and modifies the va_list in memory)
0b57cec5SDimitry Andric    VAARG_64,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Vector truncating store with unsigned/signed saturation
*5ffd83dbSDimitry Andric    VTRUNCSTOREUS,
*5ffd83dbSDimitry Andric    VTRUNCSTORES,
0b57cec5SDimitry Andric    // Vector truncating masked store with unsigned/signed saturation
*5ffd83dbSDimitry Andric    VMTRUNCSTOREUS,
*5ffd83dbSDimitry Andric    VMTRUNCSTORES,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // X86 specific gather and scatter
*5ffd83dbSDimitry Andric    MGATHER,
*5ffd83dbSDimitry Andric    MSCATTER,
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // WARNING: Do not add anything at the end unless you want the node to
0b57cec5SDimitry Andric    // have a memop! In fact, starting from FIRST_TARGET_MEMORY_OPCODE all
0b57cec5SDimitry Andric    // opcodes will be treated as target memory ops!
0b57cec5SDimitry Andric  };
0b57cec5SDimitry Andric  } // end namespace X86ISD
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  /// Define some predicates that are used for node matching.
0b57cec5SDimitry Andric  namespace X86 {
0b57cec5SDimitry Andric    /// Returns true if Elt is a constant zero or floating point constant +0.0.
0b57cec5SDimitry Andric    bool isZeroNode(SDValue Elt);
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Returns true if the given offset fits into the displacement
0b57cec5SDimitry Andric    /// field of the instruction.
0b57cec5SDimitry Andric    bool isOffsetSuitableForCodeModel(int64_t Offset, CodeModel::Model M,
0b57cec5SDimitry Andric                                      bool hasSymbolicDisplacement = true);
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Determines whether the callee is required to pop its
0b57cec5SDimitry Andric    /// own arguments. Callee pop is necessary to support tail calls.
0b57cec5SDimitry Andric    bool isCalleePop(CallingConv::ID CallingConv,
0b57cec5SDimitry Andric                     bool is64Bit, bool IsVarArg, bool GuaranteeTCO);
0b57cec5SDimitry Andric
8bcb0991SDimitry Andric    /// If Op is a constant whose elements are all the same constant or
8bcb0991SDimitry Andric    /// undefined, return true and return the constant value in \p SplatVal.
*5ffd83dbSDimitry Andric    /// If we have undef bits that don't cover an entire element, we treat these
*5ffd83dbSDimitry Andric    /// as zero if \p AllowPartialUndefs is set, else we fail and return false.
*5ffd83dbSDimitry Andric    bool isConstantSplat(SDValue Op, APInt &SplatVal,
*5ffd83dbSDimitry Andric                         bool AllowPartialUndefs = true);
0b57cec5SDimitry Andric  } // end namespace X86
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  //===--------------------------------------------------------------------===//
0b57cec5SDimitry Andric  //  X86 Implementation of the TargetLowering interface
0b57cec5SDimitry Andric  class X86TargetLowering final : public TargetLowering {
0b57cec5SDimitry Andric  public:
0b57cec5SDimitry Andric    explicit X86TargetLowering(const X86TargetMachine &TM,
0b57cec5SDimitry Andric                               const X86Subtarget &STI);
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    unsigned getJumpTableEncoding() const override;
0b57cec5SDimitry Andric    bool useSoftFloat() const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    void markLibCallAttributes(MachineFunction *MF, unsigned CC,
0b57cec5SDimitry Andric                               ArgListTy &Args) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    MVT getScalarShiftAmountTy(const DataLayout &, EVT VT) const override {
      // The scalar shift amount type is always i8 here; neither the
      // DataLayout nor VT is consulted.
0b57cec5SDimitry Andric      return MVT::i8;
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    const MCExpr *
0b57cec5SDimitry Andric    LowerCustomJumpTableEntry(const MachineJumpTableInfo *MJTI,
0b57cec5SDimitry Andric                              const MachineBasicBlock *MBB, unsigned uid,
0b57cec5SDimitry Andric                              MCContext &Ctx) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Returns relocation base for the given PIC jumptable.
0b57cec5SDimitry Andric    SDValue getPICJumpTableRelocBase(SDValue Table,
0b57cec5SDimitry Andric                                     SelectionDAG &DAG) const override;
0b57cec5SDimitry Andric    const MCExpr *
0b57cec5SDimitry Andric    getPICJumpTableRelocBaseExpr(const MachineFunction *MF,
0b57cec5SDimitry Andric                                 unsigned JTI, MCContext &Ctx) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return the desired alignment for ByVal aggregate
0b57cec5SDimitry Andric    /// function arguments in the caller parameter area. For X86, aggregates
0b57cec5SDimitry Andric    /// that contain SSE vectors are placed at 16-byte boundaries while the
0b57cec5SDimitry Andric    /// rest are at 4-byte boundaries.
    /// NOTE(review): "SSE vectors" restores the object that was missing from
    /// this sentence -- confirm against the implementation.
0b57cec5SDimitry Andric    unsigned getByValTypeAlignment(Type *Ty,
0b57cec5SDimitry Andric                                   const DataLayout &DL) const override;
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric    EVT getOptimalMemOpType(const MemOp &Op,
0b57cec5SDimitry Andric                            const AttributeList &FuncAttributes) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Returns true if it's safe to use load / store of the
0b57cec5SDimitry Andric    /// specified type to expand memcpy / memset inline. This is mostly true
0b57cec5SDimitry Andric    /// for all types except for some special cases. For example, on X86
0b57cec5SDimitry Andric    /// targets without SSE2 f64 load / store are done with fldl / fstpl which
0b57cec5SDimitry Andric    /// also does type conversion. Note the specified type doesn't have to be
0b57cec5SDimitry Andric    /// legal as the hook is used before type legalization.
0b57cec5SDimitry Andric    bool isSafeMemOpType(MVT VT) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Returns true if the target allows unaligned memory accesses of the
0b57cec5SDimitry Andric    /// specified type. Returns whether it is "fast" in the last argument.
0b57cec5SDimitry Andric    bool allowsMisalignedMemoryAccesses(EVT VT, unsigned AS, unsigned Align,
0b57cec5SDimitry Andric                                        MachineMemOperand::Flags Flags,
0b57cec5SDimitry Andric                                        bool *Fast) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Provide custom lowering hooks for some operations.
0b57cec5SDimitry Andric    ///
0b57cec5SDimitry Andric    SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Places new result values for the node in Results (their number
0b57cec5SDimitry Andric    /// and types must exactly match those of the original return values of
0b57cec5SDimitry Andric    /// the node), or leaves Results empty, which indicates that the node is not
0b57cec5SDimitry Andric    /// to be custom lowered after all.
0b57cec5SDimitry Andric    void LowerOperationWrapper(SDNode *N,
0b57cec5SDimitry Andric                               SmallVectorImpl<SDValue> &Results,
0b57cec5SDimitry Andric                               SelectionDAG &DAG) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Replace the results of node with an illegal result
0b57cec5SDimitry Andric    /// type with new values built out of custom code.
0b57cec5SDimitry Andric    ///
0b57cec5SDimitry Andric    void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue>&Results,
0b57cec5SDimitry Andric                            SelectionDAG &DAG) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return true if the target has native support for
0b57cec5SDimitry Andric    /// the specified value type and it is 'desirable' to use the type for the
0b57cec5SDimitry Andric    /// given node type. e.g. On x86 i16 is legal, but undesirable since i16
0b57cec5SDimitry Andric    /// instruction encodings are longer and some i16 instructions are slow.
0b57cec5SDimitry Andric    bool isTypeDesirableForOp(unsigned Opc, EVT VT) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return true if the target has native support for the
0b57cec5SDimitry Andric    /// specified value type and it is 'desirable' to use the type. e.g. On x86
0b57cec5SDimitry Andric    /// i16 is legal, but undesirable since i16 instruction encodings are longer
0b57cec5SDimitry Andric    /// and some i16 instructions are slow.
0b57cec5SDimitry Andric    bool IsDesirableToPromoteOp(SDValue Op, EVT &PVT) const override;
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric    /// Return the newly negated expression if the cost is not expensive, and
*5ffd83dbSDimitry Andric    /// set \p Cost to indicate whether it is cheaper or neutral to do the
*5ffd83dbSDimitry Andric    /// negation.
8bcb0991SDimitry Andric    SDValue getNegatedExpression(SDValue Op, SelectionDAG &DAG,
8bcb0991SDimitry Andric                                 bool LegalOperations, bool ForCodeSize,
*5ffd83dbSDimitry Andric                                 NegatibleCost &Cost,
8bcb0991SDimitry Andric                                 unsigned Depth) const override;
8bcb0991SDimitry Andric
0b57cec5SDimitry Andric    MachineBasicBlock *
0b57cec5SDimitry Andric    EmitInstrWithCustomInserter(MachineInstr &MI,
0b57cec5SDimitry Andric                                MachineBasicBlock *MBB) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// This method returns the name of a target specific DAG node.
0b57cec5SDimitry Andric    const char *getTargetNodeName(unsigned Opcode) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Do not merge vector stores after legalization because that may conflict
0b57cec5SDimitry Andric    /// with x86-specific store splitting optimizations.
    /// Returns true only when \p MemVT is not a vector type.
0b57cec5SDimitry Andric    bool mergeStoresAfterLegalization(EVT MemVT) const override {
0b57cec5SDimitry Andric      return !MemVT.isVector();
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool canMergeStoresTo(unsigned AddressSpace, EVT MemVT,
0b57cec5SDimitry Andric                          const SelectionDAG &DAG) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool isCheapToSpeculateCttz() const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool isCheapToSpeculateCtlz() const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool isCtlzFast() const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool hasBitPreservingFPLogic(EVT VT) const override {
      // True for scalar f32 and f64, and for any vector type.
0b57cec5SDimitry Andric      return VT == MVT::f32 || VT == MVT::f64 || VT.isVector();
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool isMultiStoresCheaperThanBitsMerge(EVT LTy, EVT HTy) const override {
      // Returns true only for a mixed pair, i.e. when one of LTy/HTy is
      // floating point and the other is integer; false for everything else.
      //
0b57cec5SDimitry Andric      // If the pair to store is a mixture of float and int values, we will
0b57cec5SDimitry Andric      // save two bitwise instructions and one float-to-int instruction at the
0b57cec5SDimitry Andric      // cost of one extra store instruction. There is potentially a more
0b57cec5SDimitry Andric      // significant benefit because it avoids the float->int domain switch
0b57cec5SDimitry Andric      // for the input value, so it is more likely a win.
0b57cec5SDimitry Andric      if ((LTy.isFloatingPoint() && HTy.isInteger()) ||
0b57cec5SDimitry Andric          (LTy.isInteger() && HTy.isFloatingPoint()))
0b57cec5SDimitry Andric        return true;
0b57cec5SDimitry Andric      // If the pair only contains int values, we will save two bitwise
0b57cec5SDimitry Andric      // instructions at the cost of one extra store instruction (costing one
0b57cec5SDimitry Andric      // more store buffer). Since the benefit is less clear, we leave such
0b57cec5SDimitry Andric      // pairs out until we get a testcase to prove it is a win.
0b57cec5SDimitry Andric      return false;
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool isMaskAndCmp0FoldingBeneficial(const Instruction &AndI) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool hasAndNotCompare(SDValue Y) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool hasAndNot(SDValue Y) const override;
0b57cec5SDimitry Andric
8bcb0991SDimitry Andric    bool hasBitTest(SDValue X, SDValue Y) const override;
8bcb0991SDimitry Andric
8bcb0991SDimitry Andric    bool shouldProduceAndByConstByHoistingConstFromShiftsLHSOfAnd(
8bcb0991SDimitry Andric        SDValue X, ConstantSDNode *XC, ConstantSDNode *CC, SDValue Y,
8bcb0991SDimitry Andric        unsigned OldShiftOpcode, unsigned NewShiftOpcode,
8bcb0991SDimitry Andric        SelectionDAG &DAG) const override;
8bcb0991SDimitry Andric
0b57cec5SDimitry Andric    bool shouldFoldConstantShiftPairToMask(const SDNode *N,
0b57cec5SDimitry Andric                                           CombineLevel Level) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool shouldFoldMaskToVariableShiftPair(SDValue Y) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool
0b57cec5SDimitry Andric    shouldTransformSignedTruncationCheck(EVT XVT,
0b57cec5SDimitry Andric                                         unsigned KeptBits) const override {
      // Returns true only when XVT is a scalar and both XVT and the integer
      // type of width KeptBits pass the VTIsOk check below.
      //
0b57cec5SDimitry Andric      // For vectors, we don't have a preference, so decline.
0b57cec5SDimitry Andric      if (XVT.isVector())
0b57cec5SDimitry Andric        return false;
0b57cec5SDimitry Andric
      // Accepts exactly i8, i16, i32 and i64.
0b57cec5SDimitry Andric      auto VTIsOk = [](EVT VT) -> bool {
0b57cec5SDimitry Andric        return VT == MVT::i8 || VT == MVT::i16 || VT == MVT::i32 ||
0b57cec5SDimitry Andric               VT == MVT::i64;
0b57cec5SDimitry Andric      };
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric      // We are ok with KeptBitsVT being byte/word/dword, what MOVS supports.
0b57cec5SDimitry Andric      // XVT will be larger than KeptBitsVT.
      // NOTE(review): VTIsOk itself would also accept an i64 KeptBitsVT; the
      // "XVT is larger" remark above is not checked in this function.
0b57cec5SDimitry Andric      MVT KeptBitsVT = MVT::getIntegerVT(KeptBits);
0b57cec5SDimitry Andric      return VTIsOk(XVT) && VTIsOk(KeptBitsVT);
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool shouldExpandShift(SelectionDAG &DAG, SDNode *N) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool shouldSplatInsEltVarIndex(EVT VT) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool convertSetCCLogicToBitwiseLogic(EVT VT) const override {
      // Opt in for scalar integer types only.
0b57cec5SDimitry Andric      return VT.isScalarInteger();
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Vector-sized comparisons are fast using PCMPEQ + PMOVMSK or PTEST.
0b57cec5SDimitry Andric    MVT hasFastEqualityCompare(unsigned NumBits) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return the value type to use for ISD::SETCC.
0b57cec5SDimitry Andric    EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Context,
0b57cec5SDimitry Andric                           EVT VT) const override;
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric    bool targetShrinkDemandedConstant(SDValue Op, const APInt &DemandedBits,
*5ffd83dbSDimitry Andric                                      const APInt &DemandedElts,
0b57cec5SDimitry Andric                                      TargetLoweringOpt &TLO) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Determine which bits of \p Op are known to be either zero or one and
0b57cec5SDimitry Andric    /// return them in \p Known.
0b57cec5SDimitry Andric    void computeKnownBitsForTargetNode(const SDValue Op,
0b57cec5SDimitry Andric                                       KnownBits &Known,
0b57cec5SDimitry Andric                                       const APInt &DemandedElts,
0b57cec5SDimitry Andric                                       const SelectionDAG &DAG,
0b57cec5SDimitry Andric                                       unsigned Depth = 0) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Determine the number of bits in the operation that are sign bits.
0b57cec5SDimitry Andric    unsigned ComputeNumSignBitsForTargetNode(SDValue Op,
0b57cec5SDimitry Andric                                             const APInt &DemandedElts,
0b57cec5SDimitry Andric                                             const SelectionDAG &DAG,
0b57cec5SDimitry Andric                                             unsigned Depth) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool SimplifyDemandedVectorEltsForTargetNode(SDValue Op,
0b57cec5SDimitry Andric                                                 const APInt &DemandedElts,
0b57cec5SDimitry Andric                                                 APInt &KnownUndef,
0b57cec5SDimitry Andric                                                 APInt &KnownZero,
0b57cec5SDimitry Andric                                                 TargetLoweringOpt &TLO,
0b57cec5SDimitry Andric                                                 unsigned Depth) const override;
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric    bool SimplifyDemandedVectorEltsForTargetShuffle(SDValue Op,
*5ffd83dbSDimitry Andric                                                    const APInt &DemandedElts,
*5ffd83dbSDimitry Andric                                                    unsigned MaskIndex,
*5ffd83dbSDimitry Andric                                                    TargetLoweringOpt &TLO,
*5ffd83dbSDimitry Andric                                                    unsigned Depth) const;
*5ffd83dbSDimitry Andric
0b57cec5SDimitry Andric    bool SimplifyDemandedBitsForTargetNode(SDValue Op,
0b57cec5SDimitry Andric                                           const APInt &DemandedBits,
0b57cec5SDimitry Andric                                           const APInt &DemandedElts,
0b57cec5SDimitry Andric                                           KnownBits &Known,
0b57cec5SDimitry Andric                                           TargetLoweringOpt &TLO,
0b57cec5SDimitry Andric                                           unsigned Depth) const override;
0b57cec5SDimitry Andric
8bcb0991SDimitry Andric    SDValue SimplifyMultipleUseDemandedBitsForTargetNode(
8bcb0991SDimitry Andric        SDValue Op, const APInt &DemandedBits, const APInt &DemandedElts,
8bcb0991SDimitry Andric        SelectionDAG &DAG, unsigned Depth) const override;
8bcb0991SDimitry Andric
0b57cec5SDimitry Andric    const Constant *getTargetConstantFromLoad(LoadSDNode *LD) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    SDValue unwrapAddress(SDValue N) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    SDValue getReturnAddressFrameIndex(SelectionDAG &DAG) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool ExpandInlineAsm(CallInst *CI) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    ConstraintType getConstraintType(StringRef Constraint) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Examine constraint string and operand type and determine a weight value.
0b57cec5SDimitry Andric    /// The operand object must already have been set up with the operand type.
0b57cec5SDimitry Andric    ConstraintWeight
0b57cec5SDimitry Andric      getSingleConstraintMatchWeight(AsmOperandInfo &info,
0b57cec5SDimitry Andric                                     const char *constraint) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    const char *LowerXConstraint(EVT ConstraintVT) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Lower the specified operand into the Ops vector. If it is invalid, don't
0b57cec5SDimitry Andric    /// add anything to Ops.
    /// NOTE(review): older text here described a hasMemory flag; the
    /// signature below takes no such parameter.
0b57cec5SDimitry Andric    void LowerAsmOperandForConstraint(SDValue Op,
0b57cec5SDimitry Andric                                      std::string &Constraint,
0b57cec5SDimitry Andric                                      std::vector<SDValue> &Ops,
0b57cec5SDimitry Andric                                      SelectionDAG &DAG) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    unsigned
0b57cec5SDimitry Andric    getInlineAsmMemConstraint(StringRef ConstraintCode) const override {
      // Map the "o", "v" and "X" constraint codes to their InlineAsm
      // constants; any other code is deferred to the TargetLowering base
      // implementation.
480093f4SDimitry Andric      if (ConstraintCode == "o")
0b57cec5SDimitry Andric        return InlineAsm::Constraint_o;
0b57cec5SDimitry Andric      else if (ConstraintCode == "v")
0b57cec5SDimitry Andric        return InlineAsm::Constraint_v;
0b57cec5SDimitry Andric      else if (ConstraintCode == "X")
0b57cec5SDimitry Andric        return InlineAsm::Constraint_X;
0b57cec5SDimitry Andric      return TargetLowering::getInlineAsmMemConstraint(ConstraintCode);
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Handle Lowering flag assembly outputs.
0b57cec5SDimitry Andric    SDValue LowerAsmOutputForConstraint(SDValue &Chain, SDValue &Flag, SDLoc DL,
0b57cec5SDimitry Andric                                        const AsmOperandInfo &Constraint,
0b57cec5SDimitry Andric                                        SelectionDAG &DAG) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Given a physical register constraint
0b57cec5SDimitry Andric    /// (e.g. {edx}), return the register number and the register class for the
0b57cec5SDimitry Andric    /// register.  This should only be used for C_Register constraints.  On
0b57cec5SDimitry Andric    /// error, this returns a register number of 0.
0b57cec5SDimitry Andric    std::pair<unsigned, const TargetRegisterClass *>
0b57cec5SDimitry Andric    getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI,
0b57cec5SDimitry Andric                                 StringRef Constraint, MVT VT) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return true if the addressing mode represented
0b57cec5SDimitry Andric    /// by AM is legal for this target, for a load/store of the specified type.
0b57cec5SDimitry Andric    bool isLegalAddressingMode(const DataLayout &DL, const AddrMode &AM,
0b57cec5SDimitry Andric                               Type *Ty, unsigned AS,
0b57cec5SDimitry Andric                               Instruction *I = nullptr) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return true if the specified immediate is legal
0b57cec5SDimitry Andric    /// icmp immediate, that is the target has icmp instructions which can
0b57cec5SDimitry Andric    /// compare a register against the immediate without having to materialize
0b57cec5SDimitry Andric    /// the immediate into a register.
0b57cec5SDimitry Andric    bool isLegalICmpImmediate(int64_t Imm) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return true if the specified immediate is legal
0b57cec5SDimitry Andric    /// add immediate, that is the target has add instructions which can
0b57cec5SDimitry Andric    /// add a register and the immediate without having to materialize
0b57cec5SDimitry Andric    /// the immediate into a register.
0b57cec5SDimitry Andric    bool isLegalAddImmediate(int64_t Imm) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool isLegalStoreImmediate(int64_t Imm) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return the cost of the scaling factor used in the addressing
0b57cec5SDimitry Andric    /// mode represented by AM for this target, for a load/store
0b57cec5SDimitry Andric    /// of the specified type.
0b57cec5SDimitry Andric    /// If the AM is supported, the return value must be >= 0.
0b57cec5SDimitry Andric    /// If the AM is not supported, it returns a negative value.
0b57cec5SDimitry Andric    int getScalingFactorCost(const DataLayout &DL, const AddrMode &AM, Type *Ty,
0b57cec5SDimitry Andric                             unsigned AS) const override;
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric    /// This is used to enable splatted operand transforms for vector shifts
*5ffd83dbSDimitry Andric    /// and vector funnel shifts.
0b57cec5SDimitry Andric    bool isVectorShiftByScalarCheap(Type *Ty) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Add x86-specific opcodes to the default list.
0b57cec5SDimitry Andric    bool isBinOp(unsigned Opcode) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Returns true if the opcode is a commutative binary operation.
0b57cec5SDimitry Andric    bool isCommutativeBinOp(unsigned Opcode) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return true if it's free to truncate a value of
0b57cec5SDimitry Andric    /// type Ty1 to type Ty2. e.g. On x86 it's free to truncate an i32 value in
0b57cec5SDimitry Andric    /// register EAX to i16 by referencing its sub-register AX.
0b57cec5SDimitry Andric    bool isTruncateFree(Type *Ty1, Type *Ty2) const override;
0b57cec5SDimitry Andric    bool isTruncateFree(EVT VT1, EVT VT2) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool allowTruncateForTailCall(Type *Ty1, Type *Ty2) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return true if any actual instruction that defines a
0b57cec5SDimitry Andric    /// value of type Ty1 implicitly zero-extends the value to Ty2 in the result
0b57cec5SDimitry Andric    /// register. This does not necessarily include registers defined in
0b57cec5SDimitry Andric    /// unknown ways, such as incoming arguments, or copies from unknown
0b57cec5SDimitry Andric    /// virtual registers. Also, if isTruncateFree(Ty2, Ty1) is true, this
0b57cec5SDimitry Andric    /// does not necessarily apply to truncate instructions. e.g. on x86-64,
0b57cec5SDimitry Andric    /// all instructions that define 32-bit values implicitly zero-extend the
0b57cec5SDimitry Andric    /// result out to 64 bits.
0b57cec5SDimitry Andric    bool isZExtFree(Type *Ty1, Type *Ty2) const override;
0b57cec5SDimitry Andric    bool isZExtFree(EVT VT1, EVT VT2) const override;
0b57cec5SDimitry Andric    bool isZExtFree(SDValue Val, EVT VT2) const override;
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric    bool shouldSinkOperands(Instruction *I,
*5ffd83dbSDimitry Andric                            SmallVectorImpl<Use *> &Ops) const override;
*5ffd83dbSDimitry Andric    bool shouldConvertPhiType(Type *From, Type *To) const override;
*5ffd83dbSDimitry Andric
0b57cec5SDimitry Andric    /// Return true if folding a vector load into ExtVal (a sign, zero, or any
0b57cec5SDimitry Andric    /// extend node) is profitable.
0b57cec5SDimitry Andric    bool isVectorLoadExtDesirable(SDValue) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return true if an FMA operation is faster than a pair of fmul and fadd
0b57cec5SDimitry Andric    /// instructions. fmuladd intrinsics will be expanded to FMAs when this
0b57cec5SDimitry Andric    /// method returns true, otherwise fmuladd is expanded to fmul + fadd.
480093f4SDimitry Andric    bool isFMAFasterThanFMulAndFAdd(const MachineFunction &MF,
480093f4SDimitry Andric                                    EVT VT) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return true if it's profitable to narrow
0b57cec5SDimitry Andric    /// operations of type VT1 to VT2. e.g. on x86, it's profitable to narrow
0b57cec5SDimitry Andric    /// from i32 to i8 but not from i32 to i16.
0b57cec5SDimitry Andric    bool isNarrowingProfitable(EVT VT1, EVT VT2) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Given an intrinsic, checks if on the target the intrinsic will need to map
0b57cec5SDimitry Andric    /// to a MemIntrinsicNode (touches memory). If this is the case, it returns
0b57cec5SDimitry Andric    /// true and stores the intrinsic information into the IntrinsicInfo that was
0b57cec5SDimitry Andric    /// passed to the function.
0b57cec5SDimitry Andric    bool getTgtMemIntrinsic(IntrinsicInfo &Info, const CallInst &I,
0b57cec5SDimitry Andric                            MachineFunction &MF,
0b57cec5SDimitry Andric                            unsigned Intrinsic) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Returns true if the target can instruction select the
0b57cec5SDimitry Andric    /// specified FP immediate natively. If false, the legalizer will
0b57cec5SDimitry Andric    /// materialize the FP immediate as a load from a constant pool.
0b57cec5SDimitry Andric    bool isFPImmLegal(const APFloat &Imm, EVT VT,
0b57cec5SDimitry Andric                      bool ForCodeSize) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Targets can use this to indicate that they only support *some*
0b57cec5SDimitry Andric    /// VECTOR_SHUFFLE operations, those with specific masks. By default, if a
0b57cec5SDimitry Andric    /// target supports the VECTOR_SHUFFLE node, all mask values are assumed to
0b57cec5SDimitry Andric    /// be legal.
0b57cec5SDimitry Andric    bool isShuffleMaskLegal(ArrayRef<int> Mask, EVT VT) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Similar to isShuffleMaskLegal. Targets can use this to indicate if there
0b57cec5SDimitry Andric    /// is a suitable VECTOR_SHUFFLE that can be used to replace a VAND with a
0b57cec5SDimitry Andric    /// constant pool entry.
0b57cec5SDimitry Andric    bool isVectorClearMaskLegal(ArrayRef<int> Mask, EVT VT) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Returns true if lowering to a jump table is allowed.
0b57cec5SDimitry Andric    bool areJTsAllowed(const Function *Fn) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return true if instruction selection should try to shrink an FP
0b57cec5SDimitry Andric    /// constant of type \p VT to a smaller type to save space and/or runtime.
0b57cec5SDimitry Andric    /// True whenever X86ScalarSSEf64 is unset, and always true for MVT::f80.
0b57cec5SDimitry Andric    bool ShouldShrinkFPConstant(EVT VT) const override {
0b57cec5SDimitry Andric      // Don't shrink FP constant-pool entries when SSE2 is available: cvtss2sd
0b57cec5SDimitry Andric      // is more expensive than a straight movsd. Long double (f80) constants
0b57cec5SDimitry Andric      // are still shrunk because fldt is very slow.
0b57cec5SDimitry Andric      return !X86ScalarSSEf64 || VT == MVT::f80;
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return true if we believe it is correct and profitable to reduce the
0b57cec5SDimitry Andric    /// load node to a smaller type.
0b57cec5SDimitry Andric    bool shouldReduceLoadWidth(SDNode *Load, ISD::LoadExtType ExtTy,
0b57cec5SDimitry Andric                               EVT NewVT) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return true if the scalar FP type \p VT is computed in an SSE register
0b57cec5SDimitry Andric    /// rather than on the x87 floating point stack. Only f32 and f64 qualify.
0b57cec5SDimitry Andric    bool isScalarFPTypeInSSEReg(EVT VT) const {
0b57cec5SDimitry Andric      return (VT == MVT::f64 && X86ScalarSSEf64) || // f64 requires SSE2
0b57cec5SDimitry Andric             (VT == MVT::f32 && X86ScalarSSEf32);   // f32 requires SSE1
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Returns true if it is beneficial to convert a load of a constant
0b57cec5SDimitry Andric    /// to just the constant itself.
0b57cec5SDimitry Andric    bool shouldConvertConstantLoadToIntImm(const APInt &Imm,
0b57cec5SDimitry Andric                                           Type *Ty) const override;
0b57cec5SDimitry Andric
8bcb0991SDimitry Andric    bool reduceSelectOfFPConstantLoads(EVT CmpOpVT) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool convertSelectOfConstantsToMath(EVT VT) const override;
0b57cec5SDimitry Andric
8bcb0991SDimitry Andric    bool decomposeMulByConstant(LLVMContext &Context, EVT VT,
8bcb0991SDimitry Andric                                SDValue C) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return true if EXTRACT_SUBVECTOR is cheap for this result type
0b57cec5SDimitry Andric    /// with this index.
0b57cec5SDimitry Andric    bool isExtractSubvectorCheap(EVT ResVT, EVT SrcVT,
0b57cec5SDimitry Andric                                 unsigned Index) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Scalar ops always have equal or better analysis/performance/power than
0b57cec5SDimitry Andric    /// the vector equivalent, so this always makes sense if the scalar op is
0b57cec5SDimitry Andric    /// supported.
0b57cec5SDimitry Andric    bool shouldScalarizeBinop(SDValue) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Extracting a scalar f32/f64 value from index 0 of a vector is free.
    /// Every other element type or index is reported as not cheap.
0b57cec5SDimitry Andric    bool isExtractVecEltCheap(EVT VT, unsigned Index) const override {
0b57cec5SDimitry Andric      EVT EltVT = VT.getScalarType(); // only the scalar type is inspected
0b57cec5SDimitry Andric      return (EltVT == MVT::f32 || EltVT == MVT::f64) && Index == 0;
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Overflow nodes should get combined/lowered to optimal instructions
0b57cec5SDimitry Andric    /// (they should allow eliminating explicit compares by getting flags from
0b57cec5SDimitry Andric    /// math ops).
*5ffd83dbSDimitry Andric    bool shouldFormOverflowOp(unsigned Opcode, EVT VT,
*5ffd83dbSDimitry Andric                              bool MathUsed) const override;
0b57cec5SDimitry Andric
    /// Return true if storing a vector constant should be treated as cheap.
    /// The decision depends only on \p NumElem (it must exceed 2); \p MemVT
    /// and \p AddrSpace are not consulted by this implementation.
0b57cec5SDimitry Andric    bool storeOfVectorConstantIsCheap(EVT MemVT, unsigned NumElem,
0b57cec5SDimitry Andric                                      unsigned AddrSpace) const override {
0b57cec5SDimitry Andric      // If we can replace more than 2 scalar stores, there will be a reduction
0b57cec5SDimitry Andric      // in instructions even after we add a vector constant load.
0b57cec5SDimitry Andric      return NumElem > 2;
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool isLoadBitCastBeneficial(EVT LoadVT, EVT BitcastVT,
0b57cec5SDimitry Andric                                 const SelectionDAG &DAG,
0b57cec5SDimitry Andric                                 const MachineMemOperand &MMO) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Intel processors have a unified instruction and data cache, so no
    /// clear-cache builtin name is provided: this always returns nullptr.
0b57cec5SDimitry Andric    const char * getClearCacheBuiltinName() const override {
0b57cec5SDimitry Andric      return nullptr; // nothing to do, move along.
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric
480093f4SDimitry Andric    Register getRegisterByName(const char* RegName, LLT VT,
8bcb0991SDimitry Andric                               const MachineFunction &MF) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// If a physical register, this returns the register that receives the
0b57cec5SDimitry Andric    /// exception address on entry to an EH pad.
*5ffd83dbSDimitry Andric    Register
0b57cec5SDimitry Andric    getExceptionPointerRegister(const Constant *PersonalityFn) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// If a physical register, this returns the register that receives the
0b57cec5SDimitry Andric    /// exception typeid on entry to a landing pad.
*5ffd83dbSDimitry Andric    Register
0b57cec5SDimitry Andric    getExceptionSelectorRegister(const Constant *PersonalityFn) const override;
0b57cec5SDimitry Andric
    /// NOTE(review): presumably reports whether this target requires catch
    /// objects to live at fixed frame locations; the definition is not
    /// visible here, so confirm against the TargetLowering base declaration.
0b57cec5SDimitry Andric    bool needsFixedCatchObjects() const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// This method returns a target specific FastISel object,
0b57cec5SDimitry Andric    /// or null if the target does not support "fast" ISel.
0b57cec5SDimitry Andric    FastISel *createFastISel(FunctionLoweringInfo &funcInfo,
0b57cec5SDimitry Andric                             const TargetLibraryInfo *libInfo) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// If the target has a standard location for the stack protector cookie,
0b57cec5SDimitry Andric    /// returns the address of that location. Otherwise, returns nullptr.
0b57cec5SDimitry Andric    Value *getIRStackGuard(IRBuilder<> &IRB) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool useLoadStackGuardNode() const override;
0b57cec5SDimitry Andric    bool useStackGuardXorFP() const override;
0b57cec5SDimitry Andric    void insertSSPDeclarations(Module &M) const override;
0b57cec5SDimitry Andric    Value *getSDagStackGuard(const Module &M) const override;
0b57cec5SDimitry Andric    Function *getSSPStackGuardCheck(const Module &M) const override;
0b57cec5SDimitry Andric    SDValue emitStackGuardXorFP(SelectionDAG &DAG, SDValue Val,
0b57cec5SDimitry Andric                                const SDLoc &DL) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Return the location of the SafeStack pointer as a Value, covering
0b57cec5SDimitry Andric    /// targets that store it at a fixed offset in some non-standard address
0b57cec5SDimitry Andric    /// space.
0b57cec5SDimitry Andric    Value *getSafeStackPointerLocation(IRBuilder<> &IRB) const override;
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric    std::pair<SDValue, SDValue> BuildFILD(EVT DstVT, EVT SrcVT, const SDLoc &DL,
*5ffd83dbSDimitry Andric                                          SDValue Chain, SDValue Pointer,
*5ffd83dbSDimitry Andric                                          MachinePointerInfo PtrInfo,
*5ffd83dbSDimitry Andric                                          Align Alignment,
0b57cec5SDimitry Andric                                          SelectionDAG &DAG) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool isNoopAddrSpaceCast(unsigned SrcAS, unsigned DestAS) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Customize the preferred legalization strategy for certain types.
0b57cec5SDimitry Andric    LegalizeTypeAction getPreferredVectorAction(MVT VT) const override;
0b57cec5SDimitry Andric
    /// Always returns true for X86.
    /// NOTE(review): presumably opts in to the "soft promote" legalization
    /// strategy for the half (f16) type; confirm against TargetLowering.
*5ffd83dbSDimitry Andric    bool softPromoteHalfType() const override { return true; }
*5ffd83dbSDimitry Andric
0b57cec5SDimitry Andric    MVT getRegisterTypeForCallingConv(LLVMContext &Context, CallingConv::ID CC,
0b57cec5SDimitry Andric                                      EVT VT) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    unsigned getNumRegistersForCallingConv(LLVMContext &Context,
0b57cec5SDimitry Andric                                           CallingConv::ID CC,
0b57cec5SDimitry Andric                                           EVT VT) const override;
0b57cec5SDimitry Andric
8bcb0991SDimitry Andric    unsigned getVectorTypeBreakdownForCallingConv(
8bcb0991SDimitry Andric        LLVMContext &Context, CallingConv::ID CC, EVT VT, EVT &IntermediateVT,
8bcb0991SDimitry Andric        unsigned &NumIntermediates, MVT &RegisterVT) const override;
8bcb0991SDimitry Andric
0b57cec5SDimitry Andric    bool isIntDivCheap(EVT VT, AttributeList Attr) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool supportSwiftError() const override;
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric    bool hasStackProbeSymbol(MachineFunction &MF) const override;
*5ffd83dbSDimitry Andric    bool hasInlineStackProbe(MachineFunction &MF) const override;
0b57cec5SDimitry Andric    StringRef getStackProbeSymbolName(MachineFunction &MF) const override;
0b57cec5SDimitry Andric
8bcb0991SDimitry Andric    unsigned getStackProbeSize(MachineFunction &MF) const;
8bcb0991SDimitry Andric
    /// Always returns true for X86.
    /// NOTE(review): presumably tells generic code that vector blend
    /// operations are available on this target; confirm against TargetLowering.
0b57cec5SDimitry Andric    bool hasVectorBlend() const override { return true; }
0b57cec5SDimitry Andric
    /// Return the largest interleave factor this target reports as supported,
    /// which is the constant 4.
    /// NOTE(review): presumably bounds the Factor passed to
    /// lowerInterleavedLoad / lowerInterleavedStore; confirm with the caller.
0b57cec5SDimitry Andric    unsigned getMaxSupportedInterleaveFactor() const override { return 4; }
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Lower interleaved load(s) into target specific
0b57cec5SDimitry Andric    /// instructions/intrinsics.
0b57cec5SDimitry Andric    bool lowerInterleavedLoad(LoadInst *LI,
0b57cec5SDimitry Andric                              ArrayRef<ShuffleVectorInst *> Shuffles,
0b57cec5SDimitry Andric                              ArrayRef<unsigned> Indices,
0b57cec5SDimitry Andric                              unsigned Factor) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Lower interleaved store(s) into target specific
0b57cec5SDimitry Andric    /// instructions/intrinsics.
0b57cec5SDimitry Andric    bool lowerInterleavedStore(StoreInst *SI, ShuffleVectorInst *SVI,
0b57cec5SDimitry Andric                               unsigned Factor) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    SDValue expandIndirectJTBranch(const SDLoc& dl, SDValue Value,
0b57cec5SDimitry Andric                                   SDValue Addr, SelectionDAG &DAG)
0b57cec5SDimitry Andric                                   const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  protected:
0b57cec5SDimitry Andric    std::pair<const TargetRegisterClass *, uint8_t>
0b57cec5SDimitry Andric    findRepresentativeClass(const TargetRegisterInfo *TRI,
0b57cec5SDimitry Andric                            MVT VT) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  private:
0b57cec5SDimitry Andric    /// Keep a reference to the X86Subtarget around so that we can
0b57cec5SDimitry Andric    /// make the right decision when generating code for different targets.
0b57cec5SDimitry Andric    const X86Subtarget &Subtarget;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Select between SSE or x87 floating point ops.
0b57cec5SDimitry Andric    /// When SSE is available, use it for f32 operations.
0b57cec5SDimitry Andric    /// When SSE2 is available, use it for f64 operations.
0b57cec5SDimitry Andric    bool X86ScalarSSEf32;
0b57cec5SDimitry Andric    bool X86ScalarSSEf64;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// A list of legal FP immediates.
0b57cec5SDimitry Andric    std::vector<APFloat> LegalFPImmediates;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Record \p Imm as an FP immediate that this x86 target can instruction
0b57cec5SDimitry Andric    /// select natively by appending a copy of it to LegalFPImmediates.
    /// No check for duplicates is made.
0b57cec5SDimitry Andric    void addLegalFPImmediate(const APFloat& Imm) {
0b57cec5SDimitry Andric      LegalFPImmediates.push_back(Imm);
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    SDValue LowerCallResult(SDValue Chain, SDValue InFlag,
0b57cec5SDimitry Andric                            CallingConv::ID CallConv, bool isVarArg,
0b57cec5SDimitry Andric                            const SmallVectorImpl<ISD::InputArg> &Ins,
0b57cec5SDimitry Andric                            const SDLoc &dl, SelectionDAG &DAG,
0b57cec5SDimitry Andric                            SmallVectorImpl<SDValue> &InVals,
0b57cec5SDimitry Andric                            uint32_t *RegMask) const;
0b57cec5SDimitry Andric    SDValue LowerMemArgument(SDValue Chain, CallingConv::ID CallConv,
0b57cec5SDimitry Andric                             const SmallVectorImpl<ISD::InputArg> &ArgInfo,
0b57cec5SDimitry Andric                             const SDLoc &dl, SelectionDAG &DAG,
0b57cec5SDimitry Andric                             const CCValAssign &VA, MachineFrameInfo &MFI,
0b57cec5SDimitry Andric                             unsigned i) const;
0b57cec5SDimitry Andric    SDValue LowerMemOpCallTo(SDValue Chain, SDValue StackPtr, SDValue Arg,
0b57cec5SDimitry Andric                             const SDLoc &dl, SelectionDAG &DAG,
0b57cec5SDimitry Andric                             const CCValAssign &VA,
*5ffd83dbSDimitry Andric                             ISD::ArgFlagsTy Flags, bool isByval) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Call lowering helpers.
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Check whether the call is eligible for tail call optimization. Targets
0b57cec5SDimitry Andric    /// that want to do tail call optimization should implement this function.
0b57cec5SDimitry Andric    bool IsEligibleForTailCallOptimization(SDValue Callee,
0b57cec5SDimitry Andric                                           CallingConv::ID CalleeCC,
0b57cec5SDimitry Andric                                           bool isVarArg,
0b57cec5SDimitry Andric                                           bool isCalleeStructRet,
0b57cec5SDimitry Andric                                           bool isCallerStructRet,
0b57cec5SDimitry Andric                                           Type *RetTy,
0b57cec5SDimitry Andric                                    const SmallVectorImpl<ISD::OutputArg> &Outs,
0b57cec5SDimitry Andric                                    const SmallVectorImpl<SDValue> &OutVals,
0b57cec5SDimitry Andric                                    const SmallVectorImpl<ISD::InputArg> &Ins,
0b57cec5SDimitry Andric                                           SelectionDAG& DAG) const;
0b57cec5SDimitry Andric    SDValue EmitTailCallLoadRetAddr(SelectionDAG &DAG, SDValue &OutRetAddr,
0b57cec5SDimitry Andric                                    SDValue Chain, bool IsTailCall,
0b57cec5SDimitry Andric                                    bool Is64Bit, int FPDiff,
0b57cec5SDimitry Andric                                    const SDLoc &dl) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    unsigned GetAlignedArgumentStackSize(unsigned StackSize,
0b57cec5SDimitry Andric                                         SelectionDAG &DAG) const;
0b57cec5SDimitry Andric
    /// NOTE(review): which address space this returns is not documented in
    /// this header; confirm against the definition in X86ISelLowering.cpp.
0b57cec5SDimitry Andric    unsigned getAddressSpace() const;
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric    SDValue FP_TO_INTHelper(SDValue Op, SelectionDAG &DAG, bool IsSigned,
480093f4SDimitry Andric                            SDValue &Chain) const;
*5ffd83dbSDimitry Andric    SDValue LRINT_LLRINTHelper(SDNode *N, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    SDValue LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerVSELECT(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    unsigned getGlobalWrapperKind(const GlobalValue *GV = nullptr,
0b57cec5SDimitry Andric                                  const unsigned char OpFlags = 0) const;
0b57cec5SDimitry Andric    SDValue LowerConstantPool(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerBlockAddress(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerGlobalAddress(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerExternalSymbol(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Creates target global address or external symbol nodes for calls or
0b57cec5SDimitry Andric    /// other uses.
0b57cec5SDimitry Andric    SDValue LowerGlobalOrExternal(SDValue Op, SelectionDAG &DAG,
0b57cec5SDimitry Andric                                  bool ForCall) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    SDValue LowerSINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerUINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerTRUNCATE(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG) const;
*5ffd83dbSDimitry Andric    SDValue LowerLRINT_LLRINT(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerSETCC(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerSETCCCARRY(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerSELECT(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerBRCOND(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerJumpTable(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerVASTART(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerVAARG(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerRETURNADDR(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerADDROFRETURNADDR(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerFRAMEADDR(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerFRAME_TO_ARGS_OFFSET(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerEH_RETURN(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue lowerEH_SJLJ_SETJMP(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue lowerEH_SJLJ_LONGJMP(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue lowerEH_SJLJ_SETUP_DISPATCH(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerINIT_TRAMPOLINE(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerFLT_ROUNDS_(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerWin64_i128OP(SDValue Op, SelectionDAG &DAG) const;
480093f4SDimitry Andric    SDValue LowerGC_TRANSITION(SDValue Op, SelectionDAG &DAG) const;
0b57cec5SDimitry Andric    SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG) const;
8bcb0991SDimitry Andric    SDValue lowerFaddFsub(SDValue Op, SelectionDAG &DAG) const;
8bcb0991SDimitry Andric    SDValue LowerFP_EXTEND(SDValue Op, SelectionDAG &DAG) const;
8bcb0991SDimitry Andric    SDValue LowerFP_ROUND(SDValue Op, SelectionDAG &DAG) const;
8bcb0991SDimitry Andric
8bcb0991SDimitry Andric    SDValue LowerF128Call(SDValue Op, SelectionDAG &DAG,
8bcb0991SDimitry Andric                          RTLIB::Libcall Call) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    SDValue
0b57cec5SDimitry Andric    LowerFormalArguments(SDValue Chain, CallingConv::ID CallConv, bool isVarArg,
0b57cec5SDimitry Andric                         const SmallVectorImpl<ISD::InputArg> &Ins,
0b57cec5SDimitry Andric                         const SDLoc &dl, SelectionDAG &DAG,
0b57cec5SDimitry Andric                         SmallVectorImpl<SDValue> &InVals) const override;
0b57cec5SDimitry Andric    SDValue LowerCall(CallLoweringInfo &CLI,
0b57cec5SDimitry Andric                      SmallVectorImpl<SDValue> &InVals) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool isVarArg,
0b57cec5SDimitry Andric                        const SmallVectorImpl<ISD::OutputArg> &Outs,
0b57cec5SDimitry Andric                        const SmallVectorImpl<SDValue> &OutVals,
0b57cec5SDimitry Andric                        const SDLoc &dl, SelectionDAG &DAG) const override;
0b57cec5SDimitry Andric
    /// Return true only when the function behind \p MF uses the CXX_FAST_TLS
    /// calling convention and also carries the NoUnwind attribute.
0b57cec5SDimitry Andric    bool supportSplitCSR(MachineFunction *MF) const override {
0b57cec5SDimitry Andric      return MF->getFunction().getCallingConv() == CallingConv::CXX_FAST_TLS &&
0b57cec5SDimitry Andric          MF->getFunction().hasFnAttribute(Attribute::NoUnwind);
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric    void initializeSplitCSR(MachineBasicBlock *Entry) const override;
0b57cec5SDimitry Andric    void insertCopiesSplitCSR(
0b57cec5SDimitry Andric      MachineBasicBlock *Entry,
0b57cec5SDimitry Andric      const SmallVectorImpl<MachineBasicBlock *> &Exits) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool isUsedByReturnOnly(SDNode *N, SDValue &Chain) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool mayBeEmittedAsTailCall(const CallInst *CI) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    EVT getTypeForExtReturn(LLVMContext &Context, EVT VT,
0b57cec5SDimitry Andric                            ISD::NodeType ExtendKind) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    bool CanLowerReturn(CallingConv::ID CallConv, MachineFunction &MF,
0b57cec5SDimitry Andric                        bool isVarArg,
0b57cec5SDimitry Andric                        const SmallVectorImpl<ISD::OutputArg> &Outs,
0b57cec5SDimitry Andric                        LLVMContext &Context) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    const MCPhysReg *getScratchRegisters(CallingConv::ID CC) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    TargetLoweringBase::AtomicExpansionKind
*5ffd83dbSDimitry Andric    shouldExpandAtomicLoadInIR(LoadInst *LI) const override;
0b57cec5SDimitry Andric    bool shouldExpandAtomicStoreInIR(StoreInst *SI) const override;
0b57cec5SDimitry Andric    TargetLoweringBase::AtomicExpansionKind
0b57cec5SDimitry Andric    shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    LoadInst *
0b57cec5SDimitry Andric    lowerIdempotentRMWIntoFencedLoad(AtomicRMWInst *AI) const override;
0b57cec5SDimitry Andric
8bcb0991SDimitry Andric    bool lowerAtomicStoreAsStoreSDNode(const StoreInst &SI) const override;
8bcb0991SDimitry Andric    bool lowerAtomicLoadAsLoadSDNode(const LoadInst &LI) const override;
8bcb0991SDimitry Andric
0b57cec5SDimitry Andric    bool needsCmpXchgNb(Type *MemType) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    void SetupEntryBlockForSjLj(MachineInstr &MI, MachineBasicBlock *MBB,
0b57cec5SDimitry Andric                                MachineBasicBlock *DispatchBB, int FI) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    // Utility function to emit the low-level va_arg code for X86-64.
0b57cec5SDimitry Andric    MachineBasicBlock *
0b57cec5SDimitry Andric    EmitVAARG64WithCustomInserter(MachineInstr &MI,
0b57cec5SDimitry Andric                                  MachineBasicBlock *MBB) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Utility function to emit the xmm reg save portion of va_start.
0b57cec5SDimitry Andric    MachineBasicBlock *
0b57cec5SDimitry Andric    EmitVAStartSaveXMMRegsWithCustomInserter(MachineInstr &BInstr,
0b57cec5SDimitry Andric                                             MachineBasicBlock *BB) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    MachineBasicBlock *EmitLoweredCascadedSelect(MachineInstr &MI1,
0b57cec5SDimitry Andric                                                 MachineInstr &MI2,
0b57cec5SDimitry Andric                                                 MachineBasicBlock *BB) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    MachineBasicBlock *EmitLoweredSelect(MachineInstr &I,
0b57cec5SDimitry Andric                                         MachineBasicBlock *BB) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    MachineBasicBlock *EmitLoweredCatchRet(MachineInstr &MI,
0b57cec5SDimitry Andric                                           MachineBasicBlock *BB) const;
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric    MachineBasicBlock *EmitLoweredSegAlloca(MachineInstr &MI,
0b57cec5SDimitry Andric                                            MachineBasicBlock *BB) const;
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric    MachineBasicBlock *EmitLoweredProbedAlloca(MachineInstr &MI,
0b57cec5SDimitry Andric                                               MachineBasicBlock *BB) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    MachineBasicBlock *EmitLoweredTLSAddr(MachineInstr &MI,
0b57cec5SDimitry Andric                                          MachineBasicBlock *BB) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    MachineBasicBlock *EmitLoweredTLSCall(MachineInstr &MI,
0b57cec5SDimitry Andric                                          MachineBasicBlock *BB) const;
0b57cec5SDimitry Andric
0946e70aSDimitry Andric    MachineBasicBlock *EmitLoweredIndirectThunk(MachineInstr &MI,
0b57cec5SDimitry Andric                                                MachineBasicBlock *BB) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    MachineBasicBlock *emitEHSjLjSetJmp(MachineInstr &MI,
0b57cec5SDimitry Andric                                        MachineBasicBlock *MBB) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    void emitSetJmpShadowStackFix(MachineInstr &MI,
0b57cec5SDimitry Andric                                  MachineBasicBlock *MBB) const;
0b57cec5SDimitry Andric
    /// Declared here and defined out of line. Takes the instruction \p MI and
    /// the block pointer \p MBB and returns a MachineBasicBlock pointer.
    /// NOTE(review): the name suggests this emits the longjmp side of
    /// setjmp/longjmp-based exception handling - confirm against the definition.
0b57cec5SDimitry Andric    MachineBasicBlock *emitEHSjLjLongJmp(MachineInstr &MI,
0b57cec5SDimitry Andric                                         MachineBasicBlock *MBB) const;
0b57cec5SDimitry Andric
    /// Declared here and defined out of line. Takes the instruction \p MI and
    /// the block pointer \p MBB and returns a MachineBasicBlock pointer.
    /// NOTE(review): the name suggests a shadow-stack adjustment emitted
    /// alongside longjmp lowering - confirm against the definition.
0b57cec5SDimitry Andric    MachineBasicBlock *emitLongJmpShadowStackFix(MachineInstr &MI,
0b57cec5SDimitry Andric                                                 MachineBasicBlock *MBB) const;
0b57cec5SDimitry Andric
    /// Declared here and defined out of line. Takes the instruction \p MI and
    /// the block pointer \p MBB and returns a MachineBasicBlock pointer.
    /// NOTE(review): the name suggests this builds the dispatch block used by
    /// setjmp/longjmp-based exception handling - confirm against the definition.
0b57cec5SDimitry Andric    MachineBasicBlock *EmitSjLjDispatchBlock(MachineInstr &MI,
0b57cec5SDimitry Andric                                             MachineBasicBlock *MBB) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Emit flags for the given setcc condition and operands. Also returns the
0b57cec5SDimitry Andric    /// corresponding X86 condition code constant in X86CC.
    ///
    /// \p Op0 and \p Op1 are the setcc operands and \p CC is the ISD condition
    /// code. \p X86CC is taken by non-const reference and receives the second
    /// result described above; the flags value is the function's return value.
    /// NOTE(review): what is returned when no flags can be produced is not
    /// visible from this declaration - confirm against the definition.
480093f4SDimitry Andric    SDValue emitFlagsForSetcc(SDValue Op0, SDValue Op1, ISD::CondCode CC,
480093f4SDimitry Andric                              const SDLoc &dl, SelectionDAG &DAG,
*5ffd83dbSDimitry Andric                              SDValue &X86CC) const;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Check if replacement of SQRT with RSQRT should be disabled.
    /// Overrides a virtual hook from a base class (marked `override`) and is
    /// queried per value \p Op with access to \p DAG.
    /// NOTE(review): presumably a true result means "keep the real sqrt" -
    /// confirm against the definition.
*5ffd83dbSDimitry Andric    bool isFsqrtCheap(SDValue Op, SelectionDAG &DAG) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Use rsqrt* to speed up sqrt calculations.
    /// Overrides a base-class hook. \p RefinementSteps and \p UseOneConstNR are
    /// non-const references, so the implementation is able to write values
    /// back to the caller through them.
    /// NOTE(review): the meanings of \p Enabled and \p Reciprocal, and what is
    /// returned when no estimate is produced, are not visible here - confirm
    /// against the base-class documentation.
*5ffd83dbSDimitry Andric    SDValue getSqrtEstimate(SDValue Op, SelectionDAG &DAG, int Enabled,
0b57cec5SDimitry Andric                            int &RefinementSteps, bool &UseOneConstNR,
0b57cec5SDimitry Andric                            bool Reciprocal) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Use rcp* to speed up fdiv calculations.
    /// Overrides a base-class hook. \p RefinementSteps is a non-const
    /// reference, so the implementation is able to write a value back to the
    /// caller through it.
    /// NOTE(review): the meaning of \p Enabled, and what is returned when no
    /// estimate is produced, are not visible here - confirm against the
    /// base-class documentation.
*5ffd83dbSDimitry Andric    SDValue getRecipEstimate(SDValue Op, SelectionDAG &DAG, int Enabled,
0b57cec5SDimitry Andric                             int &RefinementSteps) const override;
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric    /// Reassociate floating point divisions into multiply by reciprocal.
    /// Overrides a base-class hook; takes no arguments and returns an unsigned
    /// value.
    /// NOTE(review): presumably the minimum number of divisions sharing one
    /// divisor for the transform to apply - confirm against the base class.
0b57cec5SDimitry Andric    unsigned combineRepeatedFPDivisors() const override;
8bcb0991SDimitry Andric
    /// Overrides a base-class hook; declared here and defined out of line.
    /// NOTE(review): by its name this builds a replacement for a signed
    /// division of \p N by a power-of-two \p Divisor, and \p Created looks like
    /// an output list of the nodes made along the way - confirm against the
    /// definition.
8bcb0991SDimitry Andric    SDValue BuildSDIVPow2(SDNode *N, const APInt &Divisor, SelectionDAG &DAG,
8bcb0991SDimitry Andric                          SmallVectorImpl<SDNode *> &Created) const override;
0b57cec5SDimitry Andric  };
0b57cec5SDimitry Andric
  // Declares the free function createFastISel inside the X86 namespace.
0b57cec5SDimitry Andric  namespace X86 {
    /// Takes a FunctionLoweringInfo reference and a TargetLibraryInfo pointer
    /// and returns a FastISel pointer.
    /// NOTE(review): ownership of the returned pointer is not stated here -
    /// confirm with the caller.
0b57cec5SDimitry Andric    FastISel *createFastISel(FunctionLoweringInfo &funcInfo,
0b57cec5SDimitry Andric                             const TargetLibraryInfo *libInfo);
0b57cec5SDimitry Andric  } // end namespace X86
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  // X86 specific Gather/Scatter nodes.
0b57cec5SDimitry Andric  // The class has the same order of operands as MaskedGatherScatterSDNode for
0b57cec5SDimitry Andric  // convenience.
  // Operand indices read by the accessors below: 2 = mask, 3 = base pointer,
  // 4 = index, 5 = scale. Operand 1 is read by the gather and scatter
  // subclasses declared after this class.
*5ffd83dbSDimitry Andric  class X86MaskedGatherScatterSDNode : public MemIntrinsicSDNode {
0b57cec5SDimitry Andric  public:
*5ffd83dbSDimitry Andric    // This is intended as a utility and should never be directly created.
    // Both the default constructor and the destructor are deleted.
*5ffd83dbSDimitry Andric    X86MaskedGatherScatterSDNode() = delete;
*5ffd83dbSDimitry Andric    ~X86MaskedGatherScatterSDNode() = delete;
0b57cec5SDimitry Andric
    // Fixed-position operand accessors; each returns a reference to the
    // operand at the index shown.
0b57cec5SDimitry Andric    const SDValue &getBasePtr() const { return getOperand(3); }
0b57cec5SDimitry Andric    const SDValue &getIndex()   const { return getOperand(4); }
0b57cec5SDimitry Andric    const SDValue &getMask()    const { return getOperand(2); }
0b57cec5SDimitry Andric    const SDValue &getScale()   const { return getOperand(5); }
0b57cec5SDimitry Andric
    // Opcode test: true for X86ISD::MGATHER and X86ISD::MSCATTER nodes.
    // NOTE(review): presumably consumed by the isa/cast/dyn_cast templates -
    // confirm.
0b57cec5SDimitry Andric    static bool classof(const SDNode *N) {
0b57cec5SDimitry Andric      return N->getOpcode() == X86ISD::MGATHER ||
0b57cec5SDimitry Andric             N->getOpcode() == X86ISD::MSCATTER;
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric  };
0b57cec5SDimitry Andric
  // Gather flavour of X86MaskedGatherScatterSDNode: adds an accessor for
  // operand 1 and narrows classof to the MGATHER opcode.
0b57cec5SDimitry Andric  class X86MaskedGatherSDNode : public X86MaskedGatherScatterSDNode {
0b57cec5SDimitry Andric  public:
    // Returns operand 1, exposed here as the pass-through value.
0b57cec5SDimitry Andric    const SDValue &getPassThru() const { return getOperand(1); }
0b57cec5SDimitry Andric
    // True only for nodes whose opcode is X86ISD::MGATHER.
0b57cec5SDimitry Andric    static bool classof(const SDNode *N) {
0b57cec5SDimitry Andric      return N->getOpcode() == X86ISD::MGATHER;
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric  };
0b57cec5SDimitry Andric
  // Scatter flavour of X86MaskedGatherScatterSDNode: adds an accessor for
  // operand 1 and narrows classof to the MSCATTER opcode.
0b57cec5SDimitry Andric  class X86MaskedScatterSDNode : public X86MaskedGatherScatterSDNode {
0b57cec5SDimitry Andric  public:
    // Returns operand 1, exposed here as the value operand.
0b57cec5SDimitry Andric    const SDValue &getValue() const { return getOperand(1); }
0b57cec5SDimitry Andric
    // True only for nodes whose opcode is X86ISD::MSCATTER.
0b57cec5SDimitry Andric    static bool classof(const SDNode *N) {
0b57cec5SDimitry Andric      return N->getOpcode() == X86ISD::MSCATTER;
0b57cec5SDimitry Andric    }
0b57cec5SDimitry Andric  };
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric  /// Generate unpacklo/unpackhi shuffle mask.
  /// The function returns void, so the result is delivered through the
  /// non-const reference \p Mask; \p VT is the vector type the mask is for.
  /// NOTE(review): presumably \p Lo selects unpacklo over unpackhi and
  /// \p Unary selects the single-input form; whether \p Mask is cleared or
  /// appended to is not visible here - confirm against the definition.
*5ffd83dbSDimitry Andric  void createUnpackShuffleMask(MVT VT, SmallVectorImpl<int> &Mask, bool Lo,
*5ffd83dbSDimitry Andric                               bool Unary);
0b57cec5SDimitry Andric
*5ffd83dbSDimitry Andric  /// Similar to unpacklo/unpackhi, but without the 128-bit lane limitation
*5ffd83dbSDimitry Andric  /// imposed by AVX and specific to the unary pattern. Example:
*5ffd83dbSDimitry Andric  /// v8iX Lo --> <0, 0, 1, 1, 2, 2, 3, 3>
*5ffd83dbSDimitry Andric  /// v8iX Hi --> <4, 4, 5, 5, 6, 6, 7, 7>
  /// The function returns void, so the result is delivered through the
  /// non-const reference \p Mask; \p Lo picks between the "Lo" and "Hi"
  /// patterns shown in the example.
  /// NOTE(review): whether \p Mask is cleared or appended to is not visible
  /// here - confirm against the definition.
*5ffd83dbSDimitry Andric  void createSplat2ShuffleMask(MVT VT, SmallVectorImpl<int> &Mask, bool Lo);
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric} // end namespace llvm
0b57cec5SDimitry Andric
0b57cec5SDimitry Andric#endif // LLVM_LIB_TARGET_X86_X86ISELLOWERING_H