Target/X86/X86ISelLowering.h

193323Sed//===-- X86ISelLowering.h - X86 DAG Lowering Interface ----------*- C++ -*-===//
193323Sed//
193323Sed//                     The LLVM Compiler Infrastructure
193323Sed//
193323Sed// This file is distributed under the University of Illinois Open Source
193323Sed// License. See LICENSE.TXT for details.
193323Sed//
193323Sed//===----------------------------------------------------------------------===//
193323Sed//
193323Sed// This file defines the interfaces that X86 uses to lower LLVM code into a
193323Sed// selection DAG.
193323Sed//
193323Sed//===----------------------------------------------------------------------===//
193323Sed
280031Sdim#ifndef LLVM_LIB_TARGET_X86_X86ISELLOWERING_H
280031Sdim#define LLVM_LIB_TARGET_X86_X86ISELLOWERING_H
193323Sed
249423Sdim#include "llvm/CodeGen/CallingConvLower.h"
249423Sdim#include "llvm/CodeGen/SelectionDAG.h"
193323Sed#include "llvm/Target/TargetLowering.h"
203954Srdivacky#include "llvm/Target/TargetOptions.h"
193323Sed
193323Sednamespace llvm {
276479Sdim  class X86Subtarget;
276479Sdim  class X86TargetMachine;
276479Sdim
193323Sed  namespace X86ISD {
193323Sed    // X86 Specific DAG Nodes
288943Sdim    enum NodeType : unsigned {
193323Sed      // Start the numbering where the builtin ops leave off.
193323Sed      FIRST_NUMBER = ISD::BUILTIN_OP_END,
193323Sed
288943Sdim      /// Bit scan forward.
193323Sed      BSF,
288943Sdim      /// Bit scan reverse.
193323Sed      BSR,
193323Sed
288943Sdim      /// Double shift instructions. These correspond to
193323Sed      /// X86::SHLDxx and X86::SHRDxx instructions.
193323Sed      SHLD,
193323Sed      SHRD,
193323Sed
288943Sdim      /// Bitwise logical AND of floating point values. This corresponds
193323Sed      /// to X86::ANDPS or X86::ANDPD.
193323Sed      FAND,
193323Sed
288943Sdim      /// Bitwise logical OR of floating point values. This corresponds
193323Sed      /// to X86::ORPS or X86::ORPD.
193323Sed      FOR,
193323Sed
288943Sdim      /// Bitwise logical XOR of floating point values. This corresponds
193323Sed      /// to X86::XORPS or X86::XORPD.
193323Sed      FXOR,
193323Sed
288943Sdim      /// Bitwise logical ANDNOT of floating point values. This
261991Sdim      /// corresponds to X86::ANDNPS or X86::ANDNPD.
261991Sdim      FANDN,
261991Sdim
288943Sdim      /// These operations represent an abstract X86 call
193323Sed      /// instruction, which includes a bunch of information.  In particular the
193323Sed      /// operands of these nodes are:
193323Sed      ///
193323Sed      ///     #0 - The incoming token chain
193323Sed      ///     #1 - The callee
193323Sed      ///     #2 - The number of arg bytes the caller pushes on the stack.
193323Sed      ///     #3 - The number of arg bytes the callee pops off the stack.
193323Sed      ///     #4 - The value to pass in AL/AX/EAX (optional)
193323Sed      ///     #5 - The value to pass in DL/DX/EDX (optional)
193323Sed      ///
193323Sed      /// The result values of these nodes are:
193323Sed      ///
193323Sed      ///     #0 - The outgoing token chain
193323Sed      ///     #1 - The first register result value (optional)
193323Sed      ///     #2 - The second register result value (optional)
193323Sed      ///
193323Sed      CALL,
198090Srdivacky
288943Sdim      /// This operation implements the lowering for readcyclecounter.
193323Sed      RDTSC_DAG,
193323Sed
276479Sdim      /// X86 Read Time-Stamp Counter and Processor ID.
276479Sdim      RDTSCP_DAG,
276479Sdim
276479Sdim      /// X86 Read Performance Monitoring Counters.
276479Sdim      RDPMC_DAG,
276479Sdim
193323Sed      /// X86 compare and logical compare instructions.
193323Sed      CMP, COMI, UCOMI,
193323Sed
193323Sed      /// X86 bit-test instructions.
193323Sed      BT,
193323Sed
218893Sdim      /// X86 SetCC. Operand 0 is condition code, and operand 1 is the EFLAGS
218893Sdim      /// operand, usually produced by a CMP instruction.
193323Sed      SETCC,
193323Sed
276479Sdim      /// X86 Select
276479Sdim      SELECT,
276479Sdim
200581Srdivacky      // Same as SETCC except it's materialized with a sbb and the value is all
200581Srdivacky      // ones or all zeros.
218893Sdim      SETCC_CARRY,  // R = carry_bit ? ~0 : 0
200581Srdivacky
223017Sdim      /// X86 FP SETCC, implemented with CMP{cc}SS/CMP{cc}SD.
223017Sdim      /// Operands are two FP values to compare; result is a mask of
223017Sdim      /// 0s or 1s.  Generally DTRT for C/C++ with NaNs.
276479Sdim      FSETCC,
223017Sdim
223017Sdim      /// X86 MOVMSK{pd|ps}, extracts sign bits of two or four FP values,
223017Sdim      /// result in an integer GPR.  Needs masking for scalar result.
223017Sdim      FGETSIGNx86,
223017Sdim
193323Sed      /// X86 conditional moves. Operand 0 and operand 1 are the two values
193323Sed      /// to select from. Operand 2 is the condition code, and operand 3 is the
193323Sed      /// flag operand produced by a CMP or TEST instruction. It also writes a
193323Sed      /// flag result.
193323Sed      CMOV,
193323Sed
193323Sed      /// X86 conditional branches. Operand 0 is the chain operand, operand 1
193323Sed      /// is the block to branch if condition is true, operand 2 is the
193323Sed      /// condition code, and operand 3 is the flag operand produced by a CMP
193323Sed      /// or TEST instruction.
193323Sed      BRCOND,
193323Sed
193323Sed      /// Return with a flag operand. Operand 0 is the chain operand, operand
193323Sed      /// 1 is the number of bytes of stack to pop.
193323Sed      RET_FLAG,
193323Sed
296417Sdim      /// Return from interrupt. Operand 0 is the number of bytes to pop.
296417Sdim      IRET,
296417Sdim
288943Sdim      /// Repeat fill, corresponds to X86::REP_STOSx.
193323Sed      REP_STOS,
193323Sed
288943Sdim      /// Repeat move, corresponds to X86::REP_MOVSx.
193323Sed      REP_MOVS,
193323Sed
288943Sdim      /// On Darwin, this node represents the result of the popl
193323Sed      /// at function entry, used for PIC code.
193323Sed      GlobalBaseReg,
193323Sed
288943Sdim      /// A wrapper node for TargetConstantPool,
193323Sed      /// TargetExternalSymbol, and TargetGlobalAddress.
193323Sed      Wrapper,
193323Sed
288943Sdim      /// Special wrapper used under X86-64 PIC mode for RIP
193323Sed      /// relative displacements.
193323Sed      WrapperRIP,
193323Sed
288943Sdim      /// Copies a 64-bit value from the low word of an XMM vector
218893Sdim      /// to an MMX vector.  If you think this is too close to the previous
218893Sdim      /// mnemonic, so do I; blame Intel.
218893Sdim      MOVDQ2Q,
218893Sdim
288943Sdim      /// Copies a 32-bit value from the low word of a MMX
243830Sdim      /// vector to a GPR.
243830Sdim      MMX_MOVD2W,
243830Sdim
288943Sdim      /// Copies a GPR into the low 32-bit word of a MMX vector
288943Sdim      /// and zero out the high word.
288943Sdim      MMX_MOVW2D,
288943Sdim
288943Sdim      /// Extract an 8-bit value from a vector and zero extend it to
193323Sed      /// i32, corresponds to X86::PEXTRB.
193323Sed      PEXTRB,
193323Sed
288943Sdim      /// Extract a 16-bit value from a vector and zero extend it to
193323Sed      /// i32, corresponds to X86::PEXTRW.
193323Sed      PEXTRW,
193323Sed
288943Sdim      /// Insert any element of a 4 x float vector into any element
193323Sed      /// of a destination 4 x float vector.
193323Sed      INSERTPS,
193323Sed
288943Sdim      /// Insert the lower 8-bits of a 32-bit value to a vector,
193323Sed      /// corresponds to X86::PINSRB.
193323Sed      PINSRB,
193323Sed
288943Sdim      /// Insert the lower 16-bits of a 32-bit value to a vector,
193323Sed      /// corresponds to X86::PINSRW.
204642Srdivacky      PINSRW, MMX_PINSRW,
193323Sed
288943Sdim      /// Shuffle 16 8-bit values within a vector.
193323Sed      PSHUFB,
219077Sdim
288943Sdim      /// Compute Sum of Absolute Differences.
288943Sdim      PSADBW,
296417Sdim      /// Compute Double Block Packed Sum-Absolute-Differences
296417Sdim      DBPSADBW,
288943Sdim
288943Sdim      /// Bitwise Logical AND NOT of Packed FP values.
224145Sdim      ANDNP,
219077Sdim
288943Sdim      /// Copy integer sign.
234353Sdim      PSIGN,
219077Sdim
288943Sdim      /// Blend where the selector is an immediate.
249423Sdim      BLENDI,
234353Sdim
288943Sdim      /// Blend where the condition has been shrunk.
280031Sdim      /// This is used to emphasize that the condition mask is
280031Sdim      /// no longer valid for generic VSELECT optimizations.
280031Sdim      SHRUNKBLEND,
280031Sdim
288943Sdim      /// Combined add and sub on an FP vector.
280031Sdim      ADDSUB,
280031Sdim
288943Sdim      // FP vector ops with rounding mode.
288943Sdim      FADD_RND,
288943Sdim      FSUB_RND,
288943Sdim      FMUL_RND,
288943Sdim      FDIV_RND,
288943Sdim      FMAX_RND,
288943Sdim      FMIN_RND,
288943Sdim      FSQRT_RND,
288943Sdim
288943Sdim      // FP vector get exponent
288943Sdim      FGETEXP_RND,
296417Sdim      // Extract Normalized Mantissas
296417Sdim      VGETMANT,
288943Sdim      // FP Scale
288943Sdim      SCALEF,
288943Sdim      // Integer add/sub with unsigned saturation.
288943Sdim      ADDUS,
249423Sdim      SUBUS,
288943Sdim      // Integer add/sub with signed saturation.
288943Sdim      ADDS,
288943Sdim      SUBS,
288943Sdim      // Unsigned Integer average
288943Sdim      AVG,
288943Sdim      /// Integer horizontal add.
234353Sdim      HADD,
234353Sdim
288943Sdim      /// Integer horizontal sub.
234353Sdim      HSUB,
234353Sdim
288943Sdim      /// Floating point horizontal add.
226633Sdim      FHADD,
226633Sdim
288943Sdim      /// Floating point horizontal sub.
226633Sdim      FHSUB,
226633Sdim
288943Sdim      // Integer absolute value
288943Sdim      ABS,
249423Sdim
296417Sdim      // Detect Conflicts Within a Vector
296417Sdim      CONFLICT,
296417Sdim
288943Sdim      /// Floating point max and min.
193323Sed      FMAX, FMIN,
193323Sed
288943Sdim      /// Commutative FMIN and FMAX.
243830Sdim      FMAXC, FMINC,
243830Sdim
288943Sdim      /// Floating point reciprocal-sqrt and reciprocal approximation.
288943Sdim      /// Note that these typically require refinement
193323Sed      /// in order to obtain suitable precision.
193323Sed      FRSQRT, FRCP,
193323Sed
288943Sdim      // Thread Local Storage.
193323Sed      TLSADDR,
218893Sdim
288943Sdim      // Thread Local Storage. A call to get the start address
239462Sdim      // of the TLS block for the current module.
239462Sdim      TLSBASEADDR,
239462Sdim
288943Sdim      // Thread Local Storage.  When calling to an OS provided
210299Sed      // thunk at the address from an earlier relocation.
210299Sed      TLSCALL,
193323Sed
288943Sdim      // Exception Handling helpers.
193323Sed      EH_RETURN,
218893Sdim
288943Sdim      // SjLj exception handling setjmp.
243830Sdim      EH_SJLJ_SETJMP,
243830Sdim
288943Sdim      // SjLj exception handling longjmp.
243830Sdim      EH_SJLJ_LONGJMP,
243830Sdim
288943Sdim      /// Tail call return. See X86TargetLowering::LowerCall for
249423Sdim      /// the list of operands.
193323Sed      TC_RETURN,
193323Sed
288943Sdim      // Vector move to low scalar and zero higher vector elements.
193323Sed      VZEXT_MOVL,
193323Sed
288943Sdim      // Vector integer zero-extend.
243830Sdim      VZEXT,
243830Sdim
288943Sdim      // Vector integer signed-extend.
243830Sdim      VSEXT,
243830Sdim
288943Sdim      // Vector integer truncate.
261991Sdim      VTRUNC,
296417Sdim      // Vector integer truncate with unsigned/signed saturation.
296417Sdim      VTRUNCUS, VTRUNCS,
261991Sdim
288943Sdim      // Vector FP extend.
239462Sdim      VFPEXT,
239462Sdim
288943Sdim      // Vector FP round.
243830Sdim      VFPROUND,
243830Sdim
288943Sdim      // Vector signed/unsigned integer to double.
288943Sdim      CVTDQ2PD, CVTUDQ2PD,
288943Sdim
296417Sdim      // Convert a vector to mask, set bits based on MSB.
296417Sdim      CVT2MASK,
296417Sdim
288943Sdim      // 128-bit vector logical left / right shift
234353Sdim      VSHLDQ, VSRLDQ,
218893Sdim
288943Sdim      // Vector shift elements
234353Sdim      VSHL, VSRL, VSRA,
234353Sdim
288943Sdim      // Vector shift elements by immediate
234353Sdim      VSHLI, VSRLI, VSRAI,
234353Sdim
296417Sdim      // Bit rotate by immediate
296417Sdim      VROTLI, VROTRI,
296417Sdim
288943Sdim      // Vector packed double/float comparison.
234353Sdim      CMPP,
234353Sdim
288943Sdim      // Vector integer comparisons.
234353Sdim      PCMPEQ, PCMPGT,
288943Sdim      // Vector integer comparisons, the result is in a mask vector.
261991Sdim      PCMPEQM, PCMPGTM,
193323Sed
288943Sdim      /// Vector comparison generating mask bits for fp and
261991Sdim      /// integer signed and unsigned data types.
261991Sdim      CMPM,
261991Sdim      CMPMU,
288943Sdim      // Vector comparison with rounding mode for FP values
288943Sdim      CMPM_RND,
261991Sdim
288943Sdim      // Arithmetic operations with FLAGS results.
218893Sdim      ADD, SUB, ADC, SBB, SMUL,
198090Srdivacky      INC, DEC, OR, XOR, AND,
219077Sdim
288943Sdim      BEXTR,  // Bit field extract
234353Sdim
218893Sdim      UMUL, // LOW, HI, FLAGS = umul LHS, RHS
193323Sed
280031Sdim      // 8-bit SMUL/UMUL - AX, FLAGS = smul8/umul8 AL, RHS
280031Sdim      SMUL8, UMUL8,
280031Sdim
280031Sdim      // 8-bit divrem that zero- or sign-extends the high result (AH).
280031Sdim      UDIVREM8_ZEXT_HREG,
280031Sdim      SDIVREM8_SEXT_HREG,
280031Sdim
288943Sdim      // X86-specific multiply by immediate.
198090Srdivacky      MUL_IMM,
218893Sdim
288943Sdim      // Vector bitwise comparisons.
198090Srdivacky      PTEST,
198090Srdivacky
288943Sdim      // Vector packed fp sign bitwise comparisons.
212904Sdim      TESTP,
212904Sdim
288943Sdim      // Vector "test" in AVX-512, the result is in a mask vector.
261991Sdim      TESTM,
276479Sdim      TESTNM,
261991Sdim
261991Sdim      // OR/AND test for masks
261991Sdim      KORTEST,
296417Sdim      KTEST,
261991Sdim
212904Sdim      // Several flavors of instructions with vector shuffle behaviors.
276479Sdim      PACKSS,
276479Sdim      PACKUS,
280031Sdim      // Intra-lane alignr
249423Sdim      PALIGNR,
280031Sdim      // AVX512 inter-lane alignr
280031Sdim      VALIGN,
212904Sdim      PSHUFD,
212904Sdim      PSHUFHW,
212904Sdim      PSHUFLW,
234353Sdim      SHUFP,
288943Sdim      // Shuffle Packed Values at 128-bit granularity
288943Sdim      SHUF128,
212904Sdim      MOVDDUP,
212904Sdim      MOVSHDUP,
212904Sdim      MOVSLDUP,
212904Sdim      MOVLHPS,
212904Sdim      MOVLHPD,
212904Sdim      MOVHLPS,
212904Sdim      MOVLPS,
212904Sdim      MOVLPD,
212904Sdim      MOVSD,
212904Sdim      MOVSS,
234353Sdim      UNPCKL,
234353Sdim      UNPCKH,
280031Sdim      VPERMILPV,
280031Sdim      VPERMILPI,
234982Sdim      VPERMV,
261991Sdim      VPERMV3,
276479Sdim      VPERMIV3,
234982Sdim      VPERMI,
234353Sdim      VPERM2X128,
296417Sdim      // Bitwise ternary logic
296417Sdim      VPTERNLOG,
296417Sdim      // Fix Up Special Packed Float32/64 values
288943Sdim      VFIXUPIMM,
296417Sdim      // Range Restriction Calculation For Packed Pairs of Float32/64 values
288943Sdim      VRANGE,
296417Sdim      // Reduce - Perform Reduction Transformation on scalar/packed FP
296417Sdim      VREDUCE,
296417Sdim      // RndScale - Round FP Values To Include A Given Number Of Fraction Bits
296417Sdim      VRNDSCALE,
296417Sdim      // VFPCLASS - Tests types of FP values for packed types.
296417Sdim      VFPCLASS,
296417Sdim      // VFPCLASSS - Tests types of FP values for scalar types.
296417Sdim      VFPCLASSS,
288943Sdim      // Broadcast scalar to vector
226633Sdim      VBROADCAST,
296417Sdim      // Broadcast mask to vector
296417Sdim      VBROADCASTM,
288943Sdim      // Broadcast subvector to vector
288943Sdim      SUBV_BROADCAST,
276479Sdim      // Insert/Extract vector element
261991Sdim      VINSERT,
276479Sdim      VEXTRACT,
212904Sdim
288943Sdim      /// SSE4A Extraction and Insertion.
288943Sdim      EXTRQI, INSERTQI,
288943Sdim
296417Sdim      // XOP variable/immediate rotations
296417Sdim      VPROT, VPROTI,
296417Sdim      // XOP arithmetic/logical shifts
296417Sdim      VPSHA, VPSHL,
296417Sdim      // XOP signed/unsigned integer comparisons
296417Sdim      VPCOM, VPCOMU,
296417Sdim
280031Sdim      // Vector multiply packed unsigned doubleword integers
234353Sdim      PMULUDQ,
280031Sdim      // Vector multiply packed signed doubleword integers
276479Sdim      PMULDQ,
288943Sdim      // Vector Multiply Packed Unsigned Integers with Round and Scale
288943Sdim      MULHRS,
296417Sdim      // Multiply and Add Packed Integers
296417Sdim      VPMADDUBSW, VPMADDWD,
239462Sdim      // FMA nodes
239462Sdim      FMADD,
239462Sdim      FNMADD,
239462Sdim      FMSUB,
239462Sdim      FNMSUB,
239462Sdim      FMADDSUB,
239462Sdim      FMSUBADD,
288943Sdim      // FMA with rounding mode
288943Sdim      FMADD_RND,
288943Sdim      FNMADD_RND,
288943Sdim      FMSUB_RND,
288943Sdim      FNMSUB_RND,
288943Sdim      FMADDSUB_RND,
288943Sdim      FMSUBADD_RND,
239462Sdim
280031Sdim      // Compress and expand
280031Sdim      COMPRESS,
280031Sdim      EXPAND,
280031Sdim
288943Sdim      // Convert Signed/Unsigned Integer to Scalar Floating-Point Value
288943Sdim      // with rounding mode
288943Sdim      SINT_TO_FP_RND,
288943Sdim      UINT_TO_FP_RND,
288943Sdim
288943Sdim      // Vector float/double to signed/unsigned integer.
288943Sdim      FP_TO_SINT_RND, FP_TO_UINT_RND,
280031Sdim      // Save xmm argument registers to the stack, according to %al. An operator
280031Sdim      // is needed so that this can be expanded with control flow.
198090Srdivacky      VASTART_SAVE_XMM_REGS,
198090Srdivacky
280031Sdim      // Windows's _chkstk call to do stack probing.
218893Sdim      WIN_ALLOCA,
204961Srdivacky
280031Sdim      // For allocating variable amounts of stack space when using
226633Sdim      // segmented stacks. Check if the current stacklet has enough space, and
226633Sdim      // falls back to heap allocation if not.
226633Sdim      SEG_ALLOCA,
226633Sdim
218893Sdim      // Memory barrier
218893Sdim      MEMBARRIER,
218893Sdim      MFENCE,
218893Sdim      SFENCE,
218893Sdim      LFENCE,
218893Sdim
280031Sdim      // Store FP status word into i16 register.
239462Sdim      FNSTSW16r,
239462Sdim
280031Sdim      // Store contents of %ah into %eflags.
239462Sdim      SAHF,
239462Sdim
280031Sdim      // Get a random integer and indicate whether it is valid in CF.
239462Sdim      RDRAND,
239462Sdim
280031Sdim      // Get a NIST SP800-90B & C compliant random integer and
249423Sdim      // indicate whether it is valid in CF.
249423Sdim      RDSEED,
249423Sdim
239462Sdim      PCMPISTRI,
239462Sdim      PCMPESTRI,
239462Sdim
280031Sdim      // Test if in transactional execution.
249423Sdim      XTEST,
249423Sdim
280031Sdim      // ERI instructions
280031Sdim      RSQRT28, RCP28, EXP2,
280031Sdim
280031Sdim      // Compare and swap.
276479Sdim      LCMPXCHG_DAG = ISD::FIRST_TARGET_MEMORY_OPCODE,
218893Sdim      LCMPXCHG8_DAG,
226633Sdim      LCMPXCHG16_DAG,
218893Sdim
280031Sdim      // Load, scalar_to_vector, and zero extend.
218893Sdim      VZEXT_LOAD,
218893Sdim
280031Sdim      // Store FP control word into i16 memory.
218893Sdim      FNSTCW16m,
218893Sdim
280031Sdim      /// This instruction implements FP_TO_SINT with the
218893Sdim      /// integer destination in memory and a FP reg source.  This corresponds
218893Sdim      /// to the X86::FIST*m instructions and the rounding mode change stuff. It
218893Sdim      /// has two inputs (token chain and address) and two outputs (int value
218893Sdim      /// and token chain).
218893Sdim      FP_TO_INT16_IN_MEM,
218893Sdim      FP_TO_INT32_IN_MEM,
218893Sdim      FP_TO_INT64_IN_MEM,
218893Sdim
280031Sdim      /// This instruction implements SINT_TO_FP with the
218893Sdim      /// integer source in memory and FP reg result.  This corresponds to the
218893Sdim      /// X86::FILD*m instructions. It has three inputs (token chain, address,
218893Sdim      /// and source type) and two outputs (FP value and token chain). FILD_FLAG
218893Sdim      /// also produces a flag.
218893Sdim      FILD,
218893Sdim      FILD_FLAG,
218893Sdim
280031Sdim      /// This instruction implements an extending load to FP stack slots.
218893Sdim      /// This corresponds to the X86::FLD32m / X86::FLD64m. It takes a chain
218893Sdim      /// operand, ptr to load from, and a ValueType node indicating the type
218893Sdim      /// to load to.
218893Sdim      FLD,
218893Sdim
280031Sdim      /// This instruction implements a truncating store to FP stack
218893Sdim      /// slots. This corresponds to the X86::FST32m / X86::FST64m. It takes a
218893Sdim      /// chain operand, value to store, address, and a ValueType to store it
218893Sdim      /// as.
218893Sdim      FST,
218893Sdim
280031Sdim      /// This instruction grabs the address of the next argument
218893Sdim      /// from a va_list. (reads and modifies the va_list in memory)
218893Sdim      VAARG_64
218893Sdim
204961Srdivacky      // WARNING: Do not add anything in the end unless you want the node to
204961Srdivacky      // have memop! In fact, starting from LCMPXCHG_DAG all opcodes will be
204961Srdivacky      // treated as target memory ops!
193323Sed    };
193323Sed  }
193323Sed
193323Sed  /// Define some predicates that are used for node matching.
193323Sed  namespace X86 {
280031Sdim    /// Return true if the specified
218893Sdim    /// EXTRACT_SUBVECTOR operand specifies a vector extract that is
261991Sdim    /// suitable for input to VEXTRACTF128, VEXTRACTI128 instructions.
261991Sdim    bool isVEXTRACT128Index(SDNode *N);
218893Sdim
280031Sdim    /// Return true if the specified
218893Sdim    /// INSERT_SUBVECTOR operand specifies a subvector insert that is
261991Sdim    /// suitable for input to VINSERTF128, VINSERTI128 instructions.
261991Sdim    bool isVINSERT128Index(SDNode *N);
218893Sdim
280031Sdim    /// Return true if the specified
261991Sdim    /// EXTRACT_SUBVECTOR operand specifies a vector extract that is
261991Sdim    /// suitable for input to VEXTRACTF64X4, VEXTRACTI64X4 instructions.
261991Sdim    bool isVEXTRACT256Index(SDNode *N);
261991Sdim
280031Sdim    /// Return true if the specified
261991Sdim    /// INSERT_SUBVECTOR operand specifies a subvector insert that is
261991Sdim    /// suitable for input to VINSERTF64X4, VINSERTI64X4 instructions.
261991Sdim    bool isVINSERT256Index(SDNode *N);
261991Sdim
280031Sdim    /// Return the appropriate
218893Sdim    /// immediate to extract the specified EXTRACT_SUBVECTOR index
261991Sdim    /// with VEXTRACTF128, VEXTRACTI128 instructions.
261991Sdim    unsigned getExtractVEXTRACT128Immediate(SDNode *N);
218893Sdim
280031Sdim    /// Return the appropriate
218893Sdim    /// immediate to insert at the specified INSERT_SUBVECTOR index
261991Sdim    /// with VINSERTF128, VINSERTI128 instructions.
261991Sdim    unsigned getInsertVINSERT128Immediate(SDNode *N);
218893Sdim
280031Sdim    /// Return the appropriate
261991Sdim    /// immediate to extract the specified EXTRACT_SUBVECTOR index
261991Sdim    /// with VEXTRACTF64X4, VEXTRACTI64X4 instructions.
261991Sdim    unsigned getExtractVEXTRACT256Immediate(SDNode *N);
261991Sdim
280031Sdim    /// Return the appropriate
261991Sdim    /// immediate to insert at the specified INSERT_SUBVECTOR index
261991Sdim    /// with VINSERTF64X4, VINSERTI64X4 instructions.
261991Sdim    unsigned getInsertVINSERT256Immediate(SDNode *N);
261991Sdim
280031Sdim    /// Returns true if Elt is a constant zero or floating point constant +0.0.
198090Srdivacky    bool isZeroNode(SDValue Elt);
198090Srdivacky
280031Sdim    /// Returns true if the given offset can be
198090Srdivacky    /// fit into the displacement field of the instruction.
198090Srdivacky    bool isOffsetSuitableForCodeModel(int64_t Offset, CodeModel::Model M,
198090Srdivacky                                      bool hasSymbolicDisplacement = true);
224145Sdim
224145Sdim
280031Sdim    /// Determines whether the callee is required to pop its
224145Sdim    /// own arguments. Callee pop is necessary to support tail calls.
224145Sdim    bool isCalleePop(CallingConv::ID CallingConv,
224145Sdim                     bool is64Bit, bool IsVarArg, bool TailCallOpt);
280031Sdim
193323Sed  }
193323Sed
193323Sed  //===--------------------------------------------------------------------===//
280031Sdim  //  X86 Implementation of the TargetLowering interface
276479Sdim  class X86TargetLowering final : public TargetLowering {
193323Sed  public:
288943Sdim    explicit X86TargetLowering(const X86TargetMachine &TM,
288943Sdim                               const X86Subtarget &STI);
193323Sed
276479Sdim    unsigned getJumpTableEncoding() const override;
288943Sdim    bool useSoftFloat() const override;
203954Srdivacky
288943Sdim    MVT getScalarShiftAmountTy(const DataLayout &, EVT) const override {
288943Sdim      return MVT::i8; // Always i8; both arguments are ignored.
288943Sdim    }
219077Sdim
276479Sdim    const MCExpr *
203954Srdivacky    LowerCustomJumpTableEntry(const MachineJumpTableInfo *MJTI,
203954Srdivacky                              const MachineBasicBlock *MBB, unsigned uid,
276479Sdim                              MCContext &Ctx) const override;
218893Sdim
280031Sdim    /// Returns relocation base for the given PIC jumptable.
276479Sdim    SDValue getPICJumpTableRelocBase(SDValue Table,
276479Sdim                                     SelectionDAG &DAG) const override;
276479Sdim    const MCExpr *
203954Srdivacky    getPICJumpTableRelocBaseExpr(const MachineFunction *MF,
276479Sdim                                 unsigned JTI, MCContext &Ctx) const override;
218893Sdim
280031Sdim    /// Return the desired alignment for ByVal aggregate
193323Sed    /// function arguments in the caller parameter area. For X86, aggregates
193323Sed    /// that contain SSE vectors are placed at 16-byte boundaries while the rest
193323Sed    /// are at 4-byte boundaries.
288943Sdim    unsigned getByValTypeAlignment(Type *Ty,
288943Sdim                                   const DataLayout &DL) const override;
193323Sed
280031Sdim    /// Returns the target specific optimal type for load
206124Srdivacky    /// and store operations as a result of memset, memcpy, and memmove
206124Srdivacky    /// lowering. If DstAlign is zero that means the destination
206124Srdivacky    /// alignment can satisfy any constraint. Similarly if SrcAlign is zero it
206124Srdivacky    /// means there isn't a need to check it against alignment requirement,
249423Sdim    /// probably because the source does not need to be loaded. If 'IsMemset' is
249423Sdim    /// true, that means it's expanding a memset. If 'ZeroMemset' is true, that
249423Sdim    /// means it's a memset of zero. 'MemcpyStrSrc' indicates whether the memcpy
249423Sdim    /// source is constant so it does not need to be loaded.
207618Srdivacky    /// It returns EVT::Other if the type should be determined using generic
207618Srdivacky    /// target-independent logic.
276479Sdim    EVT getOptimalMemOpType(uint64_t Size, unsigned DstAlign, unsigned SrcAlign,
276479Sdim                            bool IsMemset, bool ZeroMemset, bool MemcpyStrSrc,
276479Sdim                            MachineFunction &MF) const override;
195340Sed
280031Sdim    /// Returns true if it's safe to use load / store of the
249423Sdim    /// specified type to expand memcpy / memset inline. This is mostly true
249423Sdim    /// for all types except for some special cases. For example, on X86
249423Sdim    /// targets without SSE2 f64 load / store are done with fldl / fstpl which
249423Sdim    /// also does type conversion. Note the specified type doesn't have to be
249423Sdim    /// legal as the hook is used before type legalization.
276479Sdim    bool isSafeMemOpType(MVT VT) const override;
249423Sdim
288943Sdim    /// Returns true if the target allows unaligned memory accesses of the
288943Sdim    /// specified type. Returns whether it is "fast" in the last argument.
280031Sdim    bool allowsMisalignedMemoryAccesses(EVT VT, unsigned AS, unsigned Align,
276479Sdim                                       bool *Fast) const override;
198090Srdivacky
280031Sdim    /// Provide custom lowering hooks for some operations.
193323Sed    ///
276479Sdim    SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override;
193323Sed
280031Sdim    /// Replace the results of node with an illegal result
193323Sed    /// type with new values built out of custom code.
193323Sed    ///
276479Sdim    void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue>&Results,
276479Sdim                            SelectionDAG &DAG) const override;
193323Sed
218893Sdim
276479Sdim    SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override;
193323Sed
280031Sdim    /// Return true if the target has native support for
207618Srdivacky    /// the specified value type and it is 'desirable' to use the type for the
207618Srdivacky    /// given node type. e.g. On x86 i16 is legal, but undesirable since i16
207618Srdivacky    /// instruction encodings are longer and some i16 instructions are slow.
276479Sdim    bool isTypeDesirableForOp(unsigned Opc, EVT VT) const override;
193323Sed
280031Sdim    /// Return true if the target has native support for the
207618Srdivacky    /// specified value type and it is 'desirable' to use the type. e.g. On x86
207618Srdivacky    /// i16 is legal, but undesirable since i16 instruction encodings are longer
207618Srdivacky    /// and some i16 instructions are slow.
276479Sdim    bool IsDesirableToPromoteOp(SDValue Op, EVT &PVT) const override;
207618Srdivacky
296417Sdim    /// Return true if the MachineFunction contains a COPY which would imply
296417Sdim    /// HasOpaqueSPAdjustment.
296417Sdim    bool hasCopyImplyingStackAdjustment(MachineFunction *MF) const override;
296417Sdim
276479Sdim    MachineBasicBlock *
207618Srdivacky      EmitInstrWithCustomInserter(MachineInstr *MI,
276479Sdim                                  MachineBasicBlock *MBB) const override;
207618Srdivacky
218893Sdim
280031Sdim    /// This method returns the name of a target specific DAG node.
276479Sdim    const char *getTargetNodeName(unsigned Opcode) const override;
193323Sed
280031Sdim    bool isCheapToSpeculateCttz() const override;
280031Sdim
280031Sdim    bool isCheapToSpeculateCtlz() const override;
280031Sdim
280031Sdim    /// Return the value type to use for ISD::SETCC.
288943Sdim    EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Context,
288943Sdim                           EVT VT) const override;
193323Sed
280031Sdim    /// Determine which of the bits specified in Mask are known to be either
280031Sdim    /// zero or one and return them in the KnownZero/KnownOne bitsets.
276479Sdim    void computeKnownBitsForTargetNode(const SDValue Op,
276479Sdim                                       APInt &KnownZero,
276479Sdim                                       APInt &KnownOne,
276479Sdim                                       const SelectionDAG &DAG,
276479Sdim                                       unsigned Depth = 0) const override;
193323Sed
280031Sdim    /// Determine the number of bits in the operation that are sign bits.
276479Sdim    unsigned ComputeNumSignBitsForTargetNode(SDValue Op,
276479Sdim                                             const SelectionDAG &DAG,
276479Sdim                                             unsigned Depth) const override;
218893Sdim
276479Sdim    bool isGAPlusOffset(SDNode *N, const GlobalValue* &GA,
276479Sdim                        int64_t &Offset) const override;
218893Sdim
207618Srdivacky    SDValue getReturnAddressFrameIndex(SelectionDAG &DAG) const;
193323Sed
276479Sdim    bool ExpandInlineAsm(CallInst *CI) const override;
218893Sdim
288943Sdim    ConstraintType getConstraintType(StringRef Constraint) const override;
218893Sdim
218893Sdim    /// Examine constraint string and operand type and determine a weight value.
218893Sdim    /// The operand object must already have been set up with the operand type.
276479Sdim    ConstraintWeight
276479Sdim      getSingleConstraintMatchWeight(AsmOperandInfo &info,
276479Sdim                                     const char *constraint) const override;
218893Sdim
276479Sdim    const char *LowerXConstraint(EVT ConstraintVT) const override;
193323Sed
280031Sdim    /// Lower the specified operand into the Ops vector. If it is invalid, don't
280031Sdim    /// add anything to Ops. Constraint is presumably the constraint code being
280031Sdim    /// matched for Op (TODO confirm); there is no hasMemory parameter here.
276479Sdim    void LowerAsmOperandForConstraint(SDValue Op,
276479Sdim                                      std::string &Constraint,
276479Sdim                                      std::vector<SDValue> &Ops,
276479Sdim                                      SelectionDAG &DAG) const override;
218893Sdim
288943Sdim    unsigned
288943Sdim    getInlineAsmMemConstraint(StringRef ConstraintCode) const override {
      // Map the constraint codes "i", "o", "v" and "X" to the matching
      // InlineAsm::Constraint_* value; any other code is forwarded to
      // TargetLowering::getInlineAsmMemConstraint.
288943Sdim      if (ConstraintCode == "i")
288943Sdim        return InlineAsm::Constraint_i;
288943Sdim      else if (ConstraintCode == "o")
288943Sdim        return InlineAsm::Constraint_o;
288943Sdim      else if (ConstraintCode == "v")
288943Sdim        return InlineAsm::Constraint_v;
288943Sdim      else if (ConstraintCode == "X")
288943Sdim        return InlineAsm::Constraint_X;
288943Sdim      return TargetLowering::getInlineAsmMemConstraint(ConstraintCode);
288943Sdim    }
288943Sdim
280031Sdim    /// Given a physical register constraint
193323Sed    /// (e.g. {edx}), return the register number and the register class for the
193323Sed    /// register.  This should only be used for C_Register constraints.  On
193323Sed    /// error, this returns a register number of 0.
288943Sdim    std::pair<unsigned, const TargetRegisterClass *>
288943Sdim    getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI,
288943Sdim                                 StringRef Constraint, MVT VT) const override;
218893Sdim
280031Sdim    /// Return true if the addressing mode represented
193323Sed    /// by AM is legal for this target, for a load/store of the specified type.
288943Sdim    bool isLegalAddressingMode(const DataLayout &DL, const AddrMode &AM,
288943Sdim                               Type *Ty, unsigned AS) const override;
193323Sed
280031Sdim    /// Return true if the specified immediate is a legal
239462Sdim    /// icmp immediate, that is, the target has icmp instructions which can
239462Sdim    /// compare a register against the immediate without having to materialize
239462Sdim    /// the immediate into a register.
276479Sdim    bool isLegalICmpImmediate(int64_t Imm) const override;
239462Sdim
280031Sdim    /// Return true if the specified immediate is a legal
239462Sdim    /// add immediate, that is, the target has add instructions which can
239462Sdim    /// add a register and the immediate without having to materialize
239462Sdim    /// the immediate into a register.
276479Sdim    bool isLegalAddImmediate(int64_t Imm) const override;
239462Sdim
276479Sdim    /// \brief Return the cost of the scaling factor used in the addressing
276479Sdim    /// mode represented by AM for this target, for a load/store
276479Sdim    /// of the specified type.
276479Sdim    /// If the AM is supported, the return value must be >= 0.
276479Sdim    /// If the AM is not supported, it returns a negative value.
288943Sdim    int getScalingFactorCost(const DataLayout &DL, const AddrMode &AM, Type *Ty,
288943Sdim                             unsigned AS) const override;
276479Sdim
276479Sdim    bool isVectorShiftByScalarCheap(Type *Ty) const override;
276479Sdim
280031Sdim    /// Return true if it's free to truncate a value of
193323Sed    /// type Ty1 to type Ty2. e.g. On x86 it's free to truncate a i32 value in
193323Sed    /// register EAX to i16 by referencing its sub-register AX.
276479Sdim    bool isTruncateFree(Type *Ty1, Type *Ty2) const override;
276479Sdim    bool isTruncateFree(EVT VT1, EVT VT2) const override;
193323Sed
276479Sdim    bool allowTruncateForTailCall(Type *Ty1, Type *Ty2) const override;
261991Sdim
280031Sdim    /// Return true if any actual instruction that defines a
193323Sed    /// value of type Ty1 implicitly zero-extends the value to Ty2 in the result
193323Sed    /// register. This does not necessarily include registers defined in
193323Sed    /// unknown ways, such as incoming arguments, or copies from unknown
193323Sed    /// virtual registers. Also, if isTruncateFree(Ty2, Ty1) is true, this
193323Sed    /// does not necessarily apply to truncate instructions. e.g. on x86-64,
193323Sed    /// all instructions that define 32-bit values implicitly zero-extend the
193323Sed    /// result out to 64 bits.
276479Sdim    bool isZExtFree(Type *Ty1, Type *Ty2) const override;
276479Sdim    bool isZExtFree(EVT VT1, EVT VT2) const override;
276479Sdim    bool isZExtFree(SDValue Val, EVT VT2) const override;
193323Sed
288943Sdim    /// Return true if folding a vector load into ExtVal (a sign, zero, or any
288943Sdim    /// extend node) is profitable.
288943Sdim    bool isVectorLoadExtDesirable(SDValue) const override;
288943Sdim
280031Sdim    /// Return true if an FMA operation is faster than a pair of fmul and fadd
280031Sdim    /// instructions. fmuladd intrinsics will be expanded to FMAs when this
280031Sdim    /// method returns true, otherwise fmuladd is expanded to fmul + fadd.
276479Sdim    bool isFMAFasterThanFMulAndFAdd(EVT VT) const override;
239462Sdim
280031Sdim    /// Return true if it's profitable to narrow
193323Sed    /// operations of type VT1 to VT2. e.g. on x86, it's profitable to narrow
193323Sed    /// from i32 to i8 but not from i32 to i16.
276479Sdim    bool isNarrowingProfitable(EVT VT1, EVT VT2) const override;
193323Sed
296417Sdim    /// Given an intrinsic, checks if on the target the intrinsic will need to map
296417Sdim    /// to a MemIntrinsicNode (touches memory). If this is the case, it returns
296417Sdim    /// true and stores the intrinsic information into the IntrinsicInfo that was
296417Sdim    /// passed to the function.
296417Sdim    bool getTgtMemIntrinsic(IntrinsicInfo &Info, const CallInst &I,
296417Sdim                            unsigned Intrinsic) const override;
296417Sdim
280031Sdim    /// Returns true if the target can instruction select the
198892Srdivacky    /// specified FP immediate natively. If false, the legalizer will
198892Srdivacky    /// materialize the FP immediate as a load from a constant pool.
276479Sdim    bool isFPImmLegal(const APFloat &Imm, EVT VT) const override;
198892Srdivacky
280031Sdim    /// Targets can use this to indicate that they only support *some*
280031Sdim    /// VECTOR_SHUFFLE operations, those with specific masks. By default, if a
280031Sdim    /// target supports the VECTOR_SHUFFLE node, all mask values are assumed to
280031Sdim    /// be legal.
276479Sdim    bool isShuffleMaskLegal(const SmallVectorImpl<int> &Mask,
276479Sdim                            EVT VT) const override;
193323Sed
280031Sdim    /// Similar to isShuffleMaskLegal. Targets can use this to indicate if
280031Sdim    /// there is a suitable VECTOR_SHUFFLE that can be used to replace a VAND
280031Sdim    /// with a constant pool entry.
276479Sdim    bool isVectorClearMaskLegal(const SmallVectorImpl<int> &Mask,
276479Sdim                                EVT VT) const override;
193323Sed
280031Sdim    /// If true, then instruction selection should
193323Sed    /// seek to shrink the FP constant of the specified type to a smaller type
193323Sed    /// in order to save space and / or reduce runtime.
    /// Returns true when X86ScalarSSEf64 is false or when VT is MVT::f80.
276479Sdim    bool ShouldShrinkFPConstant(EVT VT) const override {
193323Sed      // Don't shrink FP constpool if SSE2 is available since cvtss2sd is more
193323Sed      // expensive than a straight movsd. On the other hand, it's important to
193323Sed      // shrink long double fp constant since fldt is very slow.
193323Sed      return !X86ScalarSSEf64 || VT == MVT::f80;
193323Sed    }
218893Sdim
280031Sdim    /// Return true if we believe it is correct and profitable to reduce the
280031Sdim    /// load node to a smaller type.
280031Sdim    bool shouldReduceLoadWidth(SDNode *Load, ISD::LoadExtType ExtTy,
280031Sdim                               EVT NewVT) const override;
280031Sdim
280031Sdim    /// Return true if the specified scalar FP type is computed in an SSE
280031Sdim    /// register, not on the X87 floating point stack.
    /// That is: f64 when X86ScalarSSEf64 is set, f32 when X86ScalarSSEf32 is
    /// set; every other VT yields false.
198090Srdivacky    bool isScalarFPTypeInSSEReg(EVT VT) const {
193323Sed      return (VT == MVT::f64 && X86ScalarSSEf64) || // f64 is when SSE2
296417Sdim             (VT == MVT::f32 && X86ScalarSSEf32);   // f32 is when SSE1
193323Sed    }
193323Sed
276479Sdim    /// \brief Returns true if it is beneficial to convert a load of a constant
276479Sdim    /// to just the constant itself.
276479Sdim    bool shouldConvertConstantLoadToIntImm(const APInt &Imm,
276479Sdim                                           Type *Ty) const override;
276479Sdim
280031Sdim    /// Return true if EXTRACT_SUBVECTOR is cheap for this result type
280031Sdim    /// with this index.
280031Sdim    bool isExtractSubvectorCheap(EVT ResVT, unsigned Index) const override;
280031Sdim
276479Sdim    /// Intel processors have a unified instruction and data cache, so no
    /// cache-clearing builtin is named here: this override returns nullptr.
276479Sdim    const char * getClearCacheBuiltinName() const override {
276479Sdim      return nullptr; // nothing to do, move along.
276479Sdim    }
276479Sdim
288943Sdim    unsigned getRegisterByName(const char* RegName, EVT VT,
288943Sdim                               SelectionDAG &DAG) const override;
276479Sdim
296417Sdim    /// If a physical register, this returns the register that receives the
296417Sdim    /// exception address on entry to an EH pad.
296417Sdim    unsigned
296417Sdim    getExceptionPointerRegister(const Constant *PersonalityFn) const override;
296417Sdim
296417Sdim    /// If a physical register, this returns the register that receives the
296417Sdim    /// exception typeid on entry to a landing pad.
296417Sdim    unsigned
296417Sdim    getExceptionSelectorRegister(const Constant *PersonalityFn) const override;
296417Sdim
280031Sdim    /// This method returns a target specific FastISel object,
193323Sed    /// or null if the target does not support "fast" ISel.
276479Sdim    FastISel *createFastISel(FunctionLoweringInfo &funcInfo,
276479Sdim                             const TargetLibraryInfo *libInfo) const override;
195340Sed
280031Sdim    /// Return true if the target stores stack protector cookies at a fixed
280031Sdim    /// offset in some non-standard address space, and populates the address
280031Sdim    /// space and offset as appropriate.
276479Sdim    bool getStackCookieLocation(unsigned &AddressSpace,
276479Sdim                                unsigned &Offset) const override;
210299Sed
296417Sdim    /// Return the location of the SafeStack pointer as a Value, for targets
296417Sdim    /// that store it at a fixed offset in some non-standard address space.
296417Sdim    /// NOTE(review): the result for other targets is not visible here - confirm.
296417Sdim    Value *getSafeStackPointerLocation(IRBuilder<> &IRB) const override;
296417Sdim
223017Sdim    SDValue BuildFILD(SDValue Op, EVT SrcVT, SDValue Chain, SDValue StackSlot,
223017Sdim                      SelectionDAG &DAG) const;
223017Sdim
276479Sdim    bool isNoopAddrSpaceCast(unsigned SrcAS, unsigned DestAS) const override;
261991Sdim
280031Sdim    bool useLoadStackGuardNode() const override;
276479Sdim    /// \brief Customize the preferred legalization strategy for certain types.
276479Sdim    LegalizeTypeAction getPreferredVectorAction(EVT VT) const override;
276479Sdim
296417Sdim    bool isIntDivCheap(EVT VT, AttributeSet Attr) const override;
296417Sdim
212904Sdim  protected:
288943Sdim    std::pair<const TargetRegisterClass *, uint8_t>
288943Sdim    findRepresentativeClass(const TargetRegisterInfo *TRI,
288943Sdim                            MVT VT) const override;
212904Sdim
193323Sed  private:
280031Sdim    /// Keep a pointer to the X86Subtarget around so that we can
193323Sed    /// make the right decision when generating code for different targets.
193323Sed    const X86Subtarget *Subtarget;
193323Sed
280031Sdim    /// Select between SSE or x87 floating point ops.
193323Sed    /// When SSE is available, use it for f32 operations.
193323Sed    /// When SSE2 is available, use it for f64 operations.
193323Sed    bool X86ScalarSSEf32;
193323Sed    bool X86ScalarSSEf64;
193323Sed
280031Sdim    /// A list of legal FP immediates.
198892Srdivacky    std::vector<APFloat> LegalFPImmediates;
198892Srdivacky
280031Sdim    /// Indicate that this x86 target can instruction
198892Srdivacky    /// select the specified FP immediate natively.
    /// Appends a copy of Imm to the LegalFPImmediates list.
198892Srdivacky    void addLegalFPImmediate(const APFloat& Imm) {
198892Srdivacky      LegalFPImmediates.push_back(Imm);
198892Srdivacky    }
198892Srdivacky
198090Srdivacky    SDValue LowerCallResult(SDValue Chain, SDValue InFlag,
198090Srdivacky                            CallingConv::ID CallConv, bool isVarArg,
198090Srdivacky                            const SmallVectorImpl<ISD::InputArg> &Ins,
261991Sdim                            SDLoc dl, SelectionDAG &DAG,
207618Srdivacky                            SmallVectorImpl<SDValue> &InVals) const;
198090Srdivacky    SDValue LowerMemArgument(SDValue Chain,
198090Srdivacky                             CallingConv::ID CallConv,
198090Srdivacky                             const SmallVectorImpl<ISD::InputArg> &ArgInfo,
261991Sdim                             SDLoc dl, SelectionDAG &DAG,
198090Srdivacky                             const CCValAssign &VA,  MachineFrameInfo *MFI,
207618Srdivacky                              unsigned i) const;
198090Srdivacky    SDValue LowerMemOpCallTo(SDValue Chain, SDValue StackPtr, SDValue Arg,
261991Sdim                             SDLoc dl, SelectionDAG &DAG,
198090Srdivacky                             const CCValAssign &VA,
207618Srdivacky                             ISD::ArgFlagsTy Flags) const;
193323Sed
193323Sed    // Call lowering helpers.
203954Srdivacky
280031Sdim    /// Check whether the call is eligible for tail call optimization. Targets
280031Sdim    /// that want to do tail call optimization should implement this function.
203954Srdivacky    bool IsEligibleForTailCallOptimization(SDValue Callee,
203954Srdivacky                                           CallingConv::ID CalleeCC,
203954Srdivacky                                           bool isVarArg,
205218Srdivacky                                           bool isCalleeStructRet,
205218Srdivacky                                           bool isCallerStructRet,
243830Sdim                                           Type *RetTy,
203954Srdivacky                                    const SmallVectorImpl<ISD::OutputArg> &Outs,
210299Sed                                    const SmallVectorImpl<SDValue> &OutVals,
203954Srdivacky                                    const SmallVectorImpl<ISD::InputArg> &Ins,
203954Srdivacky                                           SelectionDAG& DAG) const;
193323Sed    SDValue EmitTailCallLoadRetAddr(SelectionDAG &DAG, SDValue &OutRetAddr,
193323Sed                                SDValue Chain, bool IsTailCall, bool Is64Bit,
261991Sdim                                int FPDiff, SDLoc dl) const;
193323Sed
207618Srdivacky    unsigned GetAlignedArgumentStackSize(unsigned StackSize,
207618Srdivacky                                         SelectionDAG &DAG) const;
193323Sed
193323Sed    std::pair<SDValue,SDValue> FP_TO_INTHelper(SDValue Op, SelectionDAG &DAG,
234353Sdim                                               bool isSigned,
234353Sdim                                               bool isReplace) const;
200581Srdivacky
207618Srdivacky    SDValue LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) const;
261991Sdim    SDValue LowerBUILD_VECTORvXi1(SDValue Op, SelectionDAG &DAG) const;
276479Sdim    SDValue LowerVSELECT(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const;
276479Sdim    SDValue ExtractBitFromMaskVector(SDValue Op, SelectionDAG &DAG) const;
276479Sdim    SDValue InsertBitToMaskVector(SDValue Op, SelectionDAG &DAG) const;
276479Sdim
207618Srdivacky    SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerConstantPool(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerBlockAddress(SDValue Op, SelectionDAG &DAG) const;
261991Sdim    SDValue LowerGlobalAddress(const GlobalValue *GV, SDLoc dl,
193323Sed                               int64_t Offset, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerGlobalAddress(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerExternalSymbol(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerSINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerUINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerUINT_TO_FP_i64(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerUINT_TO_FP_i32(SDValue Op, SelectionDAG &DAG) const;
243830Sdim    SDValue lowerUINT_TO_FP_vec(SDValue Op, SelectionDAG &DAG) const;
249423Sdim    SDValue LowerTRUNCATE(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerFP_TO_SINT(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerFP_TO_UINT(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerToBT(SDValue And, ISD::CondCode CC,
261991Sdim                      SDLoc dl, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerSETCC(SDValue Op, SelectionDAG &DAG) const;
296417Sdim    SDValue LowerSETCCE(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerSELECT(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerBRCOND(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerJumpTable(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerVASTART(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerVAARG(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerRETURNADDR(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerFRAMEADDR(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerFRAME_TO_ARGS_OFFSET(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerEH_RETURN(SDValue Op, SelectionDAG &DAG) const;
243830Sdim    SDValue lowerEH_SJLJ_SETJMP(SDValue Op, SelectionDAG &DAG) const;
243830Sdim    SDValue lowerEH_SJLJ_LONGJMP(SDValue Op, SelectionDAG &DAG) const;
226633Sdim    SDValue LowerINIT_TRAMPOLINE(SDValue Op, SelectionDAG &DAG) const;
207618Srdivacky    SDValue LowerFLT_ROUNDS_(SDValue Op, SelectionDAG &DAG) const;
276479Sdim    SDValue LowerWin64_i128OP(SDValue Op, SelectionDAG &DAG) const;
288943Sdim    SDValue LowerGC_TRANSITION_START(SDValue Op, SelectionDAG &DAG) const;
288943Sdim    SDValue LowerGC_TRANSITION_END(SDValue Op, SelectionDAG &DAG) const;
193323Sed
276479Sdim    SDValue
198090Srdivacky      LowerFormalArguments(SDValue Chain,
198090Srdivacky                           CallingConv::ID CallConv, bool isVarArg,
198090Srdivacky                           const SmallVectorImpl<ISD::InputArg> &Ins,
261991Sdim                           SDLoc dl, SelectionDAG &DAG,
276479Sdim                           SmallVectorImpl<SDValue> &InVals) const override;
276479Sdim    SDValue LowerCall(CallLoweringInfo &CLI,
276479Sdim                      SmallVectorImpl<SDValue> &InVals) const override;
198090Srdivacky
276479Sdim    SDValue LowerReturn(SDValue Chain,
276479Sdim                        CallingConv::ID CallConv, bool isVarArg,
276479Sdim                        const SmallVectorImpl<ISD::OutputArg> &Outs,
276479Sdim                        const SmallVectorImpl<SDValue> &OutVals,
276479Sdim                        SDLoc dl, SelectionDAG &DAG) const override;
198090Srdivacky
296417Sdim    bool supportSplitCSR(MachineFunction *MF) const override {
      // True only when MF's function uses the CXX_FAST_TLS calling convention
      // and also carries the NoUnwind function attribute.
296417Sdim      return MF->getFunction()->getCallingConv() == CallingConv::CXX_FAST_TLS &&
296417Sdim          MF->getFunction()->hasFnAttribute(Attribute::NoUnwind);
296417Sdim    }
296417Sdim    void initializeSplitCSR(MachineBasicBlock *Entry) const override;
296417Sdim    void insertCopiesSplitCSR(
296417Sdim      MachineBasicBlock *Entry,
296417Sdim      const SmallVectorImpl<MachineBasicBlock *> &Exits) const override;
296417Sdim
276479Sdim    bool isUsedByReturnOnly(SDNode *N, SDValue &Chain) const override;
218893Sdim
276479Sdim    bool mayBeEmittedAsTailCall(CallInst *CI) const override;
221345Sdim
280031Sdim    EVT getTypeForExtArgOrReturn(LLVMContext &Context, EVT VT,
276479Sdim                                 ISD::NodeType ExtendKind) const override;
221345Sdim
276479Sdim    bool CanLowerReturn(CallingConv::ID CallConv, MachineFunction &MF,
276479Sdim                        bool isVarArg,
276479Sdim                        const SmallVectorImpl<ISD::OutputArg> &Outs,
276479Sdim                        LLVMContext &Context) const override;
199481Srdivacky
276479Sdim    const MCPhysReg *getScratchRegisters(CallingConv::ID CC) const override;
261991Sdim
296417Sdim    TargetLoweringBase::AtomicExpansionKind
296417Sdim    shouldExpandAtomicLoadInIR(LoadInst *SI) const override;
280031Sdim    bool shouldExpandAtomicStoreInIR(StoreInst *SI) const override;
296417Sdim    TargetLoweringBase::AtomicExpansionKind
288943Sdim    shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override;
280031Sdim
280031Sdim    LoadInst *
280031Sdim    lowerIdempotentRMWIntoFencedLoad(AtomicRMWInst *AI) const override;
280031Sdim
296417Sdim    bool needsCmpXchgNb(Type *MemType) const;
280031Sdim
218893Sdim    /// Utility function to emit the low-level va_arg code for X86-64.
218893Sdim    MachineBasicBlock *EmitVAARG64WithCustomInserter(
218893Sdim                       MachineInstr *MI,
218893Sdim                       MachineBasicBlock *MBB) const;
218893Sdim
198090Srdivacky    /// Utility function to emit the xmm reg save portion of va_start.
198090Srdivacky    MachineBasicBlock *EmitVAStartSaveXMMRegsWithCustomInserter(
198090Srdivacky                                                   MachineInstr *BInstr,
198090Srdivacky                                                   MachineBasicBlock *BB) const;
198090Srdivacky
198090Srdivacky    MachineBasicBlock *EmitLoweredSelect(MachineInstr *I,
207618Srdivacky                                         MachineBasicBlock *BB) const;
204961Srdivacky
296417Sdim    MachineBasicBlock *EmitLoweredAtomicFP(MachineInstr *I,
296417Sdim                                           MachineBasicBlock *BB) const;
296417Sdim
218893Sdim    MachineBasicBlock *EmitLoweredWinAlloca(MachineInstr *MI,
207618Srdivacky                                              MachineBasicBlock *BB) const;
218893Sdim
296417Sdim    MachineBasicBlock *EmitLoweredCatchRet(MachineInstr *MI,
296417Sdim                                           MachineBasicBlock *BB) const;
296417Sdim
296417Sdim    MachineBasicBlock *EmitLoweredCatchPad(MachineInstr *MI,
296417Sdim                                           MachineBasicBlock *BB) const;
296417Sdim
226633Sdim    MachineBasicBlock *EmitLoweredSegAlloca(MachineInstr *MI,
280031Sdim                                            MachineBasicBlock *BB) const;
226633Sdim
296417Sdim    MachineBasicBlock *EmitLoweredTLSAddr(MachineInstr *MI,
210299Sed                                          MachineBasicBlock *BB) const;
204961Srdivacky
296417Sdim    MachineBasicBlock *EmitLoweredTLSCall(MachineInstr *MI,
218893Sdim                                          MachineBasicBlock *BB) const;
218893Sdim
243830Sdim    MachineBasicBlock *emitEHSjLjSetJmp(MachineInstr *MI,
243830Sdim                                        MachineBasicBlock *MBB) const;
243830Sdim
243830Sdim    MachineBasicBlock *emitEHSjLjLongJmp(MachineInstr *MI,
243830Sdim                                         MachineBasicBlock *MBB) const;
243830Sdim
276479Sdim    MachineBasicBlock *emitFMA3Instr(MachineInstr *MI,
276479Sdim                                     MachineBasicBlock *MBB) const;
276479Sdim
193323Sed    /// Emit nodes that will be selected as "test Op0,Op0", or something
193323Sed    /// equivalent, for use with the given x86 condition code.
276479Sdim    SDValue EmitTest(SDValue Op0, unsigned X86CC, SDLoc dl,
276479Sdim                     SelectionDAG &DAG) const;
193323Sed
193323Sed    /// Emit nodes that will be selected as "cmp Op0,Op1", or something
193323Sed    /// equivalent, for use with the given x86 condition code.
276479Sdim    SDValue EmitCmp(SDValue Op0, SDValue Op1, unsigned X86CC, SDLoc dl,
207618Srdivacky                    SelectionDAG &DAG) const;
239462Sdim
239462Sdim    /// Convert a comparison if required by the subtarget.
239462Sdim    SDValue ConvertCmpIfNecessary(SDValue Cmp, SelectionDAG &DAG) const;
280031Sdim
280031Sdim    /// Use rsqrt* to speed up sqrt calculations.
280031Sdim    SDValue getRsqrtEstimate(SDValue Operand, DAGCombinerInfo &DCI,
280031Sdim                             unsigned &RefinementSteps,
280031Sdim                             bool &UseOneConstNR) const override;
280031Sdim
280031Sdim    /// Use rcp* to speed up fdiv calculations.
280031Sdim    SDValue getRecipEstimate(SDValue Operand, DAGCombinerInfo &DCI,
280031Sdim                             unsigned &RefinementSteps) const override;
288943Sdim
288943Sdim    /// Reassociate floating point divisions into multiply by reciprocal.
296417Sdim    unsigned combineRepeatedFPDivisors() const override;
193323Sed  };
193323Sed
193323Sed  namespace X86 {
    /// Namespace-scope createFastISel; only declared in this header. It takes
    /// the same arguments as the createFastISel member of the class above.
239462Sdim    FastISel *createFastISel(FunctionLoweringInfo &funcInfo,
239462Sdim                             const TargetLibraryInfo *libInfo);
193323Sed  }
193323Sed}
193323Sed
193323Sed#endif    // LLVM_LIB_TARGET_X86_X86ISELLOWERING_H