106f32e7eSjoerg //===-- PPCISelLowering.h - PPC32 DAG Lowering Interface --------*- C++ -*-===// 206f32e7eSjoerg // 306f32e7eSjoerg // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 406f32e7eSjoerg // See https://llvm.org/LICENSE.txt for license information. 506f32e7eSjoerg // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 606f32e7eSjoerg // 706f32e7eSjoerg //===----------------------------------------------------------------------===// 806f32e7eSjoerg // 906f32e7eSjoerg // This file defines the interfaces that PPC uses to lower LLVM code into a 1006f32e7eSjoerg // selection DAG. 1106f32e7eSjoerg // 1206f32e7eSjoerg //===----------------------------------------------------------------------===// 1306f32e7eSjoerg 1406f32e7eSjoerg #ifndef LLVM_LIB_TARGET_POWERPC_PPCISELLOWERING_H 1506f32e7eSjoerg #define LLVM_LIB_TARGET_POWERPC_PPCISELLOWERING_H 1606f32e7eSjoerg 1706f32e7eSjoerg #include "PPCInstrInfo.h" 1806f32e7eSjoerg #include "llvm/CodeGen/CallingConvLower.h" 1906f32e7eSjoerg #include "llvm/CodeGen/MachineFunction.h" 2006f32e7eSjoerg #include "llvm/CodeGen/MachineMemOperand.h" 2106f32e7eSjoerg #include "llvm/CodeGen/SelectionDAG.h" 2206f32e7eSjoerg #include "llvm/CodeGen/SelectionDAGNodes.h" 2306f32e7eSjoerg #include "llvm/CodeGen/TargetLowering.h" 2406f32e7eSjoerg #include "llvm/CodeGen/ValueTypes.h" 2506f32e7eSjoerg #include "llvm/IR/Attributes.h" 2606f32e7eSjoerg #include "llvm/IR/CallingConv.h" 2706f32e7eSjoerg #include "llvm/IR/Function.h" 2806f32e7eSjoerg #include "llvm/IR/InlineAsm.h" 2906f32e7eSjoerg #include "llvm/IR/Metadata.h" 3006f32e7eSjoerg #include "llvm/IR/Type.h" 3106f32e7eSjoerg #include "llvm/Support/MachineValueType.h" 3206f32e7eSjoerg #include <utility> 3306f32e7eSjoerg 3406f32e7eSjoerg namespace llvm { 3506f32e7eSjoerg 3606f32e7eSjoerg namespace PPCISD { 3706f32e7eSjoerg 3806f32e7eSjoerg // When adding a NEW PPCISD node please add it to the correct position in 3906f32e7eSjoerg // the enum. 
The order of elements in this enum matters! 4006f32e7eSjoerg // Values that are added after this entry: 4106f32e7eSjoerg // STBRX = ISD::FIRST_TARGET_MEMORY_OPCODE 4206f32e7eSjoerg // are considered memory opcodes and are treated differently than entries 4306f32e7eSjoerg // that come before it. For example, ADD or MUL should be placed before 4406f32e7eSjoerg // the ISD::FIRST_TARGET_MEMORY_OPCODE while a LOAD or STORE should come 4506f32e7eSjoerg // after it. 4606f32e7eSjoerg enum NodeType : unsigned { 4706f32e7eSjoerg // Start the numbering where the builtin ops and target ops leave off. 4806f32e7eSjoerg FIRST_NUMBER = ISD::BUILTIN_OP_END, 4906f32e7eSjoerg 5006f32e7eSjoerg /// FSEL - Traditional three-operand fsel node. 5106f32e7eSjoerg /// 5206f32e7eSjoerg FSEL, 5306f32e7eSjoerg 54*da58b97aSjoerg /// XSMAXCDP, XSMINCDP - C-type min/max instructions. 55*da58b97aSjoerg XSMAXCDP, 56*da58b97aSjoerg XSMINCDP, 57*da58b97aSjoerg 5806f32e7eSjoerg /// FCFID - The FCFID instruction, taking an f64 operand and producing 5906f32e7eSjoerg /// and f64 value containing the FP representation of the integer that 6006f32e7eSjoerg /// was temporarily in the f64 operand. 6106f32e7eSjoerg FCFID, 6206f32e7eSjoerg 6306f32e7eSjoerg /// Newer FCFID[US] integer-to-floating-point conversion instructions for 6406f32e7eSjoerg /// unsigned integers and single-precision outputs. 65*da58b97aSjoerg FCFIDU, 66*da58b97aSjoerg FCFIDS, 67*da58b97aSjoerg FCFIDUS, 6806f32e7eSjoerg 6906f32e7eSjoerg /// FCTI[D,W]Z - The FCTIDZ and FCTIWZ instructions, taking an f32 or f64 7006f32e7eSjoerg /// operand, producing an f64 value containing the integer representation 7106f32e7eSjoerg /// of that FP value. 72*da58b97aSjoerg FCTIDZ, 73*da58b97aSjoerg FCTIWZ, 7406f32e7eSjoerg 7506f32e7eSjoerg /// Newer FCTI[D,W]UZ floating-point-to-integer conversion instructions for 7606f32e7eSjoerg /// unsigned integers with round toward zero. 
77*da58b97aSjoerg FCTIDUZ, 78*da58b97aSjoerg FCTIWUZ, 7906f32e7eSjoerg 8006f32e7eSjoerg /// Floating-point-to-interger conversion instructions 81*da58b97aSjoerg FP_TO_UINT_IN_VSR, 82*da58b97aSjoerg FP_TO_SINT_IN_VSR, 8306f32e7eSjoerg 8406f32e7eSjoerg /// VEXTS, ByteWidth - takes an input in VSFRC and produces an output in 8506f32e7eSjoerg /// VSFRC that is sign-extended from ByteWidth to a 64-byte integer. 8606f32e7eSjoerg VEXTS, 8706f32e7eSjoerg 8806f32e7eSjoerg /// Reciprocal estimate instructions (unary FP ops). 89*da58b97aSjoerg FRE, 90*da58b97aSjoerg FRSQRTE, 9106f32e7eSjoerg 92*da58b97aSjoerg /// Test instruction for software square root. 93*da58b97aSjoerg FTSQRT, 94*da58b97aSjoerg 95*da58b97aSjoerg /// Square root instruction. 96*da58b97aSjoerg FSQRT, 9706f32e7eSjoerg 9806f32e7eSjoerg /// VPERM - The PPC VPERM Instruction. 9906f32e7eSjoerg /// 10006f32e7eSjoerg VPERM, 10106f32e7eSjoerg 10206f32e7eSjoerg /// XXSPLT - The PPC VSX splat instructions 10306f32e7eSjoerg /// 10406f32e7eSjoerg XXSPLT, 10506f32e7eSjoerg 106*da58b97aSjoerg /// XXSPLTI_SP_TO_DP - The PPC VSX splat instructions for immediates for 107*da58b97aSjoerg /// converting immediate single precision numbers to double precision 108*da58b97aSjoerg /// vector or scalar. 109*da58b97aSjoerg XXSPLTI_SP_TO_DP, 110*da58b97aSjoerg 111*da58b97aSjoerg /// XXSPLTI32DX - The PPC XXSPLTI32DX instruction. 112*da58b97aSjoerg /// 113*da58b97aSjoerg XXSPLTI32DX, 114*da58b97aSjoerg 11506f32e7eSjoerg /// VECINSERT - The PPC vector insert instruction 11606f32e7eSjoerg /// 11706f32e7eSjoerg VECINSERT, 11806f32e7eSjoerg 11906f32e7eSjoerg /// VECSHL - The PPC vector shift left instruction 12006f32e7eSjoerg /// 12106f32e7eSjoerg VECSHL, 12206f32e7eSjoerg 12306f32e7eSjoerg /// XXPERMDI - The PPC XXPERMDI instruction 12406f32e7eSjoerg /// 12506f32e7eSjoerg XXPERMDI, 12606f32e7eSjoerg 12706f32e7eSjoerg /// The CMPB instruction (takes two operands of i32 or i64). 
12806f32e7eSjoerg CMPB, 12906f32e7eSjoerg 13006f32e7eSjoerg /// Hi/Lo - These represent the high and low 16-bit parts of a global 13106f32e7eSjoerg /// address respectively. These nodes have two operands, the first of 13206f32e7eSjoerg /// which must be a TargetGlobalAddress, and the second of which must be a 13306f32e7eSjoerg /// Constant. Selected naively, these turn into 'lis G+C' and 'li G+C', 13406f32e7eSjoerg /// though these are usually folded into other nodes. 135*da58b97aSjoerg Hi, 136*da58b97aSjoerg Lo, 13706f32e7eSjoerg 13806f32e7eSjoerg /// The following two target-specific nodes are used for calls through 13906f32e7eSjoerg /// function pointers in the 64-bit SVR4 ABI. 14006f32e7eSjoerg 14106f32e7eSjoerg /// OPRC, CHAIN = DYNALLOC(CHAIN, NEGSIZE, FRAME_INDEX) 14206f32e7eSjoerg /// This instruction is lowered in PPCRegisterInfo::eliminateFrameIndex to 14306f32e7eSjoerg /// compute an allocation on the stack. 14406f32e7eSjoerg DYNALLOC, 14506f32e7eSjoerg 14606f32e7eSjoerg /// This instruction is lowered in PPCRegisterInfo::eliminateFrameIndex to 14706f32e7eSjoerg /// compute an offset from native SP to the address of the most recent 14806f32e7eSjoerg /// dynamic alloca. 14906f32e7eSjoerg DYNAREAOFFSET, 15006f32e7eSjoerg 151*da58b97aSjoerg /// To avoid stack clash, allocation is performed by block and each block is 152*da58b97aSjoerg /// probed. 153*da58b97aSjoerg PROBED_ALLOCA, 154*da58b97aSjoerg 155*da58b97aSjoerg /// The result of the mflr at function entry, used for PIC code. 15606f32e7eSjoerg GlobalBaseReg, 15706f32e7eSjoerg 15806f32e7eSjoerg /// These nodes represent PPC shifts. 15906f32e7eSjoerg /// 16006f32e7eSjoerg /// For scalar types, only the last `n + 1` bits of the shift amounts 16106f32e7eSjoerg /// are used, where n is log2(sizeof(element) * 8). See sld/slw, etc. 16206f32e7eSjoerg /// for exact behaviors. 16306f32e7eSjoerg /// 16406f32e7eSjoerg /// For vector types, only the last n bits are used. See vsld. 
165*da58b97aSjoerg SRL, 166*da58b97aSjoerg SRA, 167*da58b97aSjoerg SHL, 168*da58b97aSjoerg 169*da58b97aSjoerg /// FNMSUB - Negated multiply-subtract instruction. 170*da58b97aSjoerg FNMSUB, 17106f32e7eSjoerg 17206f32e7eSjoerg /// EXTSWSLI = The PPC extswsli instruction, which does an extend-sign 17306f32e7eSjoerg /// word and shift left immediate. 17406f32e7eSjoerg EXTSWSLI, 17506f32e7eSjoerg 17606f32e7eSjoerg /// The combination of sra[wd]i and addze used to implemented signed 17706f32e7eSjoerg /// integer division by a power of 2. The first operand is the dividend, 17806f32e7eSjoerg /// and the second is the constant shift amount (representing the 17906f32e7eSjoerg /// divisor). 18006f32e7eSjoerg SRA_ADDZE, 18106f32e7eSjoerg 18206f32e7eSjoerg /// CALL - A direct function call. 18306f32e7eSjoerg /// CALL_NOP is a call with the special NOP which follows 64-bit 184*da58b97aSjoerg /// CALL_NOTOC the caller does not use the TOC. 18506f32e7eSjoerg /// SVR4 calls and 32-bit/64-bit AIX calls. 186*da58b97aSjoerg CALL, 187*da58b97aSjoerg CALL_NOP, 188*da58b97aSjoerg CALL_NOTOC, 18906f32e7eSjoerg 19006f32e7eSjoerg /// CHAIN,FLAG = MTCTR(VAL, CHAIN[, INFLAG]) - Directly corresponds to a 19106f32e7eSjoerg /// MTCTR instruction. 19206f32e7eSjoerg MTCTR, 19306f32e7eSjoerg 19406f32e7eSjoerg /// CHAIN,FLAG = BCTRL(CHAIN, INFLAG) - Directly corresponds to a 19506f32e7eSjoerg /// BCTRL instruction. 19606f32e7eSjoerg BCTRL, 19706f32e7eSjoerg 19806f32e7eSjoerg /// CHAIN,FLAG = BCTRL(CHAIN, ADDR, INFLAG) - The combination of a bctrl 199*da58b97aSjoerg /// instruction and the TOC reload required on 64-bit ELF, 32-bit AIX 200*da58b97aSjoerg /// and 64-bit AIX. 20106f32e7eSjoerg BCTRL_LOAD_TOC, 20206f32e7eSjoerg 20306f32e7eSjoerg /// Return with a flag operand, matched by 'blr' 20406f32e7eSjoerg RET_FLAG, 20506f32e7eSjoerg 20606f32e7eSjoerg /// R32 = MFOCRF(CRREG, INFLAG) - Represents the MFOCRF instruction. 
20706f32e7eSjoerg /// This copies the bits corresponding to the specified CRREG into the 20806f32e7eSjoerg /// resultant GPR. Bits corresponding to other CR regs are undefined. 20906f32e7eSjoerg MFOCRF, 21006f32e7eSjoerg 21106f32e7eSjoerg /// Direct move from a VSX register to a GPR 21206f32e7eSjoerg MFVSR, 21306f32e7eSjoerg 21406f32e7eSjoerg /// Direct move from a GPR to a VSX register (algebraic) 21506f32e7eSjoerg MTVSRA, 21606f32e7eSjoerg 21706f32e7eSjoerg /// Direct move from a GPR to a VSX register (zero) 21806f32e7eSjoerg MTVSRZ, 21906f32e7eSjoerg 22006f32e7eSjoerg /// Direct move of 2 consecutive GPR to a VSX register. 22106f32e7eSjoerg BUILD_FP128, 22206f32e7eSjoerg 22306f32e7eSjoerg /// BUILD_SPE64 and EXTRACT_SPE are analogous to BUILD_PAIR and 22406f32e7eSjoerg /// EXTRACT_ELEMENT but take f64 arguments instead of i64, as i64 is 22506f32e7eSjoerg /// unsupported for this target. 22606f32e7eSjoerg /// Merge 2 GPRs to a single SPE register. 22706f32e7eSjoerg BUILD_SPE64, 22806f32e7eSjoerg 22906f32e7eSjoerg /// Extract SPE register component, second argument is high or low. 23006f32e7eSjoerg EXTRACT_SPE, 23106f32e7eSjoerg 23206f32e7eSjoerg /// Extract a subvector from signed integer vector and convert to FP. 23306f32e7eSjoerg /// It is primarily used to convert a (widened) illegal integer vector 23406f32e7eSjoerg /// type to a legal floating point vector type. 23506f32e7eSjoerg /// For example v2i32 -> widened to v4i32 -> v2f64 23606f32e7eSjoerg SINT_VEC_TO_FP, 23706f32e7eSjoerg 23806f32e7eSjoerg /// Extract a subvector from unsigned integer vector and convert to FP. 23906f32e7eSjoerg /// As with SINT_VEC_TO_FP, used for converting illegal types. 24006f32e7eSjoerg UINT_VEC_TO_FP, 24106f32e7eSjoerg 242*da58b97aSjoerg /// PowerPC instructions that have SCALAR_TO_VECTOR semantics tend to 243*da58b97aSjoerg /// place the value into the least significant element of the most 244*da58b97aSjoerg /// significant doubleword in the vector. 
This is not element zero for 245*da58b97aSjoerg /// anything smaller than a doubleword on either endianness. This node has 246*da58b97aSjoerg /// the same semantics as SCALAR_TO_VECTOR except that the value remains in 247*da58b97aSjoerg /// the aforementioned location in the vector register. 248*da58b97aSjoerg SCALAR_TO_VECTOR_PERMUTED, 249*da58b97aSjoerg 25006f32e7eSjoerg // FIXME: Remove these once the ANDI glue bug is fixed: 251*da58b97aSjoerg /// i1 = ANDI_rec_1_[EQ|GT]_BIT(i32 or i64 x) - Represents the result of the 25206f32e7eSjoerg /// eq or gt bit of CR0 after executing andi. x, 1. This is used to 25306f32e7eSjoerg /// implement truncation of i32 or i64 to i1. 254*da58b97aSjoerg ANDI_rec_1_EQ_BIT, 255*da58b97aSjoerg ANDI_rec_1_GT_BIT, 25606f32e7eSjoerg 25706f32e7eSjoerg // READ_TIME_BASE - A read of the 64-bit time-base register on a 32-bit 25806f32e7eSjoerg // target (returns (Lo, Hi)). It takes a chain operand. 25906f32e7eSjoerg READ_TIME_BASE, 26006f32e7eSjoerg 26106f32e7eSjoerg // EH_SJLJ_SETJMP - SjLj exception handling setjmp. 26206f32e7eSjoerg EH_SJLJ_SETJMP, 26306f32e7eSjoerg 26406f32e7eSjoerg // EH_SJLJ_LONGJMP - SjLj exception handling longjmp. 26506f32e7eSjoerg EH_SJLJ_LONGJMP, 26606f32e7eSjoerg 26706f32e7eSjoerg /// RESVEC = VCMP(LHS, RHS, OPC) - Represents one of the altivec VCMP* 26806f32e7eSjoerg /// instructions. For lack of better number, we use the opcode number 26906f32e7eSjoerg /// encoding for the OPC field to identify the compare. For example, 838 27006f32e7eSjoerg /// is VCMPGTSH. 27106f32e7eSjoerg VCMP, 27206f32e7eSjoerg 273*da58b97aSjoerg /// RESVEC, OUTFLAG = VCMP_rec(LHS, RHS, OPC) - Represents one of the 274*da58b97aSjoerg /// altivec VCMP*_rec instructions. For lack of better number, we use the 27506f32e7eSjoerg /// opcode number encoding for the OPC field to identify the compare. For 27606f32e7eSjoerg /// example, 838 is VCMPGTSH. 
277*da58b97aSjoerg VCMP_rec, 27806f32e7eSjoerg 27906f32e7eSjoerg /// CHAIN = COND_BRANCH CHAIN, CRRC, OPC, DESTBB [, INFLAG] - This 28006f32e7eSjoerg /// corresponds to the COND_BRANCH pseudo instruction. CRRC is the 28106f32e7eSjoerg /// condition register to branch on, OPC is the branch opcode to use (e.g. 28206f32e7eSjoerg /// PPC::BLE), DESTBB is the destination block to branch to, and INFLAG is 28306f32e7eSjoerg /// an optional input flag argument. 28406f32e7eSjoerg COND_BRANCH, 28506f32e7eSjoerg 28606f32e7eSjoerg /// CHAIN = BDNZ CHAIN, DESTBB - These are used to create counter-based 28706f32e7eSjoerg /// loops. 288*da58b97aSjoerg BDNZ, 289*da58b97aSjoerg BDZ, 29006f32e7eSjoerg 29106f32e7eSjoerg /// F8RC = FADDRTZ F8RC, F8RC - This is an FADD done with rounding 29206f32e7eSjoerg /// towards zero. Used only as part of the long double-to-int 29306f32e7eSjoerg /// conversion sequence. 29406f32e7eSjoerg FADDRTZ, 29506f32e7eSjoerg 29606f32e7eSjoerg /// F8RC = MFFS - This moves the FPSCR (not modeled) into the register. 29706f32e7eSjoerg MFFS, 29806f32e7eSjoerg 29906f32e7eSjoerg /// TC_RETURN - A tail call return. 30006f32e7eSjoerg /// operand #0 chain 30106f32e7eSjoerg /// operand #1 callee (register or absolute) 30206f32e7eSjoerg /// operand #2 stack adjustment 30306f32e7eSjoerg /// operand #3 optional in flag 30406f32e7eSjoerg TC_RETURN, 30506f32e7eSjoerg 30606f32e7eSjoerg /// ch, gl = CR6[UN]SET ch, inglue - Toggle CR bit 6 for SVR4 vararg calls 30706f32e7eSjoerg CR6SET, 30806f32e7eSjoerg CR6UNSET, 30906f32e7eSjoerg 31006f32e7eSjoerg /// GPRC = address of _GLOBAL_OFFSET_TABLE_. Used by initial-exec TLS 31106f32e7eSjoerg /// for non-position independent code on PPC32. 31206f32e7eSjoerg PPC32_GOT, 31306f32e7eSjoerg 31406f32e7eSjoerg /// GPRC = address of _GLOBAL_OFFSET_TABLE_. Used by general dynamic and 31506f32e7eSjoerg /// local dynamic TLS and position indendepent code on PPC32. 
31606f32e7eSjoerg PPC32_PICGOT, 31706f32e7eSjoerg 31806f32e7eSjoerg /// G8RC = ADDIS_GOT_TPREL_HA %x2, Symbol - Used by the initial-exec 31906f32e7eSjoerg /// TLS model, produces an ADDIS8 instruction that adds the GOT 32006f32e7eSjoerg /// base to sym\@got\@tprel\@ha. 32106f32e7eSjoerg ADDIS_GOT_TPREL_HA, 32206f32e7eSjoerg 32306f32e7eSjoerg /// G8RC = LD_GOT_TPREL_L Symbol, G8RReg - Used by the initial-exec 32406f32e7eSjoerg /// TLS model, produces a LD instruction with base register G8RReg 32506f32e7eSjoerg /// and offset sym\@got\@tprel\@l. This completes the addition that 32606f32e7eSjoerg /// finds the offset of "sym" relative to the thread pointer. 32706f32e7eSjoerg LD_GOT_TPREL_L, 32806f32e7eSjoerg 32906f32e7eSjoerg /// G8RC = ADD_TLS G8RReg, Symbol - Used by the initial-exec TLS 33006f32e7eSjoerg /// model, produces an ADD instruction that adds the contents of 33106f32e7eSjoerg /// G8RReg to the thread pointer. Symbol contains a relocation 33206f32e7eSjoerg /// sym\@tls which is to be replaced by the thread pointer and 33306f32e7eSjoerg /// identifies to the linker that the instruction is part of a 33406f32e7eSjoerg /// TLS sequence. 33506f32e7eSjoerg ADD_TLS, 33606f32e7eSjoerg 33706f32e7eSjoerg /// G8RC = ADDIS_TLSGD_HA %x2, Symbol - For the general-dynamic TLS 33806f32e7eSjoerg /// model, produces an ADDIS8 instruction that adds the GOT base 33906f32e7eSjoerg /// register to sym\@got\@tlsgd\@ha. 34006f32e7eSjoerg ADDIS_TLSGD_HA, 34106f32e7eSjoerg 34206f32e7eSjoerg /// %x3 = ADDI_TLSGD_L G8RReg, Symbol - For the general-dynamic TLS 34306f32e7eSjoerg /// model, produces an ADDI8 instruction that adds G8RReg to 34406f32e7eSjoerg /// sym\@got\@tlsgd\@l and stores the result in X3. Hidden by 34506f32e7eSjoerg /// ADDIS_TLSGD_L_ADDR until after register assignment. 
34606f32e7eSjoerg ADDI_TLSGD_L, 34706f32e7eSjoerg 34806f32e7eSjoerg /// %x3 = GET_TLS_ADDR %x3, Symbol - For the general-dynamic TLS 34906f32e7eSjoerg /// model, produces a call to __tls_get_addr(sym\@tlsgd). Hidden by 35006f32e7eSjoerg /// ADDIS_TLSGD_L_ADDR until after register assignment. 35106f32e7eSjoerg GET_TLS_ADDR, 35206f32e7eSjoerg 35306f32e7eSjoerg /// G8RC = ADDI_TLSGD_L_ADDR G8RReg, Symbol, Symbol - Op that 35406f32e7eSjoerg /// combines ADDI_TLSGD_L and GET_TLS_ADDR until expansion following 35506f32e7eSjoerg /// register assignment. 35606f32e7eSjoerg ADDI_TLSGD_L_ADDR, 35706f32e7eSjoerg 358*da58b97aSjoerg /// GPRC = TLSGD_AIX, TOC_ENTRY, TOC_ENTRY 359*da58b97aSjoerg /// G8RC = TLSGD_AIX, TOC_ENTRY, TOC_ENTRY 360*da58b97aSjoerg /// Op that combines two register copies of TOC entries 361*da58b97aSjoerg /// (region handle into R3 and variable offset into R4) followed by a 362*da58b97aSjoerg /// GET_TLS_ADDR node which will be expanded to a call to __get_tls_addr. 363*da58b97aSjoerg /// This node is used in 64-bit mode as well (in which case the result is 364*da58b97aSjoerg /// G8RC and inputs are X3/X4). 365*da58b97aSjoerg TLSGD_AIX, 366*da58b97aSjoerg 36706f32e7eSjoerg /// G8RC = ADDIS_TLSLD_HA %x2, Symbol - For the local-dynamic TLS 36806f32e7eSjoerg /// model, produces an ADDIS8 instruction that adds the GOT base 36906f32e7eSjoerg /// register to sym\@got\@tlsld\@ha. 37006f32e7eSjoerg ADDIS_TLSLD_HA, 37106f32e7eSjoerg 37206f32e7eSjoerg /// %x3 = ADDI_TLSLD_L G8RReg, Symbol - For the local-dynamic TLS 37306f32e7eSjoerg /// model, produces an ADDI8 instruction that adds G8RReg to 37406f32e7eSjoerg /// sym\@got\@tlsld\@l and stores the result in X3. Hidden by 37506f32e7eSjoerg /// ADDIS_TLSLD_L_ADDR until after register assignment. 37606f32e7eSjoerg ADDI_TLSLD_L, 37706f32e7eSjoerg 37806f32e7eSjoerg /// %x3 = GET_TLSLD_ADDR %x3, Symbol - For the local-dynamic TLS 37906f32e7eSjoerg /// model, produces a call to __tls_get_addr(sym\@tlsld). 
Hidden by 38006f32e7eSjoerg /// ADDIS_TLSLD_L_ADDR until after register assignment. 38106f32e7eSjoerg GET_TLSLD_ADDR, 38206f32e7eSjoerg 38306f32e7eSjoerg /// G8RC = ADDI_TLSLD_L_ADDR G8RReg, Symbol, Symbol - Op that 38406f32e7eSjoerg /// combines ADDI_TLSLD_L and GET_TLSLD_ADDR until expansion 38506f32e7eSjoerg /// following register assignment. 38606f32e7eSjoerg ADDI_TLSLD_L_ADDR, 38706f32e7eSjoerg 38806f32e7eSjoerg /// G8RC = ADDIS_DTPREL_HA %x3, Symbol - For the local-dynamic TLS 38906f32e7eSjoerg /// model, produces an ADDIS8 instruction that adds X3 to 39006f32e7eSjoerg /// sym\@dtprel\@ha. 39106f32e7eSjoerg ADDIS_DTPREL_HA, 39206f32e7eSjoerg 39306f32e7eSjoerg /// G8RC = ADDI_DTPREL_L G8RReg, Symbol - For the local-dynamic TLS 39406f32e7eSjoerg /// model, produces an ADDI8 instruction that adds G8RReg to 39506f32e7eSjoerg /// sym\@got\@dtprel\@l. 39606f32e7eSjoerg ADDI_DTPREL_L, 39706f32e7eSjoerg 398*da58b97aSjoerg /// G8RC = PADDI_DTPREL %x3, Symbol - For the pc-rel based local-dynamic TLS 399*da58b97aSjoerg /// model, produces a PADDI8 instruction that adds X3 to sym\@dtprel. 400*da58b97aSjoerg PADDI_DTPREL, 401*da58b97aSjoerg 40206f32e7eSjoerg /// VRRC = VADD_SPLAT Elt, EltSize - Temporary node to be expanded 40306f32e7eSjoerg /// during instruction selection to optimize a BUILD_VECTOR into 40406f32e7eSjoerg /// operations on splats. This is necessary to avoid losing these 40506f32e7eSjoerg /// optimizations due to constant folding. 40606f32e7eSjoerg VADD_SPLAT, 40706f32e7eSjoerg 40806f32e7eSjoerg /// CHAIN = SC CHAIN, Imm128 - System call. The 7-bit unsigned 40906f32e7eSjoerg /// operand identifies the operating system entry point. 41006f32e7eSjoerg SC, 41106f32e7eSjoerg 41206f32e7eSjoerg /// CHAIN = CLRBHRB CHAIN - Clear branch history rolling buffer. 41306f32e7eSjoerg CLRBHRB, 41406f32e7eSjoerg 41506f32e7eSjoerg /// GPRC, CHAIN = MFBHRBE CHAIN, Entry, Dummy - Move from branch 41606f32e7eSjoerg /// history rolling buffer entry. 
41706f32e7eSjoerg MFBHRBE, 41806f32e7eSjoerg 41906f32e7eSjoerg /// CHAIN = RFEBB CHAIN, State - Return from event-based branch. 42006f32e7eSjoerg RFEBB, 42106f32e7eSjoerg 42206f32e7eSjoerg /// VSRC, CHAIN = XXSWAPD CHAIN, VSRC - Occurs only for little 42306f32e7eSjoerg /// endian. Maps to an xxswapd instruction that corrects an lxvd2x 42406f32e7eSjoerg /// or stxvd2x instruction. The chain is necessary because the 42506f32e7eSjoerg /// sequence replaces a load and needs to provide the same number 42606f32e7eSjoerg /// of outputs. 42706f32e7eSjoerg XXSWAPD, 42806f32e7eSjoerg 42906f32e7eSjoerg /// An SDNode for swaps that are not associated with any loads/stores 43006f32e7eSjoerg /// and thereby have no chain. 43106f32e7eSjoerg SWAP_NO_CHAIN, 43206f32e7eSjoerg 43306f32e7eSjoerg /// An SDNode for Power9 vector absolute value difference. 43406f32e7eSjoerg /// operand #0 vector 43506f32e7eSjoerg /// operand #1 vector 43606f32e7eSjoerg /// operand #2 constant i32 0 or 1, to indicate whether needs to patch 43706f32e7eSjoerg /// the most significant bit for signed i32 43806f32e7eSjoerg /// 43906f32e7eSjoerg /// Power9 VABSD* instructions are designed to support unsigned integer 44006f32e7eSjoerg /// vectors (byte/halfword/word), if we want to make use of them for signed 44106f32e7eSjoerg /// integer vectors, we have to flip their sign bits first. To flip sign bit 44206f32e7eSjoerg /// for byte/halfword integer vector would become inefficient, but for word 44306f32e7eSjoerg /// integer vector, we can leverage XVNEGSP to make it efficiently. eg: 44406f32e7eSjoerg /// abs(sub(a,b)) => VABSDUW(a+0x80000000, b+0x80000000) 44506f32e7eSjoerg /// => VABSDUW((XVNEGSP a), (XVNEGSP b)) 44606f32e7eSjoerg VABSD, 44706f32e7eSjoerg 44806f32e7eSjoerg /// FP_EXTEND_HALF(VECTOR, IDX) - Custom extend upper (IDX=0) half or 44906f32e7eSjoerg /// lower (IDX=1) half of v4f32 to v2f64. 
45006f32e7eSjoerg FP_EXTEND_HALF, 45106f32e7eSjoerg 452*da58b97aSjoerg /// MAT_PCREL_ADDR = Materialize a PC Relative address. This can be done 453*da58b97aSjoerg /// either through an add like PADDI or through a PC Relative load like 454*da58b97aSjoerg /// PLD. 455*da58b97aSjoerg MAT_PCREL_ADDR, 456*da58b97aSjoerg 457*da58b97aSjoerg /// TLS_DYNAMIC_MAT_PCREL_ADDR = Materialize a PC Relative address for 458*da58b97aSjoerg /// TLS global address when using dynamic access models. This can be done 459*da58b97aSjoerg /// through an add like PADDI. 460*da58b97aSjoerg TLS_DYNAMIC_MAT_PCREL_ADDR, 461*da58b97aSjoerg 462*da58b97aSjoerg /// TLS_LOCAL_EXEC_MAT_ADDR = Materialize an address for TLS global address 463*da58b97aSjoerg /// when using local exec access models, and when prefixed instructions are 464*da58b97aSjoerg /// available. This is used with ADD_TLS to produce an add like PADDI. 465*da58b97aSjoerg TLS_LOCAL_EXEC_MAT_ADDR, 466*da58b97aSjoerg 467*da58b97aSjoerg /// ACC_BUILD = Build an accumulator register from 4 VSX registers. 468*da58b97aSjoerg ACC_BUILD, 469*da58b97aSjoerg 470*da58b97aSjoerg /// PAIR_BUILD = Build a vector pair register from 2 VSX registers. 471*da58b97aSjoerg PAIR_BUILD, 472*da58b97aSjoerg 473*da58b97aSjoerg /// EXTRACT_VSX_REG = Extract one of the underlying vsx registers of 474*da58b97aSjoerg /// an accumulator or pair register. This node is needed because 475*da58b97aSjoerg /// EXTRACT_SUBVECTOR expects the input and output vectors to have the same 476*da58b97aSjoerg /// element type. 477*da58b97aSjoerg EXTRACT_VSX_REG, 478*da58b97aSjoerg 479*da58b97aSjoerg /// XXMFACC = This corresponds to the xxmfacc instruction. 
480*da58b97aSjoerg XXMFACC, 481*da58b97aSjoerg 482*da58b97aSjoerg // Constrained conversion from floating point to int 483*da58b97aSjoerg STRICT_FCTIDZ = ISD::FIRST_TARGET_STRICTFP_OPCODE, 484*da58b97aSjoerg STRICT_FCTIWZ, 485*da58b97aSjoerg STRICT_FCTIDUZ, 486*da58b97aSjoerg STRICT_FCTIWUZ, 487*da58b97aSjoerg 488*da58b97aSjoerg /// Constrained integer-to-floating-point conversion instructions. 489*da58b97aSjoerg STRICT_FCFID, 490*da58b97aSjoerg STRICT_FCFIDU, 491*da58b97aSjoerg STRICT_FCFIDS, 492*da58b97aSjoerg STRICT_FCFIDUS, 493*da58b97aSjoerg 494*da58b97aSjoerg /// Constrained floating point add in round-to-zero mode. 495*da58b97aSjoerg STRICT_FADDRTZ, 496*da58b97aSjoerg 49706f32e7eSjoerg /// CHAIN = STBRX CHAIN, GPRC, Ptr, Type - This is a 49806f32e7eSjoerg /// byte-swapping store instruction. It byte-swaps the low "Type" bits of 49906f32e7eSjoerg /// the GPRC input, then stores it through Ptr. Type can be either i16 or 50006f32e7eSjoerg /// i32. 50106f32e7eSjoerg STBRX = ISD::FIRST_TARGET_MEMORY_OPCODE, 50206f32e7eSjoerg 50306f32e7eSjoerg /// GPRC, CHAIN = LBRX CHAIN, Ptr, Type - This is a 50406f32e7eSjoerg /// byte-swapping load instruction. It loads "Type" bits, byte swaps it, 50506f32e7eSjoerg /// then puts it in the bottom bits of the GPRC. TYPE can be either i16 50606f32e7eSjoerg /// or i32. 50706f32e7eSjoerg LBRX, 50806f32e7eSjoerg 50906f32e7eSjoerg /// STFIWX - The STFIWX instruction. The first operand is an input token 51006f32e7eSjoerg /// chain, then an f64 value to store, then an address to store it to. 51106f32e7eSjoerg STFIWX, 51206f32e7eSjoerg 51306f32e7eSjoerg /// GPRC, CHAIN = LFIWAX CHAIN, Ptr - This is a floating-point 51406f32e7eSjoerg /// load which sign-extends from a 32-bit integer value into the 51506f32e7eSjoerg /// destination 64-bit register. 
51606f32e7eSjoerg LFIWAX, 51706f32e7eSjoerg 51806f32e7eSjoerg /// GPRC, CHAIN = LFIWZX CHAIN, Ptr - This is a floating-point 51906f32e7eSjoerg /// load which zero-extends from a 32-bit integer value into the 52006f32e7eSjoerg /// destination 64-bit register. 52106f32e7eSjoerg LFIWZX, 52206f32e7eSjoerg 52306f32e7eSjoerg /// GPRC, CHAIN = LXSIZX, CHAIN, Ptr, ByteWidth - This is a load of an 52406f32e7eSjoerg /// integer smaller than 64 bits into a VSR. The integer is zero-extended. 52506f32e7eSjoerg /// This can be used for converting loaded integers to floating point. 52606f32e7eSjoerg LXSIZX, 52706f32e7eSjoerg 52806f32e7eSjoerg /// STXSIX - The STXSI[bh]X instruction. The first operand is an input 52906f32e7eSjoerg /// chain, then an f64 value to store, then an address to store it to, 53006f32e7eSjoerg /// followed by a byte-width for the store. 53106f32e7eSjoerg STXSIX, 53206f32e7eSjoerg 53306f32e7eSjoerg /// VSRC, CHAIN = LXVD2X_LE CHAIN, Ptr - Occurs only for little endian. 53406f32e7eSjoerg /// Maps directly to an lxvd2x instruction that will be followed by 53506f32e7eSjoerg /// an xxswapd. 53606f32e7eSjoerg LXVD2X, 53706f32e7eSjoerg 538*da58b97aSjoerg /// LXVRZX - Load VSX Vector Rightmost and Zero Extend 539*da58b97aSjoerg /// This node represents v1i128 BUILD_VECTOR of a zero extending load 540*da58b97aSjoerg /// instruction from <byte, halfword, word, or doubleword> to i128. 541*da58b97aSjoerg /// Allows utilization of the Load VSX Vector Rightmost Instructions. 542*da58b97aSjoerg LXVRZX, 543*da58b97aSjoerg 54406f32e7eSjoerg /// VSRC, CHAIN = LOAD_VEC_BE CHAIN, Ptr - Occurs only for little endian. 54506f32e7eSjoerg /// Maps directly to one of lxvd2x/lxvw4x/lxvh8x/lxvb16x depending on 54606f32e7eSjoerg /// the vector type to load vector in big-endian element order. 
54706f32e7eSjoerg LOAD_VEC_BE, 54806f32e7eSjoerg 54906f32e7eSjoerg /// VSRC, CHAIN = LD_VSX_LH CHAIN, Ptr - This is a floating-point load of a 55006f32e7eSjoerg /// v2f32 value into the lower half of a VSR register. 55106f32e7eSjoerg LD_VSX_LH, 55206f32e7eSjoerg 55306f32e7eSjoerg /// VSRC, CHAIN = LD_SPLAT, CHAIN, Ptr - a splatting load memory 55406f32e7eSjoerg /// instructions such as LXVDSX, LXVWSX. 55506f32e7eSjoerg LD_SPLAT, 55606f32e7eSjoerg 55706f32e7eSjoerg /// CHAIN = STXVD2X CHAIN, VSRC, Ptr - Occurs only for little endian. 55806f32e7eSjoerg /// Maps directly to an stxvd2x instruction that will be preceded by 55906f32e7eSjoerg /// an xxswapd. 56006f32e7eSjoerg STXVD2X, 56106f32e7eSjoerg 56206f32e7eSjoerg /// CHAIN = STORE_VEC_BE CHAIN, VSRC, Ptr - Occurs only for little endian. 56306f32e7eSjoerg /// Maps directly to one of stxvd2x/stxvw4x/stxvh8x/stxvb16x depending on 56406f32e7eSjoerg /// the vector type to store vector in big-endian element order. 56506f32e7eSjoerg STORE_VEC_BE, 56606f32e7eSjoerg 56706f32e7eSjoerg /// Store scalar integers from VSR. 56806f32e7eSjoerg ST_VSR_SCAL_INT, 56906f32e7eSjoerg 57006f32e7eSjoerg /// ATOMIC_CMP_SWAP - the exact same as the target-independent nodes 57106f32e7eSjoerg /// except they ensure that the compare input is zero-extended for 57206f32e7eSjoerg /// sub-word versions because the atomic loads zero-extend. 573*da58b97aSjoerg ATOMIC_CMP_SWAP_8, 574*da58b97aSjoerg ATOMIC_CMP_SWAP_16, 57506f32e7eSjoerg 57606f32e7eSjoerg /// GPRC = TOC_ENTRY GA, TOC 57706f32e7eSjoerg /// Loads the entry for GA from the TOC, where the TOC base is given by 57806f32e7eSjoerg /// the last operand. 57906f32e7eSjoerg TOC_ENTRY 58006f32e7eSjoerg }; 58106f32e7eSjoerg 58206f32e7eSjoerg } // end namespace PPCISD 58306f32e7eSjoerg 58406f32e7eSjoerg /// Define some predicates that are used for node matching. 
58506f32e7eSjoerg namespace PPC { 58606f32e7eSjoerg 58706f32e7eSjoerg /// isVPKUHUMShuffleMask - Return true if this is the shuffle mask for a 58806f32e7eSjoerg /// VPKUHUM instruction. 58906f32e7eSjoerg bool isVPKUHUMShuffleMask(ShuffleVectorSDNode *N, unsigned ShuffleKind, 59006f32e7eSjoerg SelectionDAG &DAG); 59106f32e7eSjoerg 59206f32e7eSjoerg /// isVPKUWUMShuffleMask - Return true if this is the shuffle mask for a 59306f32e7eSjoerg /// VPKUWUM instruction. 59406f32e7eSjoerg bool isVPKUWUMShuffleMask(ShuffleVectorSDNode *N, unsigned ShuffleKind, 59506f32e7eSjoerg SelectionDAG &DAG); 59606f32e7eSjoerg 59706f32e7eSjoerg /// isVPKUDUMShuffleMask - Return true if this is the shuffle mask for a 59806f32e7eSjoerg /// VPKUDUM instruction. 59906f32e7eSjoerg bool isVPKUDUMShuffleMask(ShuffleVectorSDNode *N, unsigned ShuffleKind, 60006f32e7eSjoerg SelectionDAG &DAG); 60106f32e7eSjoerg 60206f32e7eSjoerg /// isVMRGLShuffleMask - Return true if this is a shuffle mask suitable for 60306f32e7eSjoerg /// a VRGL* instruction with the specified unit size (1,2 or 4 bytes). 60406f32e7eSjoerg bool isVMRGLShuffleMask(ShuffleVectorSDNode *N, unsigned UnitSize, 60506f32e7eSjoerg unsigned ShuffleKind, SelectionDAG &DAG); 60606f32e7eSjoerg 60706f32e7eSjoerg /// isVMRGHShuffleMask - Return true if this is a shuffle mask suitable for 60806f32e7eSjoerg /// a VRGH* instruction with the specified unit size (1,2 or 4 bytes). 
60906f32e7eSjoerg bool isVMRGHShuffleMask(ShuffleVectorSDNode *N, unsigned UnitSize, 61006f32e7eSjoerg unsigned ShuffleKind, SelectionDAG &DAG); 61106f32e7eSjoerg 61206f32e7eSjoerg /// isVMRGEOShuffleMask - Return true if this is a shuffle mask suitable for 61306f32e7eSjoerg /// a VMRGEW or VMRGOW instruction 61406f32e7eSjoerg bool isVMRGEOShuffleMask(ShuffleVectorSDNode *N, bool CheckEven, 61506f32e7eSjoerg unsigned ShuffleKind, SelectionDAG &DAG); 61606f32e7eSjoerg /// isXXSLDWIShuffleMask - Return true if this is a shuffle mask suitable 61706f32e7eSjoerg /// for a XXSLDWI instruction. 61806f32e7eSjoerg bool isXXSLDWIShuffleMask(ShuffleVectorSDNode *N, unsigned &ShiftElts, 61906f32e7eSjoerg bool &Swap, bool IsLE); 62006f32e7eSjoerg 62106f32e7eSjoerg /// isXXBRHShuffleMask - Return true if this is a shuffle mask suitable 62206f32e7eSjoerg /// for a XXBRH instruction. 62306f32e7eSjoerg bool isXXBRHShuffleMask(ShuffleVectorSDNode *N); 62406f32e7eSjoerg 62506f32e7eSjoerg /// isXXBRWShuffleMask - Return true if this is a shuffle mask suitable 62606f32e7eSjoerg /// for a XXBRW instruction. 62706f32e7eSjoerg bool isXXBRWShuffleMask(ShuffleVectorSDNode *N); 62806f32e7eSjoerg 62906f32e7eSjoerg /// isXXBRDShuffleMask - Return true if this is a shuffle mask suitable 63006f32e7eSjoerg /// for a XXBRD instruction. 63106f32e7eSjoerg bool isXXBRDShuffleMask(ShuffleVectorSDNode *N); 63206f32e7eSjoerg 63306f32e7eSjoerg /// isXXBRQShuffleMask - Return true if this is a shuffle mask suitable 63406f32e7eSjoerg /// for a XXBRQ instruction. 63506f32e7eSjoerg bool isXXBRQShuffleMask(ShuffleVectorSDNode *N); 63606f32e7eSjoerg 63706f32e7eSjoerg /// isXXPERMDIShuffleMask - Return true if this is a shuffle mask suitable 63806f32e7eSjoerg /// for a XXPERMDI instruction. 
63906f32e7eSjoerg bool isXXPERMDIShuffleMask(ShuffleVectorSDNode *N, unsigned &ShiftElts, 64006f32e7eSjoerg bool &Swap, bool IsLE); 64106f32e7eSjoerg 64206f32e7eSjoerg /// isVSLDOIShuffleMask - If this is a vsldoi shuffle mask, return the 64306f32e7eSjoerg /// shift amount, otherwise return -1. 64406f32e7eSjoerg int isVSLDOIShuffleMask(SDNode *N, unsigned ShuffleKind, 64506f32e7eSjoerg SelectionDAG &DAG); 64606f32e7eSjoerg 64706f32e7eSjoerg /// isSplatShuffleMask - Return true if the specified VECTOR_SHUFFLE operand 64806f32e7eSjoerg /// specifies a splat of a single element that is suitable for input to 64906f32e7eSjoerg /// VSPLTB/VSPLTH/VSPLTW. 65006f32e7eSjoerg bool isSplatShuffleMask(ShuffleVectorSDNode *N, unsigned EltSize); 65106f32e7eSjoerg 65206f32e7eSjoerg /// isXXINSERTWMask - Return true if this VECTOR_SHUFFLE can be handled by 65306f32e7eSjoerg /// the XXINSERTW instruction introduced in ISA 3.0. This is essentially any 65406f32e7eSjoerg /// shuffle of v4f32/v4i32 vectors that just inserts one element from one 65506f32e7eSjoerg /// vector into the other. This function will also set a couple of 65606f32e7eSjoerg /// output parameters for how much the source vector needs to be shifted and 65706f32e7eSjoerg /// what byte number needs to be specified for the instruction to put the 65806f32e7eSjoerg /// element in the desired location of the target vector. 65906f32e7eSjoerg bool isXXINSERTWMask(ShuffleVectorSDNode *N, unsigned &ShiftElts, 66006f32e7eSjoerg unsigned &InsertAtByte, bool &Swap, bool IsLE); 66106f32e7eSjoerg 66206f32e7eSjoerg /// getSplatIdxForPPCMnemonics - Return the splat index as a value that is 66306f32e7eSjoerg /// appropriate for PPC mnemonics (which have a big endian bias - namely 66406f32e7eSjoerg /// elements are counted from the left of the vector register). 
66506f32e7eSjoerg unsigned getSplatIdxForPPCMnemonics(SDNode *N, unsigned EltSize, 66606f32e7eSjoerg SelectionDAG &DAG); 66706f32e7eSjoerg 66806f32e7eSjoerg /// get_VSPLTI_elt - If this is a build_vector of constants which can be 66906f32e7eSjoerg /// formed by using a vspltis[bhw] instruction of the specified element 67006f32e7eSjoerg /// size, return the constant being splatted. The ByteSize field indicates 67106f32e7eSjoerg /// the number of bytes of each element [124] -> [bhw]. 67206f32e7eSjoerg SDValue get_VSPLTI_elt(SDNode *N, unsigned ByteSize, SelectionDAG &DAG); 67306f32e7eSjoerg 674*da58b97aSjoerg // Flags for computing the optimal addressing mode for loads and stores. 675*da58b97aSjoerg enum MemOpFlags { 676*da58b97aSjoerg MOF_None = 0, 67706f32e7eSjoerg 678*da58b97aSjoerg // Extension mode for integer loads. 679*da58b97aSjoerg MOF_SExt = 1, 680*da58b97aSjoerg MOF_ZExt = 1 << 1, 681*da58b97aSjoerg MOF_NoExt = 1 << 2, 682*da58b97aSjoerg 683*da58b97aSjoerg // Address computation flags. 684*da58b97aSjoerg MOF_NotAddNorCst = 1 << 5, // Not const. or sum of ptr and scalar. 685*da58b97aSjoerg MOF_RPlusSImm16 = 1 << 6, // Reg plus signed 16-bit constant. 686*da58b97aSjoerg MOF_RPlusLo = 1 << 7, // Reg plus signed 16-bit relocation 687*da58b97aSjoerg MOF_RPlusSImm16Mult4 = 1 << 8, // Reg plus 16-bit signed multiple of 4. 688*da58b97aSjoerg MOF_RPlusSImm16Mult16 = 1 << 9, // Reg plus 16-bit signed multiple of 16. 689*da58b97aSjoerg MOF_RPlusSImm34 = 1 << 10, // Reg plus 34-bit signed constant. 690*da58b97aSjoerg MOF_RPlusR = 1 << 11, // Sum of two variables. 691*da58b97aSjoerg MOF_PCRel = 1 << 12, // PC-Relative relocation. 692*da58b97aSjoerg MOF_AddrIsSImm32 = 1 << 13, // A simple 32-bit constant. 693*da58b97aSjoerg 694*da58b97aSjoerg // The in-memory type. 
695*da58b97aSjoerg MOF_SubWordInt = 1 << 15, 696*da58b97aSjoerg MOF_WordInt = 1 << 16, 697*da58b97aSjoerg MOF_DoubleWordInt = 1 << 17, 698*da58b97aSjoerg MOF_ScalarFloat = 1 << 18, // Scalar single or double precision. 699*da58b97aSjoerg MOF_Vector = 1 << 19, // Vector types and quad precision scalars. 700*da58b97aSjoerg MOF_Vector256 = 1 << 20, 701*da58b97aSjoerg 702*da58b97aSjoerg // Subtarget features. 703*da58b97aSjoerg MOF_SubtargetBeforeP9 = 1 << 22, 704*da58b97aSjoerg MOF_SubtargetP9 = 1 << 23, 705*da58b97aSjoerg MOF_SubtargetP10 = 1 << 24, 706*da58b97aSjoerg MOF_SubtargetSPE = 1 << 25 707*da58b97aSjoerg }; 708*da58b97aSjoerg 709*da58b97aSjoerg // The addressing modes for loads and stores. 710*da58b97aSjoerg enum AddrMode { 711*da58b97aSjoerg AM_None, 712*da58b97aSjoerg AM_DForm, 713*da58b97aSjoerg AM_DSForm, 714*da58b97aSjoerg AM_DQForm, 715*da58b97aSjoerg AM_XForm, 716*da58b97aSjoerg }; 71706f32e7eSjoerg } // end namespace PPC 71806f32e7eSjoerg 71906f32e7eSjoerg class PPCTargetLowering : public TargetLowering { 72006f32e7eSjoerg const PPCSubtarget &Subtarget; 72106f32e7eSjoerg 72206f32e7eSjoerg public: 72306f32e7eSjoerg explicit PPCTargetLowering(const PPCTargetMachine &TM, 72406f32e7eSjoerg const PPCSubtarget &STI); 72506f32e7eSjoerg 72606f32e7eSjoerg /// getTargetNodeName() - This method returns the name of a target specific 72706f32e7eSjoerg /// DAG node. 72806f32e7eSjoerg const char *getTargetNodeName(unsigned Opcode) const override; 72906f32e7eSjoerg isSelectSupported(SelectSupportKind Kind)73006f32e7eSjoerg bool isSelectSupported(SelectSupportKind Kind) const override { 73106f32e7eSjoerg // PowerPC does not support scalar condition selects on vectors. 
73206f32e7eSjoerg return (Kind != SelectSupportKind::ScalarCondVectorVal); 73306f32e7eSjoerg } 73406f32e7eSjoerg 73506f32e7eSjoerg /// getPreferredVectorAction - The code we generate when vector types are 73606f32e7eSjoerg /// legalized by promoting the integer element type is often much worse 73706f32e7eSjoerg /// than code we generate if we widen the type for applicable vector types. 73806f32e7eSjoerg /// The issue with promoting is that the vector is scalaraized, individual 73906f32e7eSjoerg /// elements promoted and then the vector is rebuilt. So say we load a pair 74006f32e7eSjoerg /// of v4i8's and shuffle them. This will turn into a mess of 8 extending 74106f32e7eSjoerg /// loads, moves back into VSR's (or memory ops if we don't have moves) and 74206f32e7eSjoerg /// then the VPERM for the shuffle. All in all a very slow sequence. getPreferredVectorAction(MVT VT)74306f32e7eSjoerg TargetLoweringBase::LegalizeTypeAction getPreferredVectorAction(MVT VT) 74406f32e7eSjoerg const override { 745*da58b97aSjoerg if (!VT.isScalableVector() && VT.getVectorNumElements() != 1 && 746*da58b97aSjoerg VT.getScalarSizeInBits() % 8 == 0) 74706f32e7eSjoerg return TypeWidenVector; 74806f32e7eSjoerg return TargetLoweringBase::getPreferredVectorAction(VT); 74906f32e7eSjoerg } 75006f32e7eSjoerg 75106f32e7eSjoerg bool useSoftFloat() const override; 75206f32e7eSjoerg 75306f32e7eSjoerg bool hasSPE() const; 75406f32e7eSjoerg getScalarShiftAmountTy(const DataLayout &,EVT)75506f32e7eSjoerg MVT getScalarShiftAmountTy(const DataLayout &, EVT) const override { 75606f32e7eSjoerg return MVT::i32; 75706f32e7eSjoerg } 75806f32e7eSjoerg isCheapToSpeculateCttz()75906f32e7eSjoerg bool isCheapToSpeculateCttz() const override { 76006f32e7eSjoerg return true; 76106f32e7eSjoerg } 76206f32e7eSjoerg isCheapToSpeculateCtlz()76306f32e7eSjoerg bool isCheapToSpeculateCtlz() const override { 76406f32e7eSjoerg return true; 76506f32e7eSjoerg } 76606f32e7eSjoerg isCtlzFast()76706f32e7eSjoerg bool isCtlzFast() 
const override { 76806f32e7eSjoerg return true; 76906f32e7eSjoerg } 77006f32e7eSjoerg isEqualityCmpFoldedWithSignedCmp()771*da58b97aSjoerg bool isEqualityCmpFoldedWithSignedCmp() const override { 772*da58b97aSjoerg return false; 773*da58b97aSjoerg } 774*da58b97aSjoerg hasAndNotCompare(SDValue)77506f32e7eSjoerg bool hasAndNotCompare(SDValue) const override { 77606f32e7eSjoerg return true; 77706f32e7eSjoerg } 77806f32e7eSjoerg 77906f32e7eSjoerg bool preferIncOfAddToSubOfNot(EVT VT) const override; 78006f32e7eSjoerg convertSetCCLogicToBitwiseLogic(EVT VT)78106f32e7eSjoerg bool convertSetCCLogicToBitwiseLogic(EVT VT) const override { 78206f32e7eSjoerg return VT.isScalarInteger(); 78306f32e7eSjoerg } 78406f32e7eSjoerg 785*da58b97aSjoerg SDValue getNegatedExpression(SDValue Op, SelectionDAG &DAG, bool LegalOps, 786*da58b97aSjoerg bool OptForSize, NegatibleCost &Cost, 787*da58b97aSjoerg unsigned Depth = 0) const override; 78806f32e7eSjoerg 78906f32e7eSjoerg /// getSetCCResultType - Return the ISD::SETCC ValueType 79006f32e7eSjoerg EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Context, 79106f32e7eSjoerg EVT VT) const override; 79206f32e7eSjoerg 793*da58b97aSjoerg /// Return true if target always benefits from combining into FMA for a 79406f32e7eSjoerg /// given value type. This must typically return false on targets where FMA 79506f32e7eSjoerg /// takes more cycles to execute than FADD. 79606f32e7eSjoerg bool enableAggressiveFMAFusion(EVT VT) const override; 79706f32e7eSjoerg 79806f32e7eSjoerg /// getPreIndexedAddressParts - returns true by value, base pointer and 79906f32e7eSjoerg /// offset pointer and addressing mode by reference if the node's address 80006f32e7eSjoerg /// can be legally represented as pre-indexed load / store address. 
80106f32e7eSjoerg bool getPreIndexedAddressParts(SDNode *N, SDValue &Base, 80206f32e7eSjoerg SDValue &Offset, 80306f32e7eSjoerg ISD::MemIndexedMode &AM, 80406f32e7eSjoerg SelectionDAG &DAG) const override; 80506f32e7eSjoerg 80606f32e7eSjoerg /// SelectAddressEVXRegReg - Given the specified addressed, check to see if 80706f32e7eSjoerg /// it can be more efficiently represented as [r+imm]. 80806f32e7eSjoerg bool SelectAddressEVXRegReg(SDValue N, SDValue &Base, SDValue &Index, 80906f32e7eSjoerg SelectionDAG &DAG) const; 81006f32e7eSjoerg 81106f32e7eSjoerg /// SelectAddressRegReg - Given the specified addressed, check to see if it 81206f32e7eSjoerg /// can be more efficiently represented as [r+imm]. If \p EncodingAlignment 81306f32e7eSjoerg /// is non-zero, only accept displacement which is not suitable for [r+imm]. 81406f32e7eSjoerg /// Returns false if it can be represented by [r+imm], which are preferred. 81506f32e7eSjoerg bool SelectAddressRegReg(SDValue N, SDValue &Base, SDValue &Index, 81606f32e7eSjoerg SelectionDAG &DAG, 817*da58b97aSjoerg MaybeAlign EncodingAlignment = None) const; 81806f32e7eSjoerg 81906f32e7eSjoerg /// SelectAddressRegImm - Returns true if the address N can be represented 82006f32e7eSjoerg /// by a base register plus a signed 16-bit displacement [r+imm], and if it 82106f32e7eSjoerg /// is not better represented as reg+reg. If \p EncodingAlignment is 82206f32e7eSjoerg /// non-zero, only accept displacements suitable for instruction encoding 82306f32e7eSjoerg /// requirement, i.e. multiples of 4 for DS form. 
82406f32e7eSjoerg bool SelectAddressRegImm(SDValue N, SDValue &Disp, SDValue &Base, 82506f32e7eSjoerg SelectionDAG &DAG, 826*da58b97aSjoerg MaybeAlign EncodingAlignment) const; 827*da58b97aSjoerg bool SelectAddressRegImm34(SDValue N, SDValue &Disp, SDValue &Base, 828*da58b97aSjoerg SelectionDAG &DAG) const; 82906f32e7eSjoerg 83006f32e7eSjoerg /// SelectAddressRegRegOnly - Given the specified addressed, force it to be 83106f32e7eSjoerg /// represented as an indexed [r+r] operation. 83206f32e7eSjoerg bool SelectAddressRegRegOnly(SDValue N, SDValue &Base, SDValue &Index, 83306f32e7eSjoerg SelectionDAG &DAG) const; 83406f32e7eSjoerg 835*da58b97aSjoerg /// SelectAddressPCRel - Represent the specified address as pc relative to 836*da58b97aSjoerg /// be represented as [pc+imm] 837*da58b97aSjoerg bool SelectAddressPCRel(SDValue N, SDValue &Base) const; 838*da58b97aSjoerg 83906f32e7eSjoerg Sched::Preference getSchedulingPreference(SDNode *N) const override; 84006f32e7eSjoerg 84106f32e7eSjoerg /// LowerOperation - Provide custom lowering hooks for some operations. 84206f32e7eSjoerg /// 84306f32e7eSjoerg SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override; 84406f32e7eSjoerg 84506f32e7eSjoerg /// ReplaceNodeResults - Replace the results of node with an illegal result 84606f32e7eSjoerg /// type with new values built out of custom code. 
84706f32e7eSjoerg /// 84806f32e7eSjoerg void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue>&Results, 84906f32e7eSjoerg SelectionDAG &DAG) const override; 85006f32e7eSjoerg 85106f32e7eSjoerg SDValue expandVSXLoadForLE(SDNode *N, DAGCombinerInfo &DCI) const; 85206f32e7eSjoerg SDValue expandVSXStoreForLE(SDNode *N, DAGCombinerInfo &DCI) const; 85306f32e7eSjoerg 85406f32e7eSjoerg SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override; 85506f32e7eSjoerg 85606f32e7eSjoerg SDValue BuildSDIVPow2(SDNode *N, const APInt &Divisor, SelectionDAG &DAG, 85706f32e7eSjoerg SmallVectorImpl<SDNode *> &Created) const override; 85806f32e7eSjoerg 859*da58b97aSjoerg Register getRegisterByName(const char* RegName, LLT VT, 86006f32e7eSjoerg const MachineFunction &MF) const override; 86106f32e7eSjoerg 86206f32e7eSjoerg void computeKnownBitsForTargetNode(const SDValue Op, 86306f32e7eSjoerg KnownBits &Known, 86406f32e7eSjoerg const APInt &DemandedElts, 86506f32e7eSjoerg const SelectionDAG &DAG, 86606f32e7eSjoerg unsigned Depth = 0) const override; 86706f32e7eSjoerg 86806f32e7eSjoerg Align getPrefLoopAlignment(MachineLoop *ML) const override; 86906f32e7eSjoerg shouldInsertFencesForAtomic(const Instruction * I)87006f32e7eSjoerg bool shouldInsertFencesForAtomic(const Instruction *I) const override { 87106f32e7eSjoerg return true; 87206f32e7eSjoerg } 87306f32e7eSjoerg 87406f32e7eSjoerg Instruction *emitLeadingFence(IRBuilder<> &Builder, Instruction *Inst, 87506f32e7eSjoerg AtomicOrdering Ord) const override; 87606f32e7eSjoerg Instruction *emitTrailingFence(IRBuilder<> &Builder, Instruction *Inst, 87706f32e7eSjoerg AtomicOrdering Ord) const override; 87806f32e7eSjoerg 87906f32e7eSjoerg MachineBasicBlock * 88006f32e7eSjoerg EmitInstrWithCustomInserter(MachineInstr &MI, 88106f32e7eSjoerg MachineBasicBlock *MBB) const override; 88206f32e7eSjoerg MachineBasicBlock *EmitAtomicBinary(MachineInstr &MI, 88306f32e7eSjoerg MachineBasicBlock *MBB, 88406f32e7eSjoerg unsigned 
AtomicSize, 88506f32e7eSjoerg unsigned BinOpcode, 88606f32e7eSjoerg unsigned CmpOpcode = 0, 88706f32e7eSjoerg unsigned CmpPred = 0) const; 88806f32e7eSjoerg MachineBasicBlock *EmitPartwordAtomicBinary(MachineInstr &MI, 88906f32e7eSjoerg MachineBasicBlock *MBB, 89006f32e7eSjoerg bool is8bit, 89106f32e7eSjoerg unsigned Opcode, 89206f32e7eSjoerg unsigned CmpOpcode = 0, 89306f32e7eSjoerg unsigned CmpPred = 0) const; 89406f32e7eSjoerg 89506f32e7eSjoerg MachineBasicBlock *emitEHSjLjSetJmp(MachineInstr &MI, 89606f32e7eSjoerg MachineBasicBlock *MBB) const; 89706f32e7eSjoerg 89806f32e7eSjoerg MachineBasicBlock *emitEHSjLjLongJmp(MachineInstr &MI, 89906f32e7eSjoerg MachineBasicBlock *MBB) const; 90006f32e7eSjoerg 901*da58b97aSjoerg MachineBasicBlock *emitProbedAlloca(MachineInstr &MI, 902*da58b97aSjoerg MachineBasicBlock *MBB) const; 903*da58b97aSjoerg 904*da58b97aSjoerg bool hasInlineStackProbe(MachineFunction &MF) const override; 905*da58b97aSjoerg 906*da58b97aSjoerg unsigned getStackProbeSize(MachineFunction &MF) const; 907*da58b97aSjoerg 90806f32e7eSjoerg ConstraintType getConstraintType(StringRef Constraint) const override; 90906f32e7eSjoerg 91006f32e7eSjoerg /// Examine constraint string and operand type and determine a weight value. 91106f32e7eSjoerg /// The operand object must already have been set up with the operand type. 91206f32e7eSjoerg ConstraintWeight getSingleConstraintMatchWeight( 91306f32e7eSjoerg AsmOperandInfo &info, const char *constraint) const override; 91406f32e7eSjoerg 91506f32e7eSjoerg std::pair<unsigned, const TargetRegisterClass *> 91606f32e7eSjoerg getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI, 91706f32e7eSjoerg StringRef Constraint, MVT VT) const override; 91806f32e7eSjoerg 91906f32e7eSjoerg /// getByValTypeAlignment - Return the desired alignment for ByVal aggregate 92006f32e7eSjoerg /// function arguments in the caller parameter area. This is the actual 92106f32e7eSjoerg /// alignment, not its logarithm. 
92206f32e7eSjoerg unsigned getByValTypeAlignment(Type *Ty, 92306f32e7eSjoerg const DataLayout &DL) const override; 92406f32e7eSjoerg 92506f32e7eSjoerg /// LowerAsmOperandForConstraint - Lower the specified operand into the Ops 92606f32e7eSjoerg /// vector. If it is invalid, don't add anything to Ops. 92706f32e7eSjoerg void LowerAsmOperandForConstraint(SDValue Op, 92806f32e7eSjoerg std::string &Constraint, 92906f32e7eSjoerg std::vector<SDValue> &Ops, 93006f32e7eSjoerg SelectionDAG &DAG) const override; 93106f32e7eSjoerg 93206f32e7eSjoerg unsigned getInlineAsmMemConstraint(StringRef ConstraintCode)93306f32e7eSjoerg getInlineAsmMemConstraint(StringRef ConstraintCode) const override { 93406f32e7eSjoerg if (ConstraintCode == "es") 93506f32e7eSjoerg return InlineAsm::Constraint_es; 93606f32e7eSjoerg else if (ConstraintCode == "Q") 93706f32e7eSjoerg return InlineAsm::Constraint_Q; 93806f32e7eSjoerg else if (ConstraintCode == "Z") 93906f32e7eSjoerg return InlineAsm::Constraint_Z; 94006f32e7eSjoerg else if (ConstraintCode == "Zy") 94106f32e7eSjoerg return InlineAsm::Constraint_Zy; 94206f32e7eSjoerg return TargetLowering::getInlineAsmMemConstraint(ConstraintCode); 94306f32e7eSjoerg } 94406f32e7eSjoerg 94506f32e7eSjoerg /// isLegalAddressingMode - Return true if the addressing mode represented 94606f32e7eSjoerg /// by AM is legal for this target, for a load/store of the specified type. 94706f32e7eSjoerg bool isLegalAddressingMode(const DataLayout &DL, const AddrMode &AM, 94806f32e7eSjoerg Type *Ty, unsigned AS, 94906f32e7eSjoerg Instruction *I = nullptr) const override; 95006f32e7eSjoerg 95106f32e7eSjoerg /// isLegalICmpImmediate - Return true if the specified immediate is legal 95206f32e7eSjoerg /// icmp immediate, that is the target has icmp instructions which can 95306f32e7eSjoerg /// compare a register against the immediate without having to materialize 95406f32e7eSjoerg /// the immediate into a register. 
95506f32e7eSjoerg bool isLegalICmpImmediate(int64_t Imm) const override; 95606f32e7eSjoerg 95706f32e7eSjoerg /// isLegalAddImmediate - Return true if the specified immediate is legal 95806f32e7eSjoerg /// add immediate, that is the target has add instructions which can 95906f32e7eSjoerg /// add a register and the immediate without having to materialize 96006f32e7eSjoerg /// the immediate into a register. 96106f32e7eSjoerg bool isLegalAddImmediate(int64_t Imm) const override; 96206f32e7eSjoerg 96306f32e7eSjoerg /// isTruncateFree - Return true if it's free to truncate a value of 96406f32e7eSjoerg /// type Ty1 to type Ty2. e.g. On PPC it's free to truncate a i64 value in 96506f32e7eSjoerg /// register X1 to i32 by referencing its sub-register R1. 96606f32e7eSjoerg bool isTruncateFree(Type *Ty1, Type *Ty2) const override; 96706f32e7eSjoerg bool isTruncateFree(EVT VT1, EVT VT2) const override; 96806f32e7eSjoerg 96906f32e7eSjoerg bool isZExtFree(SDValue Val, EVT VT2) const override; 97006f32e7eSjoerg 97106f32e7eSjoerg bool isFPExtFree(EVT DestVT, EVT SrcVT) const override; 97206f32e7eSjoerg 97306f32e7eSjoerg /// Returns true if it is beneficial to convert a load of a constant 97406f32e7eSjoerg /// to just the constant itself. 
97506f32e7eSjoerg bool shouldConvertConstantLoadToIntImm(const APInt &Imm, 97606f32e7eSjoerg Type *Ty) const override; 97706f32e7eSjoerg convertSelectOfConstantsToMath(EVT VT)97806f32e7eSjoerg bool convertSelectOfConstantsToMath(EVT VT) const override { 97906f32e7eSjoerg return true; 98006f32e7eSjoerg } 98106f32e7eSjoerg 982*da58b97aSjoerg bool decomposeMulByConstant(LLVMContext &Context, EVT VT, 983*da58b97aSjoerg SDValue C) const override; 984*da58b97aSjoerg isDesirableToTransformToIntegerOp(unsigned Opc,EVT VT)98506f32e7eSjoerg bool isDesirableToTransformToIntegerOp(unsigned Opc, 98606f32e7eSjoerg EVT VT) const override { 98706f32e7eSjoerg // Only handle float load/store pair because float(fpr) load/store 98806f32e7eSjoerg // instruction has more cycles than integer(gpr) load/store in PPC. 98906f32e7eSjoerg if (Opc != ISD::LOAD && Opc != ISD::STORE) 99006f32e7eSjoerg return false; 99106f32e7eSjoerg if (VT != MVT::f32 && VT != MVT::f64) 99206f32e7eSjoerg return false; 99306f32e7eSjoerg 99406f32e7eSjoerg return true; 99506f32e7eSjoerg } 99606f32e7eSjoerg 99706f32e7eSjoerg // Returns true if the address of the global is stored in TOC entry. 99806f32e7eSjoerg bool isAccessedAsGotIndirect(SDValue N) const; 99906f32e7eSjoerg 100006f32e7eSjoerg bool isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const override; 100106f32e7eSjoerg 100206f32e7eSjoerg bool getTgtMemIntrinsic(IntrinsicInfo &Info, 100306f32e7eSjoerg const CallInst &I, 100406f32e7eSjoerg MachineFunction &MF, 100506f32e7eSjoerg unsigned Intrinsic) const override; 100606f32e7eSjoerg 100706f32e7eSjoerg /// It returns EVT::Other if the type should be determined using generic 100806f32e7eSjoerg /// target-independent logic. 
1009*da58b97aSjoerg EVT getOptimalMemOpType(const MemOp &Op, 101006f32e7eSjoerg const AttributeList &FuncAttributes) const override; 101106f32e7eSjoerg 101206f32e7eSjoerg /// Is unaligned memory access allowed for the given type, and is it fast 101306f32e7eSjoerg /// relative to software emulation. 101406f32e7eSjoerg bool allowsMisalignedMemoryAccesses( 1015*da58b97aSjoerg EVT VT, unsigned AddrSpace, Align Alignment = Align(1), 101606f32e7eSjoerg MachineMemOperand::Flags Flags = MachineMemOperand::MONone, 101706f32e7eSjoerg bool *Fast = nullptr) const override; 101806f32e7eSjoerg 101906f32e7eSjoerg /// isFMAFasterThanFMulAndFAdd - Return true if an FMA operation is faster 102006f32e7eSjoerg /// than a pair of fmul and fadd instructions. fmuladd intrinsics will be 102106f32e7eSjoerg /// expanded to FMAs when this method returns true, otherwise fmuladd is 102206f32e7eSjoerg /// expanded to fmul + fadd. 1023*da58b97aSjoerg bool isFMAFasterThanFMulAndFAdd(const MachineFunction &MF, 1024*da58b97aSjoerg EVT VT) const override; 1025*da58b97aSjoerg 1026*da58b97aSjoerg bool isFMAFasterThanFMulAndFAdd(const Function &F, Type *Ty) const override; 1027*da58b97aSjoerg 1028*da58b97aSjoerg /// isProfitableToHoist - Check if it is profitable to hoist instruction 1029*da58b97aSjoerg /// \p I to its dominator block. 1030*da58b97aSjoerg /// For example, it is not profitable if \p I and it's only user can form a 1031*da58b97aSjoerg /// FMA instruction, because Powerpc prefers FMADD. 1032*da58b97aSjoerg bool isProfitableToHoist(Instruction *I) const override; 103306f32e7eSjoerg 103406f32e7eSjoerg const MCPhysReg *getScratchRegisters(CallingConv::ID CC) const override; 103506f32e7eSjoerg 103606f32e7eSjoerg // Should we expand the build vector with shuffles? 
103706f32e7eSjoerg bool 103806f32e7eSjoerg shouldExpandBuildVectorWithShuffles(EVT VT, 103906f32e7eSjoerg unsigned DefinedValues) const override; 104006f32e7eSjoerg 1041*da58b97aSjoerg // Keep the zero-extensions for arguments to libcalls. shouldKeepZExtForFP16Conv()1042*da58b97aSjoerg bool shouldKeepZExtForFP16Conv() const override { return true; } 1043*da58b97aSjoerg 104406f32e7eSjoerg /// createFastISel - This method returns a target-specific FastISel object, 104506f32e7eSjoerg /// or null if the target does not support "fast" instruction selection. 104606f32e7eSjoerg FastISel *createFastISel(FunctionLoweringInfo &FuncInfo, 104706f32e7eSjoerg const TargetLibraryInfo *LibInfo) const override; 104806f32e7eSjoerg 104906f32e7eSjoerg /// Returns true if an argument of type Ty needs to be passed in a 105006f32e7eSjoerg /// contiguous block of registers in calling convention CallConv. functionArgumentNeedsConsecutiveRegisters(Type * Ty,CallingConv::ID CallConv,bool isVarArg)105106f32e7eSjoerg bool functionArgumentNeedsConsecutiveRegisters( 105206f32e7eSjoerg Type *Ty, CallingConv::ID CallConv, bool isVarArg) const override { 105306f32e7eSjoerg // We support any array type as "consecutive" block in the parameter 105406f32e7eSjoerg // save area. The element type defines the alignment requirement and 105506f32e7eSjoerg // whether the argument should go in GPRs, FPRs, or VRs if available. 105606f32e7eSjoerg // 105706f32e7eSjoerg // Note that clang uses this capability both to implement the ELFv2 105806f32e7eSjoerg // homogeneous float/vector aggregate ABI, and to avoid having to use 105906f32e7eSjoerg // "byval" when passing aggregates that might fully fit in registers. 106006f32e7eSjoerg return Ty->isArrayTy(); 106106f32e7eSjoerg } 106206f32e7eSjoerg 106306f32e7eSjoerg /// If a physical register, this returns the register that receives the 106406f32e7eSjoerg /// exception address on entry to an EH pad. 
1065*da58b97aSjoerg Register 106606f32e7eSjoerg getExceptionPointerRegister(const Constant *PersonalityFn) const override; 106706f32e7eSjoerg 106806f32e7eSjoerg /// If a physical register, this returns the register that receives the 106906f32e7eSjoerg /// exception typeid on entry to a landing pad. 1070*da58b97aSjoerg Register 107106f32e7eSjoerg getExceptionSelectorRegister(const Constant *PersonalityFn) const override; 107206f32e7eSjoerg 107306f32e7eSjoerg /// Override to support customized stack guard loading. 107406f32e7eSjoerg bool useLoadStackGuardNode() const override; 107506f32e7eSjoerg void insertSSPDeclarations(Module &M) const override; 107606f32e7eSjoerg 107706f32e7eSjoerg bool isFPImmLegal(const APFloat &Imm, EVT VT, 107806f32e7eSjoerg bool ForCodeSize) const override; 107906f32e7eSjoerg 108006f32e7eSjoerg unsigned getJumpTableEncoding() const override; 108106f32e7eSjoerg bool isJumpTableRelative() const override; 108206f32e7eSjoerg SDValue getPICJumpTableRelocBase(SDValue Table, 108306f32e7eSjoerg SelectionDAG &DAG) const override; 108406f32e7eSjoerg const MCExpr *getPICJumpTableRelocBaseExpr(const MachineFunction *MF, 108506f32e7eSjoerg unsigned JTI, 108606f32e7eSjoerg MCContext &Ctx) const override; 108706f32e7eSjoerg 1088*da58b97aSjoerg /// SelectOptimalAddrMode - Based on a node N and it's Parent (a MemSDNode), 1089*da58b97aSjoerg /// compute the address flags of the node, get the optimal address mode 1090*da58b97aSjoerg /// based on the flags, and set the Base and Disp based on the address mode. 1091*da58b97aSjoerg PPC::AddrMode SelectOptimalAddrMode(const SDNode *Parent, SDValue N, 1092*da58b97aSjoerg SDValue &Disp, SDValue &Base, 1093*da58b97aSjoerg SelectionDAG &DAG, 1094*da58b97aSjoerg MaybeAlign Align) const; 1095*da58b97aSjoerg /// SelectForceXFormMode - Given the specified address, force it to be 1096*da58b97aSjoerg /// represented as an indexed [r+r] operation (an XForm instruction). 
1097*da58b97aSjoerg PPC::AddrMode SelectForceXFormMode(SDValue N, SDValue &Disp, SDValue &Base, 1098*da58b97aSjoerg SelectionDAG &DAG) const; 1099*da58b97aSjoerg 1100*da58b97aSjoerg /// Structure that collects some common arguments that get passed around 1101*da58b97aSjoerg /// between the functions for call lowering. 1102*da58b97aSjoerg struct CallFlags { 1103*da58b97aSjoerg const CallingConv::ID CallConv; 1104*da58b97aSjoerg const bool IsTailCall : 1; 1105*da58b97aSjoerg const bool IsVarArg : 1; 1106*da58b97aSjoerg const bool IsPatchPoint : 1; 1107*da58b97aSjoerg const bool IsIndirect : 1; 1108*da58b97aSjoerg const bool HasNest : 1; 1109*da58b97aSjoerg const bool NoMerge : 1; 1110*da58b97aSjoerg CallFlagsCallFlags1111*da58b97aSjoerg CallFlags(CallingConv::ID CC, bool IsTailCall, bool IsVarArg, 1112*da58b97aSjoerg bool IsPatchPoint, bool IsIndirect, bool HasNest, bool NoMerge) 1113*da58b97aSjoerg : CallConv(CC), IsTailCall(IsTailCall), IsVarArg(IsVarArg), 1114*da58b97aSjoerg IsPatchPoint(IsPatchPoint), IsIndirect(IsIndirect), 1115*da58b97aSjoerg HasNest(HasNest), NoMerge(NoMerge) {} 1116*da58b97aSjoerg }; 1117*da58b97aSjoerg 111806f32e7eSjoerg private: 111906f32e7eSjoerg struct ReuseLoadInfo { 112006f32e7eSjoerg SDValue Ptr; 112106f32e7eSjoerg SDValue Chain; 112206f32e7eSjoerg SDValue ResChain; 112306f32e7eSjoerg MachinePointerInfo MPI; 112406f32e7eSjoerg bool IsDereferenceable = false; 112506f32e7eSjoerg bool IsInvariant = false; 1126*da58b97aSjoerg Align Alignment; 112706f32e7eSjoerg AAMDNodes AAInfo; 112806f32e7eSjoerg const MDNode *Ranges = nullptr; 112906f32e7eSjoerg 113006f32e7eSjoerg ReuseLoadInfo() = default; 113106f32e7eSjoerg MMOFlagsReuseLoadInfo113206f32e7eSjoerg MachineMemOperand::Flags MMOFlags() const { 113306f32e7eSjoerg MachineMemOperand::Flags F = MachineMemOperand::MONone; 113406f32e7eSjoerg if (IsDereferenceable) 113506f32e7eSjoerg F |= MachineMemOperand::MODereferenceable; 113606f32e7eSjoerg if (IsInvariant) 113706f32e7eSjoerg F |= 
          MachineMemOperand::MOInvariant;
      return F;
    }
  };

  // Map that relates a set of common address flags to PPC addressing modes.
  std::map<PPC::AddrMode, SmallVector<unsigned, 16>> AddrModesMap;
  /// Populate AddrModesMap with, for each PPC addressing mode, the set of
  /// address-flag combinations it can match.
  void initializeAddrModeMap();

  /// canReuseLoadAddress - Return true if the address of load \p Op can be
  /// reused for a MemVT-typed access with extension kind \p ET; on success
  /// the reusable address is described in \p RLI.
  bool canReuseLoadAddress(SDValue Op, EVT MemVT, ReuseLoadInfo &RLI,
                           SelectionDAG &DAG,
                           ISD::LoadExtType ET = ISD::NON_EXTLOAD) const;
  /// spliceIntoChain - Splice NewResChain into the token-chain graph headed
  /// by ResChain so that existing chain users stay correctly ordered.
  void spliceIntoChain(SDValue ResChain, SDValue NewResChain,
                       SelectionDAG &DAG) const;

  // FP-to-int conversion lowering. The "ForReuse" form records the result in
  // RLI (pairs with canReuseLoadAddress above); the "DirectMove" form
  // presumably uses direct GPR<->FPR/VSR moves instead of a memory round
  // trip — confirm against the .cpp implementation.
  void LowerFP_TO_INTForReuse(SDValue Op, ReuseLoadInfo &RLI,
                              SelectionDAG &DAG, const SDLoc &dl) const;
  SDValue LowerFP_TO_INTDirectMove(SDValue Op, SelectionDAG &DAG,
                                   const SDLoc &dl) const;

  /// directMoveIsProfitable - Heuristic: is a direct register move preferable
  /// to the alternative lowering for this operand?
  bool directMoveIsProfitable(const SDValue &Op) const;
  SDValue LowerINT_TO_FPDirectMove(SDValue Op, SelectionDAG &DAG,
                                   const SDLoc &dl) const;

  SDValue LowerINT_TO_FPVector(SDValue Op, SelectionDAG &DAG,
                               const SDLoc &dl) const;

  SDValue LowerTRUNCATEVector(SDValue Op, SelectionDAG &DAG) const;

  // Frame indices through which the frame pointer / return address are
  // accessed.
  SDValue getFramePointerFrameIndex(SelectionDAG & DAG) const;
  SDValue getReturnAddrFrameIndex(SelectionDAG & DAG) const;

  /// IsEligibleForTailCallOptimization - Check whether a call described by
  /// its callee, calling convention and incoming arguments may be lowered as
  /// a tail call.
  bool
  IsEligibleForTailCallOptimization(SDValue Callee,
                                    CallingConv::ID CalleeCC,
                                    bool isVarArg,
                                    const SmallVectorImpl<ISD::InputArg> &Ins,
                                    SelectionDAG& DAG) const;

  /// Variant of the above for the 64-bit SVR4 (ELF) ABI; also inspects the
  /// outgoing arguments and the originating call site.
  bool IsEligibleForTailCallOptimization_64SVR4(
      SDValue Callee, CallingConv::ID CalleeCC, const CallBase *CB,
      bool isVarArg, const SmallVectorImpl<ISD::OutputArg> &Outs,
      const SmallVectorImpl<ISD::InputArg> &Ins, SelectionDAG &DAG) const;

  /// Load the return address (LROpOut) and frame pointer (FPOpOut) in
  /// preparation for a tail call; SPDiff is the stack-pointer adjustment.
  SDValue EmitTailCallLoadFPAndRetAddr(SelectionDAG &DAG, int SPDiff,
                                       SDValue Chain, SDValue &LROpOut,
                                       SDValue &FPOpOut,
                                       const SDLoc &dl) const;

  /// Build a TOC entry access for global address GA.
  SDValue getTOCEntry(SelectionDAG &DAG, const SDLoc &dl, SDValue GA) const;

  // Custom lowering routines, one per operation kind; each lowers the node
  // rooted at Op into target-specific DAG nodes.
  SDValue LowerRETURNADDR(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFRAMEADDR(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerConstantPool(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerBlockAddress(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerGlobalTLSAddressAIX(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerGlobalTLSAddressLinux(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerGlobalAddress(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerJumpTable(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerSETCC(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerINIT_TRAMPOLINE(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerADJUST_TRAMPOLINE(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerINLINEASM(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerVASTART(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerVAARG(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerVACOPY(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerSTACKRESTORE(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerGET_DYNAMIC_AREA_OFFSET(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerEH_DWARF_CFA(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerLOAD(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerSTORE(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerTRUNCATE(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerSELECT_CC(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG,
                         const SDLoc &dl) const;
  SDValue LowerINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFLT_ROUNDS_(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerSHL_PARTS(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerSRL_PARTS(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerSRA_PARTS(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFunnelShift(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerVECTOR_SHUFFLE(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerINTRINSIC_VOID(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerBSWAP(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerATOMIC_CMP_SWAP(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerSCALAR_TO_VECTOR(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerMUL(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFP_EXTEND(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerFP_ROUND(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerROTL(SDValue Op, SelectionDAG &DAG) const;

  SDValue LowerVectorLoad(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerVectorStore(SDValue Op, SelectionDAG &DAG) const;

  /// LowerCallResult - Copy the result values of a call, described by Ins,
  /// out into InVals.
  SDValue LowerCallResult(SDValue Chain, SDValue InFlag,
                          CallingConv::ID CallConv, bool isVarArg,
                          const SmallVectorImpl<ISD::InputArg> &Ins,
                          const SDLoc &dl, SelectionDAG &DAG,
                          SmallVectorImpl<SDValue> &InVals) const;

  /// FinishCall - Complete the lowering of a call: Callee, SPDiff and
  /// NumBytes describe the callee and call frame, RegsToPass the physical
  /// argument registers; results are returned via InVals.
  SDValue FinishCall(CallFlags CFlags, const SDLoc &dl, SelectionDAG &DAG,
                     SmallVector<std::pair<unsigned, SDValue>, 8> &RegsToPass,
                     SDValue InFlag, SDValue Chain, SDValue CallSeqStart,
                     SDValue &Callee, int SPDiff, unsigned NumBytes,
                     const SmallVectorImpl<ISD::InputArg> &Ins,
                     SmallVectorImpl<SDValue> &InVals,
                     const CallBase *CB) const;

  // TargetLowering overrides for formal arguments, calls and returns.
  SDValue
  LowerFormalArguments(SDValue Chain, CallingConv::ID CallConv, bool isVarArg,
                       const SmallVectorImpl<ISD::InputArg> &Ins,
                       const SDLoc &dl, SelectionDAG &DAG,
                       SmallVectorImpl<SDValue> &InVals) const override;

  SDValue LowerCall(TargetLowering::CallLoweringInfo &CLI,
                    SmallVectorImpl<SDValue> &InVals) const override;

  bool CanLowerReturn(CallingConv::ID CallConv, MachineFunction &MF,
                      bool isVarArg,
                      const SmallVectorImpl<ISD::OutputArg> &Outs,
                      LLVMContext &Context) const override;
  // TargetLowering override: lower the outgoing return values Outs/OutVals.
  SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool isVarArg,
                      const SmallVectorImpl<ISD::OutputArg> &Outs,
                      const SmallVectorImpl<SDValue> &OutVals,
                      const SDLoc &dl, SelectionDAG &DAG) const override;

  /// Extend argument value ArgVal of type ObjectVT for the 64-bit ABI,
  /// honouring the sign/zero-extension attributes carried in Flags.
  SDValue extendArgForPPC64(ISD::ArgFlagsTy Flags, EVT ObjectVT,
                            SelectionDAG &DAG, SDValue ArgVal,
                            const SDLoc &dl) const;

  // ABI-specific implementations backing LowerFormalArguments
  // (AIX, 64-bit SVR4/ELF, 32-bit SVR4).
  SDValue LowerFormalArguments_AIX(
      SDValue Chain, CallingConv::ID CallConv, bool isVarArg,
      const SmallVectorImpl<ISD::InputArg> &Ins, const SDLoc &dl,
      SelectionDAG &DAG, SmallVectorImpl<SDValue> &InVals) const;
  SDValue LowerFormalArguments_64SVR4(
      SDValue Chain, CallingConv::ID CallConv, bool isVarArg,
      const SmallVectorImpl<ISD::InputArg> &Ins, const SDLoc &dl,
      SelectionDAG &DAG, SmallVectorImpl<SDValue> &InVals) const;
  SDValue LowerFormalArguments_32SVR4(
      SDValue Chain, CallingConv::ID CallConv, bool isVarArg,
      const SmallVectorImpl<ISD::InputArg> &Ins, const SDLoc &dl,
      SelectionDAG &DAG, SmallVectorImpl<SDValue> &InVals) const;

  /// Emit a memcpy for argument Arg to stack offset PtrOff, chained outside
  /// of the call sequence headed by CallSeqStart.
  SDValue createMemcpyOutsideCallSeq(SDValue Arg, SDValue PtrOff,
                                     SDValue CallSeqStart,
                                     ISD::ArgFlagsTy Flags, SelectionDAG &DAG,
                                     const SDLoc &dl) const;

  // ABI-specific implementations backing LowerCall
  // (64-bit SVR4/ELF, 32-bit SVR4, AIX).
  SDValue LowerCall_64SVR4(SDValue Chain, SDValue Callee, CallFlags CFlags,
                           const SmallVectorImpl<ISD::OutputArg> &Outs,
                           const SmallVectorImpl<SDValue> &OutVals,
                           const SmallVectorImpl<ISD::InputArg> &Ins,
                           const SDLoc &dl, SelectionDAG &DAG,
                           SmallVectorImpl<SDValue> &InVals,
                           const CallBase *CB) const;
  SDValue LowerCall_32SVR4(SDValue Chain, SDValue Callee, CallFlags CFlags,
                           const SmallVectorImpl<ISD::OutputArg> &Outs,
                           const SmallVectorImpl<SDValue> &OutVals,
                           const SmallVectorImpl<ISD::InputArg> &Ins,
                           const SDLoc &dl, SelectionDAG &DAG,
                           SmallVectorImpl<SDValue> &InVals,
                           const CallBase *CB) const;
  SDValue LowerCall_AIX(SDValue Chain, SDValue Callee, CallFlags CFlags,
                        const SmallVectorImpl<ISD::OutputArg> &Outs,
                        const SmallVectorImpl<SDValue> &OutVals,
                        const SmallVectorImpl<ISD::InputArg> &Ins,
                        const SDLoc &dl, SelectionDAG &DAG,
                        SmallVectorImpl<SDValue> &InVals,
                        const CallBase *CB) const;

  // Exception-handling setjmp/longjmp and bitcast lowering.
  SDValue lowerEH_SJLJ_SETJMP(SDValue Op, SelectionDAG &DAG) const;
  SDValue lowerEH_SJLJ_LONGJMP(SDValue Op, SelectionDAG &DAG) const;
  SDValue LowerBITCAST(SDValue Op, SelectionDAG &DAG) const;

  // Target-specific DAG-combine helpers, one per node kind of interest.
  SDValue DAGCombineExtBoolTrunc(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue DAGCombineBuildVector(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue DAGCombineTruncBoolExt(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue combineStoreFPToInt(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue combineFPToIntToFP(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue combineSHL(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue combineSRA(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue combineSRL(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue combineMUL(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue combineADD(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue combineFMALike(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue combineTRUNCATE(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue combineSetCC(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue combineABS(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue combineVSelect(SDNode *N, DAGCombinerInfo &DCI) const;
  SDValue combineVectorShuffle(ShuffleVectorSDNode *SVN,
                               SelectionDAG &DAG) const;
  // Combine a vector-reverse shuffle with the adjacent load/store LSBase.
  SDValue combineVReverseMemOP(ShuffleVectorSDNode *SVN, LSBaseSDNode *LSBase,
                               DAGCombinerInfo &DCI) const;

  /// ConvertSETCCToSubtract - looks at SETCC that compares ints. It replaces
  /// SETCC with integer subtraction when (1) there is a legal way of doing it
  /// (2) keeping the result of comparison in GPR has performance benefit.
  SDValue ConvertSETCCToSubtract(SDNode *N, DAGCombinerInfo &DCI) const;

  // TargetLowering overrides controlling sqrt/reciprocal estimate codegen
  // (estimate value, refinement steps, denormal-input handling).
  SDValue getSqrtEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled,
                          int &RefinementSteps, bool &UseOneConstNR,
                          bool Reciprocal) const override;
  SDValue getRecipEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled,
                           int &RefinementSteps) const override;
  SDValue getSqrtInputTest(SDValue Operand, SelectionDAG &DAG,
                           const DenormalMode &Mode) const override;
  SDValue getSqrtResultForDenormInput(SDValue Operand,
                                      SelectionDAG &DAG) const override;
  unsigned combineRepeatedFPDivisors() const override;

  SDValue
  combineElementTruncationToVectorTruncation(SDNode *N,
                                             DAGCombinerInfo &DCI) const;

  /// lowerToVINSERTH - Return the SDValue if this VECTOR_SHUFFLE can be
  /// handled by the VINSERTH instruction introduced in ISA 3.0. This is
  /// essentially any shuffle of v8i16 vectors that just inserts one element
  /// from one vector into the other.
  SDValue lowerToVINSERTH(ShuffleVectorSDNode *N, SelectionDAG &DAG) const;

  /// lowerToVINSERTB - Return the SDValue if this VECTOR_SHUFFLE can be
  /// handled by the VINSERTB instruction introduced in ISA 3.0. This is
  /// essentially v16i8 vector version of VINSERTH.
  SDValue lowerToVINSERTB(ShuffleVectorSDNode *N, SelectionDAG &DAG) const;

  /// lowerToXXSPLTI32DX - Return the SDValue if this VECTOR_SHUFFLE can be
  /// handled by the XXSPLTI32DX instruction introduced in ISA 3.1.
  SDValue lowerToXXSPLTI32DX(ShuffleVectorSDNode *N, SelectionDAG &DAG) const;

  // Return whether the call instruction can potentially be optimized to a
  // tail call. This will cause the optimizers to attempt to move, or
  // duplicate return instructions to help enable tail call optimizations.
  bool mayBeEmittedAsTailCall(const CallInst *CI) const override;
  bool hasBitPreservingFPLogic(EVT VT) const override;
  bool isMaskAndCmp0FoldingBeneficial(const Instruction &AndI) const override;

  /// getAddrModeForFlags - Based on the set of address flags, select the most
  /// optimal instruction format to match by.
  PPC::AddrMode getAddrModeForFlags(unsigned Flags) const;

  /// computeMOFlags - Given a node N and its Parent (a MemSDNode), compute
  /// the address flags of the load/store instruction that is to be matched.
  /// The address flags are stored in a map (AddrModesMap above), which is
  /// then searched through to determine the optimal load/store instruction
  /// format.
  unsigned computeMOFlags(const SDNode *Parent, SDValue N,
                          SelectionDAG &DAG) const;
}; // end class PPCTargetLowering

namespace PPC {

// Factory for the PPC FastISel instruction selector.
FastISel *createFastISel(FunctionLoweringInfo &FuncInfo,
                         const TargetLibraryInfo *LibInfo);

} // end namespace PPC

// Return true (setting Imm) if N/Op is a constant that fits in a signed
// 16-bit (resp. 34-bit) immediate field.
bool isIntS16Immediate(SDNode *N, int16_t &Imm);
bool isIntS16Immediate(SDValue Op, int16_t &Imm);
bool isIntS34Immediate(SDNode *N, int64_t &Imm);
bool isIntS34Immediate(SDValue Op, int64_t &Imm);

// Helpers dealing with values representable as a non-denormal
// single-precision float. NOTE(review): exact check/convert semantics are
// defined in the implementation file — confirm before relying on them.
bool convertToNonDenormSingle(APInt &ArgAPInt);
bool convertToNonDenormSingle(APFloat &ArgAPFloat);
bool checkConvertToNonDenormSingle(APFloat &ArgAPFloat);

} // end namespace llvm

#endif // LLVM_LIB_TARGET_POWERPC_PPCISELLOWERING_H