21#define GET_SDNODE_DESC
22#include "X86GenSDNodeInfo.inc"
26#define DEBUG_TYPE "x86-selectiondag-info"
30 cl::desc(
"Use fast short rep mov in memcpy lowering"));
36#define NODE_NAME_CASE(NODE) \
38 return "X86ISD::" #NODE;
70 switch (
N->getOpcode()) {
73 case X86ISD::VP2INTERSECT:
75 case X86ISD::FSETCCM_SAE:
77 case X86ISD::CVTTP2SI_SAE:
78 case X86ISD::CVTTP2UI_SAE:
79 case X86ISD::CVTTP2IBS_SAE:
81 case X86ISD::CMPMM_SAE:
84 case X86ISD::NT_BRIND:
86 case X86ISD::INSERTQI:
89 case X86ISD::CMPCCXADD:
110 return Subtarget.is64Bit() ? MVT::i64 : MVT::i32;
114bool X86SelectionDAGInfo::isBaseRegConflictPossible(
125 const X86RegisterInfo *
TRI =
static_cast<const X86RegisterInfo *
>(
135 unsigned AX = X86::AL;
151 const unsigned CX = Use64BitRegs ? X86::RCX : X86::ECX;
152 const unsigned DI = Use64BitRegs ? X86::RDI : X86::EDI;
164 return DAG.
getNode(X86ISD::REP_STOS, dl, Tys,
Ops);
171 return emitRepstos(Subtarget, DAG, dl, Chain, Dst, Val,
184 bool isVolatile,
bool AlwaysInline,
192 if ((
Size & 31) == 0 && (ValC->getZExtValue() & 255) == 0) {
193 MVT BlockType = MVT::i32;
194 const uint64_t BlockBits = BlockType.getSizeInBits();
195 const uint64_t BlockBytes = BlockBits / 8;
200 return emitRepstos(Subtarget, DAG, dl, Chain, Dst, Val,
213 if (Alignment <
Align(4))
216 MVT BlockType = MVT::i8;
224 const uint64_t BlockBits = BlockType.getSizeInBits();
235 const uint64_t BlockBytes = BlockBits / 8;
236 BlockCount =
Size / BlockBytes;
237 BytesLeft =
Size % BlockBytes;
252 EVT AddrVT = Dst.getValueType();
258 OriginalVal, DAG.
getConstant(BytesLeft, dl, SizeVT),
259 Alignment, isVolatile, AlwaysInline,
274 const MCPhysReg ClobberSet[] = {X86::RCX, X86::RAX, X86::RDI,
275 X86::ECX, X86::EAX, X86::EDI};
276 if (isBaseRegConflictPossible(DAG, ClobberSet))
286 DAG, Subtarget, dl, Chain, Dst, Val, ConstantSize->
getZExtValue(),
287 Size.getValueType(), Alignment, isVolatile, AlwaysInline, DstPtrInfo);
295 const unsigned CX = Use64BitRegs ? X86::RCX : X86::ECX;
296 const unsigned DI = Use64BitRegs ? X86::RDI : X86::EDI;
297 const unsigned SI = Use64BitRegs ? X86::RSI : X86::ESI;
309 return DAG.
getNode(X86ISD::REP_MOVS, dl, Tys,
Ops);
316 return emitRepmovs(Subtarget, DAG, dl, Chain, Dst, Src,
327 Align Alignment,
bool isVolatile,
bool AlwaysInline,
340 if (Subtarget.hasERMSB())
343 assert(!Subtarget.hasERMSB() &&
"No efficient RepMovs");
346 if (!AlwaysInline && (Alignment <
Align(4)))
350 const uint64_t BlockBytes = BlockType.getSizeInBits() / 8;
361 assert(BytesLeft &&
"We have leftover at this point");
367 EVT DstVT = Dst.getValueType();
368 EVT SrcVT = Src.getValueType();
373 DAG.
getConstant(BytesLeft, dl, SizeVT), Alignment, isVolatile,
374 true,
nullptr, std::nullopt,
389 const MCPhysReg ClobberSet[] = {X86::RCX, X86::RSI, X86::RDI,
390 X86::ECX, X86::ESI, X86::EDI};
391 if (isBaseRegConflictPossible(DAG, ClobberSet))
399 return emitRepmovs(Subtarget, DAG, dl, Chain, Dst, Src,
Size, MVT::i8);
404 ConstantSize->getZExtValue(),
405 Size.getValueType(), Alignment, isVolatile,
406 AlwaysInline, DstPtrInfo, SrcPtrInfo);
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
#define NODE_NAME_CASE(node)
Function Alias Analysis Results
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
Register const TargetRegisterInfo * TRI
This file describes how to lower LLVM code to machine code.
static SDValue emitRepstos(const X86Subtarget &Subtarget, SelectionDAG &DAG, const SDLoc &dl, SDValue Chain, SDValue Dst, SDValue Val, SDValue Size, MVT AVT)
Emit a single REP STOSB instruction for a particular constant size.
static SDValue emitRepmovsB(const X86Subtarget &Subtarget, SelectionDAG &DAG, const SDLoc &dl, SDValue Chain, SDValue Dst, SDValue Src, uint64_t Size)
Emit a single REP MOVSB instruction for a particular constant size.
static SDValue emitRepstosB(const X86Subtarget &Subtarget, SelectionDAG &DAG, const SDLoc &dl, SDValue Chain, SDValue Dst, SDValue Val, uint64_t Size)
Emit a single REP STOSB instruction for a particular constant size.
static SDValue emitConstantSizeRepmov(SelectionDAG &DAG, const X86Subtarget &Subtarget, const SDLoc &dl, SDValue Chain, SDValue Dst, SDValue Src, uint64_t Size, EVT SizeVT, Align Alignment, bool isVolatile, bool AlwaysInline, MachinePointerInfo DstPtrInfo, MachinePointerInfo SrcPtrInfo)
Returns a REP MOVS instruction, possibly with a few load/stores to implement a constant size memory c...
static MVT getOptimalRepType(const X86Subtarget &Subtarget, Align Alignment)
Returns the best type to use with repmovs/repstos depending on alignment.
static cl::opt< bool > UseFSRMForMemcpy("x86-use-fsrm-for-memcpy", cl::Hidden, cl::init(false), cl::desc("Use fast short rep mov in memcpy lowering"))
static SDValue emitConstantSizeRepstos(SelectionDAG &DAG, const X86Subtarget &Subtarget, const SDLoc &dl, SDValue Chain, SDValue Dst, SDValue Val, uint64_t Size, EVT SizeVT, Align Alignment, bool isVolatile, bool AlwaysInline, MachinePointerInfo DstPtrInfo)
Returns a REP STOS instruction, possibly with a few load/stores to implement a constant size memory s...
static SDValue emitRepmovs(const X86Subtarget &Subtarget, SelectionDAG &DAG, const SDLoc &dl, SDValue Chain, SDValue Dst, SDValue Src, SDValue Size, MVT AVT)
Emit a single REP MOVS{B,W,D,Q} instruction.
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
uint64_t getZExtValue() const
bool hasMinSize() const
Optimize this function for minimum size (-Oz).
TypeSize getSizeInBits() const
Returns the size of the specified MVT in bits.
bool hasVarSizedObjects() const
This method may be called any time after instruction selection is complete to determine if the stack ...
bool hasOpaqueSPAdjustment() const
Returns true if the function contains opaque dynamic stack adjustments.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
Function & getFunction()
Return the LLVM function that this machine code represents.
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Represents one node in the SelectionDAG.
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
SDValue getValue(unsigned R) const
const char * getTargetNodeName(unsigned Opcode) const override
Returns the name of the given target-specific opcode, suitable for debug printing.
SelectionDAGGenTargetInfo(const SDNodeInfo &GenNodeInfo)
bool isTargetMemoryOpcode(unsigned Opcode) const override
Returns true if a node with the given target-specific opcode has a memory operand.
void verifyTargetNode(const SelectionDAG &DAG, const SDNode *N) const override
Checks that the given target-specific node is valid. Aborts if it is not.
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
const TargetSubtargetInfo & getSubtarget() const
SDValue getCopyToReg(SDValue Chain, const SDLoc &dl, Register Reg, SDValue N)
LLVM_ABI SDVTList getVTList(EVT VT)
Return an SDVTList that represents the list of values specified.
LLVM_ABI SDValue getMemset(SDValue Chain, const SDLoc &dl, SDValue Dst, SDValue Src, SDValue Size, Align Alignment, bool isVol, bool AlwaysInline, const CallInst *CI, MachinePointerInfo DstPtrInfo, const AAMDNodes &AAInfo=AAMDNodes())
LLVM_ABI SDValue getMemcpy(SDValue Chain, const SDLoc &dl, SDValue Dst, SDValue Src, SDValue Size, Align Alignment, bool isVol, bool AlwaysInline, const CallInst *CI, std::optional< bool > OverrideTailCall, MachinePointerInfo DstPtrInfo, MachinePointerInfo SrcPtrInfo, const AAMDNodes &AAInfo=AAMDNodes(), BatchAAResults *BatchAA=nullptr)
LLVM_ABI SDValue getConstant(uint64_t Val, const SDLoc &DL, EVT VT, bool isTarget=false, bool isOpaque=false)
Create a ConstantSDNode wrapping a constant value.
LLVM_ABI SDValue getIntPtrConstant(uint64_t Val, const SDLoc &DL, bool isTarget=false)
LLVM_ABI SDValue getValueType(EVT)
LLVM_ABI SDValue getNode(unsigned Opcode, const SDLoc &DL, EVT VT, ArrayRef< SDUse > Ops)
Gets or creates the specified node.
MachineFunction & getMachineFunction() const
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
LLVM Value Representation.
bool isTargetMemoryOpcode(unsigned Opcode) const override
Returns true if a node with the given target-specific opcode has a memory operand.
void verifyTargetNode(const SelectionDAG &DAG, const SDNode *N) const override
Checks that the given target-specific node is valid. Aborts if it is not.
const char * getTargetNodeName(unsigned Opcode) const override
Returns the name of the given target-specific opcode, suitable for debug printing.
SDValue EmitTargetCodeForMemcpy(SelectionDAG &DAG, const SDLoc &dl, SDValue Chain, SDValue Dst, SDValue Src, SDValue Size, Align Alignment, bool isVolatile, bool AlwaysInline, MachinePointerInfo DstPtrInfo, MachinePointerInfo SrcPtrInfo) const override
Emit target-specific code that performs a memcpy.
SDValue EmitTargetCodeForMemset(SelectionDAG &DAG, const SDLoc &dl, SDValue Chain, SDValue Dst, SDValue Src, SDValue Size, Align Alignment, bool isVolatile, bool AlwaysInline, MachinePointerInfo DstPtrInfo) const override
Emit target-specific code that performs a memset.
bool isTarget64BitLP64() const
Is this x86_64 with the LP64 programming model (standard AMD64, no x32)?
unsigned getMaxInlineSizeThreshold() const
Returns the maximum memset / memcpy size that still makes it profitable to inline the call.
@ ADD
Simple integer binary arithmetic operators.
@ TokenFactor
TokenFactor - This node takes multiple tokens as input and produces a single token result.
initializer< Ty > init(const Ty &Val)
This is an optimization pass for GlobalISel generic memory operations.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
constexpr bool isPowerOf2_64(uint64_t Value)
Return true if the argument is a power of two > 0 (64 bit edition.)
uint16_t MCPhysReg
An unsigned integer type large enough to represent all physical registers, but not necessarily virtua...
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
This struct is a compact representation of a valid (non-zero power of two) alignment.
constexpr uint64_t value() const
This is a hole in the type system and should not be abused.
This class contains a discriminated union of information about pointers in memory operands,...
LLVM_ABI unsigned getAddrSpace() const
Return the LLVM IR address space number that this pointer points into.
MachinePointerInfo getWithOffset(int64_t O) const
This represents a list of ValueType's that has been intern'd by a SelectionDAG.