24#include "llvm/IR/IntrinsicsDirectX.h"
34#define DEBUG_TYPE "dxil-intrinsic-expansion"
49 if (IsRaw && M->getTargetTriple().getDXILVersion() >
VersionTuple(1, 2))
58 if (M->getTargetTriple().getDXILVersion() >=
VersionTuple(1, 9))
63 if (!ValTy->getScalarType()->isHalfTy())
73 ConstantInt::get(IType, 0x7c00))
74 : ConstantInt::get(IType, 0x7c00);
81 ConstantInt::get(IType, 0xfc00))
82 : ConstantInt::get(IType, 0xfc00);
84 Value *IVal = Builder.CreateBitCast(Val, PosInf->
getType());
85 Value *B1 = Builder.CreateICmpEQ(IVal, PosInf);
86 Value *B2 = Builder.CreateICmpEQ(IVal, NegInf);
87 Value *B3 = Builder.CreateOr(B1, B2);
93 if (M->getTargetTriple().getDXILVersion() >=
VersionTuple(1, 9))
98 if (!ValTy->getScalarType()->isHalfTy())
109 ConstantInt::get(IType, 0x7c00))
110 : ConstantInt::get(IType, 0x7c00);
116 ConstantInt::get(IType, 0x3ff))
117 : ConstantInt::get(IType, 0x3ff);
124 ConstantInt::get(IType, 0))
125 : ConstantInt::get(IType, 0);
127 Value *IVal = Builder.CreateBitCast(Val, ExpBitMask->
getType());
128 Value *Exp = Builder.CreateAnd(IVal, ExpBitMask);
129 Value *B1 = Builder.CreateICmpEQ(Exp, ExpBitMask);
131 Value *Sig = Builder.CreateAnd(IVal, SigBitMask);
132 Value *B2 = Builder.CreateICmpNE(Sig, Zero);
133 Value *B3 = Builder.CreateAnd(B1, B2);
139 if (M->getTargetTriple().getDXILVersion() >=
VersionTuple(1, 9))
144 if (!ValTy->getScalarType()->isHalfTy())
155 ConstantInt::get(IType, 0x7c00))
156 : ConstantInt::get(IType, 0x7c00);
158 Value *IVal = Builder.CreateBitCast(Val, ExpBitMask->
getType());
159 Value *Exp = Builder.CreateAnd(IVal, ExpBitMask);
160 Value *B1 = Builder.CreateICmpNE(Exp, ExpBitMask);
166 if (M->getTargetTriple().getDXILVersion() >=
VersionTuple(1, 9))
171 if (!ValTy->getScalarType()->isHalfTy())
182 ConstantInt::get(IType, 0x7c00))
183 : ConstantInt::get(IType, 0x7c00);
189 ConstantInt::get(IType, 0))
190 : ConstantInt::get(IType, 0);
192 Value *IVal = Builder.CreateBitCast(Val, ExpBitMask->
getType());
193 Value *Exp = Builder.CreateAnd(IVal, ExpBitMask);
194 Value *NotAllZeroes = Builder.CreateICmpNE(Exp, Zero);
195 Value *NotAllOnes = Builder.CreateICmpNE(Exp, ExpBitMask);
196 Value *B1 = Builder.CreateAnd(NotAllZeroes, NotAllOnes);
201 switch (
F.getIntrinsicID()) {
202 case Intrinsic::assume:
204 case Intrinsic::atan2:
205 case Intrinsic::fshl:
206 case Intrinsic::fshr:
208 case Intrinsic::is_fpclass:
210 case Intrinsic::log10:
212 case Intrinsic::powi:
213 case Intrinsic::dx_all:
214 case Intrinsic::dx_any:
215 case Intrinsic::dx_cross:
216 case Intrinsic::dx_uclamp:
217 case Intrinsic::dx_sclamp:
218 case Intrinsic::dx_nclamp:
219 case Intrinsic::dx_degrees:
220 case Intrinsic::dx_isinf:
221 case Intrinsic::dx_isnan:
222 case Intrinsic::dx_lerp:
223 case Intrinsic::dx_normalize:
224 case Intrinsic::dx_fdot:
225 case Intrinsic::dx_sdot:
226 case Intrinsic::dx_udot:
227 case Intrinsic::dx_sign:
228 case Intrinsic::dx_step:
229 case Intrinsic::dx_radians:
230 case Intrinsic::usub_sat:
231 case Intrinsic::vector_reduce_add:
232 case Intrinsic::vector_reduce_fadd:
233 case Intrinsic::matrix_multiply:
235 case Intrinsic::dx_resource_load_rawbuffer:
237 F.getParent(),
F.getReturnType()->getStructElementType(0),
239 case Intrinsic::dx_resource_load_typedbuffer:
241 F.getParent(),
F.getReturnType()->getStructElementType(0),
243 case Intrinsic::dx_resource_store_rawbuffer:
245 F.getParent(),
F.getFunctionType()->getParamType(3),
true);
246 case Intrinsic::dx_resource_store_typedbuffer:
248 F.getParent(),
F.getFunctionType()->getParamType(2),
false);
256 Type *Ty =
A->getType();
260 Value *Cmp = Builder.CreateICmpULT(
A,
B,
"usub.cmp");
261 Value *
Sub = Builder.CreateSub(
A,
B,
"usub.sub");
262 Value *Zero = ConstantInt::get(Ty, 0);
263 return Builder.CreateSelect(Cmp, Zero,
Sub,
"usub.sat");
267 assert(IntrinsicId == Intrinsic::vector_reduce_add ||
268 IntrinsicId == Intrinsic::vector_reduce_fadd);
271 bool IsFAdd = (IntrinsicId == Intrinsic::vector_reduce_fadd);
274 Type *Ty =
X->getType();
276 unsigned XVecSize = XVec->getNumElements();
277 Value *Sum = Builder.CreateExtractElement(
X,
static_cast<uint64_t>(0));
283 Sum = Builder.CreateFAdd(Sum, StartValue);
287 for (
unsigned I = 1;
I < XVecSize;
I++) {
288 Value *Elt = Builder.CreateExtractElement(
X,
I);
290 Sum = Builder.CreateFAdd(Sum, Elt);
292 Sum = Builder.CreateAdd(Sum, Elt);
301 Type *Ty =
X->getType();
307 ConstantInt::get(EltTy, 0))
308 : ConstantInt::get(EltTy, 0);
309 auto *V = Builder.CreateSub(Zero,
X);
310 return Builder.CreateIntrinsic(Ty, Intrinsic::smax, {
X, V},
nullptr,
324 Value *op0_x = Builder.CreateExtractElement(op0, (
uint64_t)0,
"x0");
325 Value *op0_y = Builder.CreateExtractElement(op0, 1,
"x1");
326 Value *op0_z = Builder.CreateExtractElement(op0, 2,
"x2");
328 Value *op1_x = Builder.CreateExtractElement(op1, (
uint64_t)0,
"y0");
329 Value *op1_y = Builder.CreateExtractElement(op1, 1,
"y1");
330 Value *op1_z = Builder.CreateExtractElement(op1, 2,
"y2");
333 Value *xy = Builder.CreateFMul(x0, y1);
334 Value *yx = Builder.CreateFMul(y0, x1);
335 return Builder.CreateFSub(xy, yx, Orig->
getName());
338 Value *yz_zy = MulSub(op0_y, op0_z, op1_y, op1_z);
339 Value *zx_xz = MulSub(op0_z, op0_x, op1_z, op1_x);
340 Value *xy_yx = MulSub(op0_x, op0_y, op1_x, op1_y);
343 cross = Builder.CreateInsertElement(cross, yz_zy, (
uint64_t)0);
344 cross = Builder.CreateInsertElement(cross, zx_xz, 1);
345 cross = Builder.CreateInsertElement(cross, xy_yx, 2);
353 Type *ATy =
A->getType();
354 [[maybe_unused]]
Type *BTy =
B->getType();
364 int NumElts = AVec->getNumElements();
367 DotIntrinsic = Intrinsic::dx_dot2;
370 DotIntrinsic = Intrinsic::dx_dot3;
373 DotIntrinsic = Intrinsic::dx_dot4;
377 "Invalid dot product input vector: length is outside 2-4");
382 for (
int I = 0;
I < NumElts; ++
I)
383 Args.push_back(Builder.CreateExtractElement(
A, Builder.getInt32(
I)));
384 for (
int I = 0;
I < NumElts; ++
I)
385 Args.push_back(Builder.CreateExtractElement(
B, Builder.getInt32(
I)));
386 return Builder.CreateIntrinsic(ATy->
getScalarType(), DotIntrinsic, Args,
401 assert(DotIntrinsic == Intrinsic::dx_sdot ||
402 DotIntrinsic == Intrinsic::dx_udot);
405 Type *ATy =
A->getType();
406 [[maybe_unused]]
Type *BTy =
B->getType();
416 Intrinsic::ID MadIntrinsic = DotIntrinsic == Intrinsic::dx_sdot
418 : Intrinsic::dx_umad;
421 Result = Builder.CreateMul(Elt0, Elt1);
422 for (
unsigned I = 1;
I < AVec->getNumElements();
I++) {
423 Elt0 = Builder.CreateExtractElement(
A,
I);
424 Elt1 = Builder.CreateExtractElement(
B,
I);
425 Result = Builder.CreateIntrinsic(Result->getType(), MadIntrinsic,
435 Type *Ty =
X->getType();
443 Value *NewX = Builder.CreateFMul(Log2eConst,
X);
445 Builder.CreateIntrinsic(Ty, Intrinsic::exp2, {NewX},
nullptr,
"dx.exp2");
457 switch (TCI->getZExtValue()) {
471 Type *FTy =
F->getType();
472 unsigned FNumElem = 0;
478 Type *ElemTy = FVecTy->getElementType();
479 FNumElem = FVecTy->getNumElements();
480 BitWidth = ElemTy->getPrimitiveSizeInBits();
487 Value *FBitCast = Builder.CreateBitCast(
F, BitCastTy);
488 switch (TCI->getZExtValue()) {
495 Value *NegZeroSplat = Builder.CreateVectorSplat(FNumElem, NegZero);
497 Builder.CreateICmpEQ(FBitCast, NegZeroSplat,
"is.fpclass.negzero");
499 RetVal = Builder.CreateICmpEQ(FBitCast, NegZero,
"is.fpclass.negzero");
511 Type *Ty =
X->getType();
516 if (IntrinsicId == Intrinsic::dx_any)
517 return Builder.CreateOr(Result, Elt);
518 assert(IntrinsicId == Intrinsic::dx_all);
519 return Builder.CreateAnd(Result, Elt);
522 Value *Result =
nullptr;
523 if (!Ty->isVectorTy()) {
525 ? Builder.CreateFCmpUNE(
X, ConstantFP::get(EltTy, 0))
526 : Builder.CreateICmpNE(
X, ConstantInt::get(EltTy, 0));
531 ? Builder.CreateFCmpUNE(
534 ConstantFP::get(EltTy, 0)))
535 : Builder.CreateICmpNE(
538 ConstantInt::get(EltTy, 0)));
539 Result = Builder.CreateExtractElement(
Cond, (
uint64_t)0);
540 for (
unsigned I = 1;
I < XVec->getNumElements();
I++) {
541 Value *Elt = Builder.CreateExtractElement(
Cond,
I);
542 Result = ApplyOp(IntrinsicId, Result, Elt);
553 auto *V = Builder.CreateFSub(
Y,
X);
554 V = Builder.CreateFMul(S, V);
555 return Builder.CreateFAdd(
X, V,
"dx.lerp");
562 Type *Ty =
X->getType();
568 ConstantFP::get(EltTy, LogConstVal))
569 : ConstantFP::get(EltTy, LogConstVal);
571 Builder.CreateIntrinsic(Ty, Intrinsic::log2, {
X},
nullptr,
"elt.log2");
574 return Builder.CreateFMul(Ln2Const, Log2Call);
591 const APFloat &fpVal = constantFP->getValueAPF();
595 return Builder.CreateFDiv(
X,
X);
603 const APFloat &fpVal = constantFP->getValueAPF();
608 Value *Multiplicand = Builder.CreateIntrinsic(EltTy, Intrinsic::dx_rsqrt,
610 nullptr,
"dx.rsqrt");
612 Value *MultiplicandVec =
613 Builder.CreateVectorSplat(XVec->getNumElements(), Multiplicand);
614 return Builder.CreateFMul(
X, MultiplicandVec);
620 Type *Ty =
X->getType();
624 Value *Tan = Builder.CreateFDiv(
Y,
X);
627 Builder.CreateIntrinsic(Ty, Intrinsic::atan, {Tan},
nullptr,
"Elt.Atan");
635 Constant *Zero = ConstantFP::get(Ty, 0);
636 Value *AtanAddPi = Builder.CreateFAdd(Atan, Pi);
637 Value *AtanSubPi = Builder.CreateFSub(Atan, Pi);
640 Value *Result = Atan;
641 Value *XLt0 = Builder.CreateFCmpOLT(
X, Zero);
642 Value *XEq0 = Builder.CreateFCmpOEQ(
X, Zero);
643 Value *YGe0 = Builder.CreateFCmpOGE(
Y, Zero);
644 Value *YLt0 = Builder.CreateFCmpOLT(
Y, Zero);
647 Value *XLt0AndYGe0 = Builder.CreateAnd(XLt0, YGe0);
648 Result = Builder.CreateSelect(XLt0AndYGe0, AtanAddPi, Result);
651 Value *XLt0AndYLt0 = Builder.CreateAnd(XLt0, YLt0);
652 Result = Builder.CreateSelect(XLt0AndYLt0, AtanSubPi, Result);
655 Value *XEq0AndYLt0 = Builder.CreateAnd(XEq0, YLt0);
656 Result = Builder.CreateSelect(XEq0AndYLt0, NegHalfPi, Result);
659 Value *XEq0AndYGe0 = Builder.CreateAnd(XEq0, YGe0);
660 Result = Builder.CreateSelect(XEq0AndYGe0, HalfPi, Result);
665template <
bool LeftFunnel>
674 unsigned BitWidth = Ty->getScalarSizeInBits();
676 "Can't use Mask to compute modulo and inverse");
691 Constant *Mask = ConstantInt::get(Ty, Ty->getScalarSizeInBits() - 1);
696 Value *MaskedShift = Builder.CreateAnd(Shift, Mask);
701 Value *NotShift = Builder.CreateNot(Shift);
702 Value *InverseShift = Builder.CreateAnd(NotShift, Mask);
704 Constant *One = ConstantInt::get(Ty, 1);
709 ShiftedA = Builder.CreateShl(
A, MaskedShift);
710 Value *ShiftB1 = Builder.CreateLShr(
B, One);
711 ShiftedB = Builder.CreateLShr(ShiftB1, InverseShift);
713 Value *ShiftA1 = Builder.CreateShl(
A, One);
714 ShiftedA = Builder.CreateShl(ShiftA1, InverseShift);
715 ShiftedB = Builder.CreateLShr(
B, MaskedShift);
718 Value *Result = Builder.CreateOr(ShiftedA, ShiftedB);
726 Type *Ty =
X->getType();
729 if (IntrinsicId == Intrinsic::powi)
730 Y = Builder.CreateSIToFP(
Y, Ty);
733 Builder.CreateIntrinsic(Ty, Intrinsic::log2, {
X},
nullptr,
"elt.log2");
734 auto *
Mul = Builder.CreateFMul(Log2Call,
Y);
736 Builder.CreateIntrinsic(Ty, Intrinsic::exp2, {
Mul},
nullptr,
"elt.exp2");
746 Type *Ty =
X->getType();
749 Constant *One = ConstantFP::get(Ty->getScalarType(), 1.0);
750 Constant *Zero = ConstantFP::get(Ty->getScalarType(), 0.0);
753 if (Ty != Ty->getScalarType()) {
761 return Builder.CreateSelect(
Cond, Zero, One);
766 Type *Ty =
X->getType();
769 return Builder.CreateFMul(
X, PiOver180);
779 "Only expand double or int64 scalars or vectors");
780 bool IsVector =
false;
781 unsigned ExtractNum = 2;
783 ExtractNum = 2 * VT->getNumElements();
785 assert(IsRaw || ExtractNum == 4 &&
"TypedBufferLoad vector must be size 2");
794 while (ExtractNum > 0) {
795 unsigned LoadNum = std::min(ExtractNum, 4u);
799 Intrinsic::ID LoadIntrinsic = Intrinsic::dx_resource_load_typedbuffer;
802 LoadIntrinsic = Intrinsic::dx_resource_load_rawbuffer;
803 Value *Tmp = Builder.getInt32(4 *
Base * 2);
804 Args.push_back(Builder.CreateAdd(Orig->
getOperand(2), Tmp));
807 CallInst *Load = Builder.CreateIntrinsic(LoadType, LoadIntrinsic, Args);
811 Value *Extract = Builder.CreateExtractValue(Load, {0});
814 for (
unsigned I = 0;
I < LoadNum; ++
I)
816 Builder.CreateExtractElement(Extract, Builder.getInt32(
I)));
819 for (
unsigned I = 0;
I < LoadNum;
I += 2) {
820 Value *Combined =
nullptr;
823 Combined = Builder.CreateIntrinsic(
824 Builder.getDoubleTy(), Intrinsic::dx_asdouble,
825 {ExtractElements[I], ExtractElements[I + 1]});
830 Builder.CreateZExt(ExtractElements[
I], Builder.getInt64Ty());
832 Builder.CreateZExt(ExtractElements[
I + 1], Builder.getInt64Ty());
834 Value *ShiftedHi = Builder.CreateShl(
Hi, Builder.getInt64(32));
836 Combined = Builder.CreateOr(
Lo, ShiftedHi);
840 Result = Builder.CreateInsertElement(Result, Combined,
841 Builder.getInt32((
I / 2) +
Base));
846 ExtractNum -= LoadNum;
850 Value *CheckBit =
nullptr;
861 if (Indices[0] == 0) {
863 EVI->replaceAllUsesWith(Result);
866 assert(Indices[0] == 1 &&
"Unexpected type for typedbufferload");
871 for (
Value *L : Loads)
872 CheckBits.
push_back(Builder.CreateExtractValue(L, {1}));
873 CheckBit = Builder.CreateAnd(CheckBits);
875 EVI->replaceAllUsesWith(CheckBit);
877 EVI->eraseFromParent();
886 unsigned ValIndex = IsRaw ? 3 : 2;
891 "Only expand double or int64 scalars or vectors");
894 bool IsVector =
false;
895 unsigned ExtractNum = 2;
898 VecLen = VT->getNumElements();
899 assert(IsRaw || VecLen == 2 &&
"TypedBufferStore vector must be size 2");
900 ExtractNum = VecLen * 2;
913 Value *LowBits =
nullptr;
914 Value *HighBits =
nullptr;
918 Value *Split = Builder.CreateIntrinsic(SplitTy, Intrinsic::dx_splitdouble,
920 LowBits = Builder.CreateExtractValue(Split, 0);
921 HighBits = Builder.CreateExtractValue(Split, 1);
925 Constant *ShiftAmt = Builder.getInt64(32);
931 LowBits = Builder.CreateTrunc(InputVal, SplitElementTy);
932 Value *ShiftedVal = Builder.CreateLShr(InputVal, ShiftAmt);
933 HighBits = Builder.CreateTrunc(ShiftedVal, SplitElementTy);
938 for (
unsigned I = 0;
I < VecLen; ++
I) {
940 Mask.push_back(
I + VecLen);
942 Val = Builder.CreateShuffleVector(LowBits, HighBits, Mask);
944 Val = Builder.CreateInsertElement(Val, LowBits, Builder.getInt32(0));
945 Val = Builder.CreateInsertElement(Val, HighBits, Builder.getInt32(1));
952 while (ExtractNum > 0) {
953 unsigned StoreNum = std::min(ExtractNum, 4u);
955 Intrinsic::ID StoreIntrinsic = Intrinsic::dx_resource_store_typedbuffer;
958 StoreIntrinsic = Intrinsic::dx_resource_store_rawbuffer;
960 Args.push_back(Builder.CreateAdd(Orig->
getOperand(2), Tmp));
964 for (
unsigned I = 0;
I < StoreNum; ++
I) {
965 Mask.push_back(
Base +
I);
970 SubVal = Builder.CreateShuffleVector(Val, Mask);
972 Args.push_back(SubVal);
974 Builder.CreateIntrinsic(Builder.getVoidTy(), StoreIntrinsic, Args);
976 ExtractNum -= StoreNum;
984 if (ClampIntrinsic == Intrinsic::dx_uclamp)
985 return Intrinsic::umax;
986 if (ClampIntrinsic == Intrinsic::dx_sclamp)
987 return Intrinsic::smax;
988 assert(ClampIntrinsic == Intrinsic::dx_nclamp);
989 return Intrinsic::maxnum;
993 if (ClampIntrinsic == Intrinsic::dx_uclamp)
994 return Intrinsic::umin;
995 if (ClampIntrinsic == Intrinsic::dx_sclamp)
996 return Intrinsic::smin;
997 assert(ClampIntrinsic == Intrinsic::dx_nclamp);
998 return Intrinsic::minnum;
1006 Type *Ty =
X->getType();
1008 auto *MaxCall = Builder.CreateIntrinsic(Ty,
getMaxForClamp(ClampIntrinsic),
1009 {
X, Min},
nullptr,
"dx.max");
1010 return Builder.CreateIntrinsic(Ty,
getMinForClamp(ClampIntrinsic),
1011 {MaxCall, Max},
nullptr,
"dx.min");
1016 Type *Ty =
X->getType();
1019 return Builder.CreateFMul(
X, DegreesRatio);
1024 Type *Ty =
X->getType();
1034 GT = Builder.CreateFCmpOLT(Zero,
X);
1035 LT = Builder.CreateFCmpOLT(
X, Zero);
1038 GT = Builder.CreateICmpSLT(Zero,
X);
1039 LT = Builder.CreateICmpSLT(
X, Zero);
1042 Value *ZextGT = Builder.CreateZExt(GT, RetTy);
1043 Value *ZextLT = Builder.CreateZExt(LT, RetTy);
1045 return Builder.CreateSub(ZextGT, ZextLT);
1060 Type *EltTy = RetTy->getElementType();
1071 unsigned LHSSize = LHSRows * LHSCols;
1072 unsigned RHSSize = LHSCols * RHSCols;
1075 for (
unsigned I = 0;
I < LHSSize; ++
I)
1076 LHSElts[
I] = Builder.CreateExtractElement(
LHS,
I);
1077 for (
unsigned I = 0;
I < RHSSize; ++
I)
1078 RHSElts[
I] = Builder.CreateExtractElement(
RHS,
I);
1083 bool UseScalarFP = IsFP && (EltTy->
isDoubleTy() || LHSCols == 1);
1084 if (IsFP && !UseScalarFP) {
1087 FloatDotID = Intrinsic::dx_dot2;
1090 FloatDotID = Intrinsic::dx_dot3;
1093 FloatDotID = Intrinsic::dx_dot4;
1097 "Invalid matrix inner dimension for dot product: must be 2-4");
1102 for (
unsigned C = 0;
C < RHSCols; ++
C) {
1103 for (
unsigned R = 0; R < LHSRows; ++R) {
1106 for (
unsigned K = 0; K < LHSCols; ++K) {
1107 RowElts.
push_back(LHSElts[K * LHSRows + R]);
1114 Dot = Builder.CreateFMul(RowElts[0], ColElts[0]);
1115 for (
unsigned K = 1; K < LHSCols; ++K)
1116 Dot = Builder.CreateIntrinsic(EltTy, Intrinsic::fmuladd,
1117 {RowElts[K], ColElts[K], Dot});
1121 Args.append(RowElts.
begin(), RowElts.
end());
1122 Args.append(ColElts.
begin(), ColElts.
end());
1123 Dot = Builder.CreateIntrinsic(EltTy, FloatDotID, Args);
1126 Dot = Builder.CreateMul(RowElts[0], ColElts[0]);
1127 for (
unsigned K = 1; K < LHSCols; ++K)
1128 Dot = Builder.CreateIntrinsic(EltTy, Intrinsic::dx_imad,
1129 {RowElts[K], ColElts[K], Dot});
1131 unsigned ResIdx =
C * LHSRows + R;
1132 Result = Builder.CreateInsertElement(Result, Dot, ResIdx);
1139 Value *Result =
nullptr;
1141 switch (IntrinsicId) {
1142 case Intrinsic::abs:
1145 case Intrinsic::assume:
1148 case Intrinsic::atan2:
1151 case Intrinsic::fshl:
1154 case Intrinsic::fshr:
1157 case Intrinsic::exp:
1160 case Intrinsic::is_fpclass:
1163 case Intrinsic::log:
1166 case Intrinsic::log10:
1169 case Intrinsic::pow:
1170 case Intrinsic::powi:
1173 case Intrinsic::dx_all:
1174 case Intrinsic::dx_any:
1177 case Intrinsic::dx_cross:
1180 case Intrinsic::dx_uclamp:
1181 case Intrinsic::dx_sclamp:
1182 case Intrinsic::dx_nclamp:
1185 case Intrinsic::dx_degrees:
1188 case Intrinsic::dx_isinf:
1191 case Intrinsic::dx_isnan:
1194 case Intrinsic::dx_lerp:
1197 case Intrinsic::dx_normalize:
1200 case Intrinsic::dx_fdot:
1203 case Intrinsic::dx_sdot:
1204 case Intrinsic::dx_udot:
1207 case Intrinsic::dx_sign:
1210 case Intrinsic::dx_step:
1213 case Intrinsic::dx_radians:
1216 case Intrinsic::dx_resource_load_rawbuffer:
1220 case Intrinsic::dx_resource_store_rawbuffer:
1224 case Intrinsic::dx_resource_load_typedbuffer:
1228 case Intrinsic::dx_resource_store_typedbuffer:
1232 case Intrinsic::usub_sat:
1235 case Intrinsic::vector_reduce_add:
1236 case Intrinsic::vector_reduce_fadd:
1239 case Intrinsic::matrix_multiply:
1255 bool IntrinsicExpanded =
false;
1262 if (
F.user_empty() && IntrinsicExpanded)
1263 F.eraseFromParent();
1282 "DXIL Intrinsic Expansion",
false,
false)
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
This file contains the declarations for the subclasses of Constant, which represent the different fla...
static Value * expand16BitIsNormal(CallInst *Orig)
static Value * expandNormalizeIntrinsic(CallInst *Orig)
static bool expandIntrinsic(Function &F, CallInst *Orig)
static Value * expandClampIntrinsic(CallInst *Orig, Intrinsic::ID ClampIntrinsic)
static Value * expand16BitIsInf(CallInst *Orig)
static bool expansionIntrinsics(Module &M)
static Value * expand16BitIsFinite(CallInst *Orig)
static Value * expandLerpIntrinsic(CallInst *Orig)
static Value * expandCrossIntrinsic(CallInst *Orig)
static Value * expandUsubSat(CallInst *Orig)
static Value * expandAnyOrAllIntrinsic(CallInst *Orig, Intrinsic::ID IntrinsicId)
static Value * expandVecReduceAdd(CallInst *Orig, Intrinsic::ID IntrinsicId)
static Value * expandAtan2Intrinsic(CallInst *Orig)
static Value * expandLog10Intrinsic(CallInst *Orig)
static Intrinsic::ID getMinForClamp(Intrinsic::ID ClampIntrinsic)
static Value * expandStepIntrinsic(CallInst *Orig)
static Value * expandIntegerDotIntrinsic(CallInst *Orig, Intrinsic::ID DotIntrinsic)
static bool expandBufferStoreIntrinsic(CallInst *Orig, bool IsRaw)
static Value * expandLogIntrinsic(CallInst *Orig, float LogConstVal=numbers::ln2f)
static Value * expandDegreesIntrinsic(CallInst *Orig)
static Value * expandPowIntrinsic(CallInst *Orig, Intrinsic::ID IntrinsicId)
static bool resourceAccessNeeds64BitExpansion(Module *M, Type *OverloadTy, bool IsRaw)
static Value * expandExpIntrinsic(CallInst *Orig)
static Value * expand16BitIsNaN(CallInst *Orig)
static Value * expandSignIntrinsic(CallInst *Orig)
static Intrinsic::ID getMaxForClamp(Intrinsic::ID ClampIntrinsic)
static Value * expandAbs(CallInst *Orig)
static Value * expandFloatDotIntrinsic(CallInst *Orig, Value *A, Value *B)
static Value * expandRadiansIntrinsic(CallInst *Orig)
static bool isIntrinsicExpansion(Function &F)
static bool expandBufferLoadIntrinsic(CallInst *Orig, bool IsRaw)
static Value * expandMatrixMultiply(CallInst *Orig)
static Value * expandIsFPClass(CallInst *Orig)
static Value * expandFunnelShiftIntrinsic(CallInst *Orig)
Module.h This file contains the declarations for the Module class.
This header defines various interfaces for pass management in LLVM.
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
const SmallVectorImpl< MachineOperand > & Cond
static unsigned getNumElements(Type *Ty)
This file defines the SmallVector class.
static TableGen::Emitter::Opt Y("gen-skeleton-entry", EmitSkeleton, "Generate example skeleton entry")
static TableGen::Emitter::OptClass< SkeletonEmitter > X("gen-skeleton-class", "Generate example skeleton class")
bool runOnModule(Module &M) override
runOnModule - Virtual method overriden by subclasses to process the module being operated on.
DXILIntrinsicExpansionLegacy()
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
size_t size() const
size - Get the array size.
void setAttributes(AttributeList A)
Set the attributes for this call.
Value * getArgOperand(unsigned i) const
FunctionType * getFunctionType() const
AttributeList getAttributes() const
Return the attributes for this call.
This class represents a function call, abstracting a target machine's calling convention.
void setTailCall(bool IsTc=true)
static LLVM_ABI Constant * getSplat(ElementCount EC, Constant *Elt)
Return a ConstantVector with the specified constant in each element.
This is an important base class in LLVM.
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
LLVM_ABI bool isNullValue() const
Return true if this is the value that would be returned by getNullValue.
PreservedAnalyses run(Module &M, ModuleAnalysisManager &)
static constexpr ElementCount getFixed(ScalarTy MinVal)
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
Type * getParamType(unsigned i) const
Parameter type accessors.
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
LLVM_ABI const Module * getModule() const
Return the module owning the function this instruction belongs to or nullptr it the function does not...
LLVM_ABI InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
LLVM_ABI FastMathFlags getFastMathFlags() const LLVM_READONLY
Convenience function for getting all the fast-math flags, which must be an operator which supports th...
ModulePass class - This class is used to implement unstructured interprocedural optimizations and ana...
A Module instance is used to store all the information related to an LLVM module.
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses none()
Convenience factory function for the empty preserved set.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
static LLVM_ABI StructType * get(LLVMContext &Context, ArrayRef< Type * > Elements, bool isPacked=false)
This static method is the primary way to create a literal StructType.
The instances of the Type class are immutable: once they are created, they are never changed.
LLVM_ABI Type * getStructElementType(unsigned N) const
bool isVectorTy() const
True if this is an instance of VectorType.
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
LLVM_ABI TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
static LLVM_ABI IntegerType * getInt16Ty(LLVMContext &C)
bool isDoubleTy() const
Return true if this is 'double', a 64-bit IEEE fp type.
bool isFloatingPointTy() const
Return true if this is one of the floating-point types.
bool isIntegerTy() const
True if this is an instance of IntegerType.
static LLVM_ABI IntegerType * getIntNTy(LLVMContext &C, unsigned N)
Value * getOperand(unsigned i) const
LLVM Value Representation.
Type * getType() const
All values are typed, get the type of this value.
LLVM_ABI void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
iterator_range< user_iterator > users()
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
static LLVM_ABI VectorType * get(Type *ElementType, ElementCount EC)
This static method is the primary way to construct an VectorType.
Represents a version number in the form major[.minor[.subminor[.build]]].
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
@ C
The default llvm calling convention, compatible with C.
This is an optimization pass for GlobalISel generic memory operations.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
FunctionAddr VTableAddr uintptr_t uintptr_t Int32Ty
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
ModulePass * createDXILIntrinsicExpansionLegacyPass()
Pass to expand intrinsic operations that lack DXIL opCodes.
@ Sub
Subtraction of integers.
constexpr unsigned BitWidth
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
AnalysisManager< Module > ModuleAnalysisManager
Convenience typedef for the Module analysis manager.
LLVM_ABI void reportFatalUsageError(Error Err)
Report a fatal error that does not indicate a bug in LLVM.