LLVM 23.0.0git
InstCombineInternal.h
Go to the documentation of this file.
1//===- InstCombineInternal.h - InstCombine pass internals -------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9/// \file
10///
11/// This file provides internal interfaces used to implement the InstCombine.
12//
13//===----------------------------------------------------------------------===//
14
15#ifndef LLVM_LIB_TRANSFORMS_INSTCOMBINE_INSTCOMBINEINTERNAL_H
16#define LLVM_LIB_TRANSFORMS_INSTCOMBINE_INSTCOMBINEINTERNAL_H
17
19#include "llvm/ADT/Statistic.h"
23#include "llvm/IR/IRBuilder.h"
24#include "llvm/IR/InstVisitor.h"
27#include "llvm/IR/Value.h"
28#include "llvm/Support/Debug.h"
33#include <cassert>
34
35#define DEBUG_TYPE "instcombine"
37
38// As a default, let's assume that we want to be aggressive,
39// and attempt to traverse with no limits in attempt to sink negation.
40static constexpr unsigned NegatorDefaultMaxDepth = ~0U;
41
42// Let's guesstimate that most often we will end up visiting/producing
43// fairly small number of new instructions.
44static constexpr unsigned NegatorMaxNodesSSO = 16;
45
46namespace llvm {
47
48class AAResults;
49class APInt;
50class AssumptionCache;
51class BlockFrequencyInfo;
52class DataLayout;
53class DominatorTree;
54class GEPOperator;
55class GlobalVariable;
56class OptimizationRemarkEmitter;
57class ProfileSummaryInfo;
58class TargetLibraryInfo;
59class User;
60
62 : public InstCombiner,
63 public InstVisitor<InstCombinerImpl, Instruction *> {
64public:
74
75 ~InstCombinerImpl() override = default;
76
77 /// Perform early cleanup and prepare the InstCombine worklist.
79
80 /// Run the combiner over the entire worklist until it is empty.
81 ///
82 /// \returns true if the IR is changed.
83 bool run();
84
85 // Visitation implementation - Implement instruction combining for different
86 // instruction types. The semantics are as follows:
87 // Return Value:
88 // null - No change was made
89 // I - Change was made, I is still valid, I may be dead though
90 // otherwise - Change was made, replace I with returned instruction
91 //
96 Value *LHS, Value *RHS, Type *Ty, bool isNUW);
113 Value *simplifyRangeCheck(ICmpInst *Cmp0, ICmpInst *Cmp1, bool Inverted);
122 BinaryOperator *Sh0, const SimplifyQuery &SQ,
123 bool AnalyzeForSignBitExtraction = false);
127 BinaryOperator &OldAShr);
158
165 Instruction *visitFree(CallInst &FI, Value *FreedOp);
186 bool freezeOtherUses(FreezeInst &FI);
189
190 /// Specify what to return for unhandled instructions.
192
193 /// True when DB dominates all uses of DI except UI.
194 /// UI must be in the same block as DI.
195 /// The routine checks that the DI parent and DB are different.
196 bool dominatesAllUses(const Instruction *DI, const Instruction *UI,
197 const BasicBlock *DB) const;
198
199 /// Try to replace select with select operand SIOpd in SI-ICmp sequence.
200 bool replacedSelectWithOperand(SelectInst *SI, const ICmpInst *Icmp,
201 const unsigned SIOpd);
202
203 LoadInst *combineLoadToNewType(LoadInst &LI, Type *NewTy,
204 const Twine &Suffix = "");
205
206 /// Check if fmul \p MulVal, +0.0 will yield +0.0 (or signed zero is
207 /// ignorable).
209 const Instruction *CtxI) const;
210
211 std::optional<std::pair<Intrinsic::ID, SmallVector<Value *, 3>>>
213
214private:
215 bool annotateAnyAllocSite(CallBase &Call, const TargetLibraryInfo *TLI);
216 bool isDesirableIntType(unsigned BitWidth) const;
217 bool shouldChangeType(unsigned FromBitWidth, unsigned ToBitWidth) const;
218 bool shouldChangeType(Type *From, Type *To) const;
219 Value *dyn_castNegVal(Value *V) const;
220
221 /// Classify whether a cast is worth optimizing.
222 ///
223 /// This is a helper to decide whether the simplification of
224 /// logic(cast(A), cast(B)) to cast(logic(A, B)) should be performed.
225 ///
226 /// \param CI The cast we are interested in.
227 ///
228 /// \return true if this cast actually results in any code being generated and
229 /// if it cannot already be eliminated by some other transformation.
230 bool shouldOptimizeCast(CastInst *CI);
231
232 /// Try to optimize a sequence of instructions checking if an operation
233 /// on LHS and RHS overflows.
234 ///
235 /// If this overflow check is done via one of the overflow check intrinsics,
236 /// then CtxI has to be the call instruction calling that intrinsic. If this
237 /// overflow check is done by arithmetic followed by a compare, then CtxI has
238 /// to be the arithmetic instruction.
239 ///
240 /// If a simplification is possible, stores the simplified result of the
241 /// operation in OperationResult and result of the overflow check in
242 /// OverflowResult, and return true. If no simplification is possible,
243 /// returns false.
244 bool OptimizeOverflowCheck(Instruction::BinaryOps BinaryOp, bool IsSigned,
245 Value *LHS, Value *RHS,
246 Instruction &CtxI, Value *&OperationResult,
248
249 Instruction *visitCallBase(CallBase &Call);
250 Instruction *tryOptimizeCall(CallInst *CI);
251 bool transformConstExprCastCall(CallBase &Call);
252 Instruction *transformCallThroughTrampoline(CallBase &Call,
253 IntrinsicInst &Tramp);
254
255 /// Try to optimize a call to the result of a ptrauth intrinsic, potentially
256 /// into the ptrauth call bundle:
257 /// - call(ptrauth.resign(p)), ["ptrauth"()] -> call p, ["ptrauth"()]
258 /// - call(ptrauth.sign(p)), ["ptrauth"()] -> call p
259 /// as long as the key/discriminator are the same in sign and auth-bundle,
260 /// and we don't change the key in the bundle (to a potentially-invalid key.)
261 Instruction *foldPtrAuthIntrinsicCallee(CallBase &Call);
262
263 /// Try to optimize a call to a ptrauth constant, into its ptrauth bundle:
264 /// call(ptrauth(f)), ["ptrauth"()] -> call f
265 /// as long as the key/discriminator are the same in constant and bundle.
266 Instruction *foldPtrAuthConstantCallee(CallBase &Call);
267
268 // Return (a, b) if (LHS, RHS) is known to be (a, b) or (b, a).
269 // Otherwise, return std::nullopt
270 // Currently it matches:
271 // - LHS = (select c, a, b), RHS = (select c, b, a)
272 // - LHS = (phi [a, BB0], [b, BB1]), RHS = (phi [b, BB0], [a, BB1])
273 // - LHS = min(a, b), RHS = max(a, b)
274 std::optional<std::pair<Value *, Value *>> matchSymmetricPair(Value *LHS,
275 Value *RHS);
276
277 Value *simplifyMaskedLoad(IntrinsicInst &II);
278 Instruction *simplifyMaskedStore(IntrinsicInst &II);
279 Instruction *simplifyMaskedGather(IntrinsicInst &II);
280 Instruction *simplifyMaskedScatter(IntrinsicInst &II);
281
282 /// Transform (zext icmp) to bitwise / integer operations in order to
283 /// eliminate it.
284 ///
285 /// \param ICI The icmp of the (zext icmp) pair we are interested in.
286 /// \parem CI The zext of the (zext icmp) pair we are interested in.
287 ///
288 /// \return null if the transformation cannot be performed. If the
289 /// transformation can be performed the new instruction that replaces the
290 /// (zext icmp) pair will be returned.
291 Instruction *transformZExtICmp(ICmpInst *Cmp, ZExtInst &Zext);
292
293 Instruction *transformSExtICmp(ICmpInst *Cmp, SExtInst &Sext);
294
295 bool willNotOverflowSignedAdd(const WithCache<const Value *> &LHS,
297 const Instruction &CxtI) const {
298 return computeOverflowForSignedAdd(LHS, RHS, &CxtI) ==
300 }
301
302 bool willNotOverflowUnsignedAdd(const WithCache<const Value *> &LHS,
304 const Instruction &CxtI) const {
305 return computeOverflowForUnsignedAdd(LHS, RHS, &CxtI) ==
307 }
308
309 bool willNotOverflowAdd(const Value *LHS, const Value *RHS,
310 const Instruction &CxtI, bool IsSigned) const {
311 return IsSigned ? willNotOverflowSignedAdd(LHS, RHS, CxtI)
312 : willNotOverflowUnsignedAdd(LHS, RHS, CxtI);
313 }
314
315 bool willNotOverflowSignedSub(const Value *LHS, const Value *RHS,
316 const Instruction &CxtI) const {
317 return computeOverflowForSignedSub(LHS, RHS, &CxtI) ==
318 OverflowResult::NeverOverflows;
319 }
320
321 bool willNotOverflowUnsignedSub(const Value *LHS, const Value *RHS,
322 const Instruction &CxtI) const {
323 return computeOverflowForUnsignedSub(LHS, RHS, &CxtI) ==
324 OverflowResult::NeverOverflows;
325 }
326
327 bool willNotOverflowSub(const Value *LHS, const Value *RHS,
328 const Instruction &CxtI, bool IsSigned) const {
329 return IsSigned ? willNotOverflowSignedSub(LHS, RHS, CxtI)
330 : willNotOverflowUnsignedSub(LHS, RHS, CxtI);
331 }
332
333 bool willNotOverflowSignedMul(const Value *LHS, const Value *RHS,
334 const Instruction &CxtI) const {
335 return computeOverflowForSignedMul(LHS, RHS, &CxtI) ==
336 OverflowResult::NeverOverflows;
337 }
338
339 bool willNotOverflowUnsignedMul(const Value *LHS, const Value *RHS,
340 const Instruction &CxtI,
341 bool IsNSW = false) const {
342 return computeOverflowForUnsignedMul(LHS, RHS, &CxtI, IsNSW) ==
343 OverflowResult::NeverOverflows;
344 }
345
346 bool willNotOverflowMul(const Value *LHS, const Value *RHS,
347 const Instruction &CxtI, bool IsSigned) const {
348 return IsSigned ? willNotOverflowSignedMul(LHS, RHS, CxtI)
349 : willNotOverflowUnsignedMul(LHS, RHS, CxtI);
350 }
351
352 bool willNotOverflow(BinaryOperator::BinaryOps Opcode, const Value *LHS,
353 const Value *RHS, const Instruction &CxtI,
354 bool IsSigned) const {
355 switch (Opcode) {
356 case Instruction::Add: return willNotOverflowAdd(LHS, RHS, CxtI, IsSigned);
357 case Instruction::Sub: return willNotOverflowSub(LHS, RHS, CxtI, IsSigned);
358 case Instruction::Mul: return willNotOverflowMul(LHS, RHS, CxtI, IsSigned);
359 default: llvm_unreachable("Unexpected opcode for overflow query");
360 }
361 }
362
363 Value *EmitGEPOffset(GEPOperator *GEP, bool RewriteGEP = false);
364 /// Emit sum of multiple GEP offsets. The GEPs are processed in reverse
365 /// order.
366 Value *EmitGEPOffsets(ArrayRef<GEPOperator *> GEPs, GEPNoWrapFlags NW,
367 Type *IdxTy, bool RewriteGEPs);
368 Instruction *scalarizePHI(ExtractElementInst &EI, PHINode *PN);
369 Instruction *foldBitcastExtElt(ExtractElementInst &ExtElt);
370 Instruction *foldCastedBitwiseLogic(BinaryOperator &I);
371 Instruction *foldFBinOpOfIntCasts(BinaryOperator &I);
372 // Should only be called by `foldFBinOpOfIntCasts`.
373 Instruction *foldFBinOpOfIntCastsFromSign(
374 BinaryOperator &BO, bool OpsFromSigned, std::array<Value *, 2> IntOps,
375 Constant *Op1FpC, SmallVectorImpl<WithCache<const Value *>> &OpsKnown);
376 Instruction *foldBinopOfSextBoolToSelect(BinaryOperator &I);
377 Instruction *narrowBinOp(TruncInst &Trunc);
378 Instruction *narrowMaskedBinOp(BinaryOperator &And);
379 Instruction *narrowMathIfNoOverflow(BinaryOperator &I);
380 Instruction *narrowFunnelShift(TruncInst &Trunc);
381 Instruction *optimizeBitCastFromPhi(CastInst &CI, PHINode *PN);
382 Instruction *matchSAddSubSat(IntrinsicInst &MinMax1);
383 Instruction *foldNot(BinaryOperator &I);
384 Instruction *foldBinOpOfDisplacedShifts(BinaryOperator &I);
385
386 /// Determine if a pair of casts can be replaced by a single cast.
387 ///
388 /// \param CI1 The first of a pair of casts.
389 /// \param CI2 The second of a pair of casts.
390 ///
391 /// \return 0 if the cast pair cannot be eliminated, otherwise returns an
392 /// Instruction::CastOps value for a cast that can replace the pair, casting
393 /// CI1->getSrcTy() to CI2->getDstTy().
394 ///
395 /// \see CastInst::isEliminableCastPair
396 Instruction::CastOps isEliminableCastPair(const CastInst *CI1,
397 const CastInst *CI2);
398 Value *simplifyIntToPtrRoundTripCast(Value *Val);
399
400 Value *foldAndOrOfICmps(ICmpInst *LHS, ICmpInst *RHS, Instruction &I,
401 bool IsAnd, bool IsLogical = false);
402 Value *foldXorOfICmps(ICmpInst *LHS, ICmpInst *RHS, BinaryOperator &Xor);
403
404 Value *foldEqOfParts(Value *Cmp0, Value *Cmp1, bool IsAnd);
405
406 Value *foldAndOrOfICmpsUsingRanges(ICmpInst *ICmp1, ICmpInst *ICmp2,
407 bool IsAnd);
408
409 /// Optimize (fcmp)&(fcmp) or (fcmp)|(fcmp).
410 /// NOTE: Unlike most of instcombine, this returns a Value which should
411 /// already be inserted into the function.
412 Value *foldLogicOfFCmps(FCmpInst *LHS, FCmpInst *RHS, bool IsAnd,
413 bool IsLogicalSelect = false);
414
415 Instruction *foldLogicOfIsFPClass(BinaryOperator &Operator, Value *LHS,
416 Value *RHS);
417
418 Value *foldBooleanAndOr(Value *LHS, Value *RHS, Instruction &I, bool IsAnd,
419 bool IsLogical);
420
421 Value *reassociateBooleanAndOr(Value *LHS, Value *X, Value *Y, Instruction &I,
422 bool IsAnd, bool RHSIsLogical);
423
424 Value *foldDisjointOr(Value *LHS, Value *RHS);
425
426 Value *reassociateDisjointOr(Value *LHS, Value *RHS);
427
429 canonicalizeConditionalNegationViaMathToSelect(BinaryOperator &i);
430
431 Value *matchSelectFromAndOr(Value *A, Value *B, Value *C, Value *D,
432 bool InvertFalseVal = false);
433 Value *getSelectCondition(Value *A, Value *B, bool ABIsTheSame);
434
435 Instruction *foldLShrOverflowBit(BinaryOperator &I);
436 Instruction *foldExtractOfOverflowIntrinsic(ExtractValueInst &EV);
437 Instruction *foldIntrinsicWithOverflowCommon(IntrinsicInst *II);
438 Instruction *foldIntrinsicIsFPClass(IntrinsicInst &II);
439 Instruction *foldFPSignBitOps(BinaryOperator &I);
440 Instruction *foldFDivConstantDivisor(BinaryOperator &I);
441
442 // Optimize one of these forms:
443 // and i1 Op, SI / select i1 Op, i1 SI, i1 false (if IsAnd = true)
444 // or i1 Op, SI / select i1 Op, i1 true, i1 SI (if IsAnd = false)
445 // into simplier select instruction using isImpliedCondition.
446 Instruction *foldAndOrOfSelectUsingImpliedCond(Value *Op, SelectInst &SI,
447 bool IsAnd);
448
449 Instruction *hoistFNegAboveFMulFDiv(Value *FNegOp, Instruction &FMFSource);
450
451 /// Simplify \p V given that it is known to be non-null.
452 /// Returns the simplified value if possible, otherwise returns nullptr.
453 /// If \p HasDereferenceable is true, the simplification will not perform
454 /// same object checks.
455 Value *simplifyNonNullOperand(Value *V, bool HasDereferenceable,
456 unsigned Depth = 0);
457
458 /// Create `select C, S1, S2`. Use only when the profile cannot be calculated
459 /// from existing profile metadata: if the Function has profiles, this will
460 /// set the profile of this select to "unknown".
461 SelectInst *
462 createSelectInstWithUnknownProfile(Value *C, Value *S1, Value *S2,
463 const Twine &NameStr = "",
464 InsertPosition InsertBefore = nullptr) {
465 auto *Sel = SelectInst::Create(C, S1, S2, NameStr, InsertBefore, nullptr);
467 return Sel;
468 }
469
470public:
471 /// Create and insert the idiom we use to indicate a block is unreachable
472 /// without having to rewrite the CFG from within InstCombine.
474 auto &Ctx = InsertAt->getContext();
475 auto *SI = new StoreInst(ConstantInt::getTrue(Ctx),
477 /*isVolatile*/ false, Align(1));
478 InsertNewInstWith(SI, InsertAt->getIterator());
479 }
480
481 /// Combiner aware instruction erasure.
482 ///
483 /// When dealing with an instruction that has side effects or produces a void
484 /// value, we can't rely on DCE to delete the instruction. Instead, visit
485 /// methods should return the value returned by this function.
487 LLVM_DEBUG(dbgs() << "IC: ERASE " << I << '\n');
488 assert(I.use_empty() && "Cannot erase instruction that is used!");
490
491 // Make sure that we reprocess all operands now that we reduced their
492 // use counts.
493 SmallVector<Value *> Ops(I.operands());
494 Worklist.remove(&I);
495 DC.removeValue(&I);
496 I.eraseFromParent();
497 for (Value *Op : Ops)
498 Worklist.handleUseCountDecrement(Op);
499 MadeIRChange = true;
500 return nullptr; // Don't do anything with FI
501 }
502
503 OverflowResult computeOverflow(
504 Instruction::BinaryOps BinaryOp, bool IsSigned,
505 Value *LHS, Value *RHS, Instruction *CxtI) const;
506
507 /// Performs a few simplifications for operators which are associative
508 /// or commutative.
509 bool SimplifyAssociativeOrCommutative(BinaryOperator &I);
510
511 /// Tries to simplify binary operations which some other binary
512 /// operation distributes over.
513 ///
514 /// It does this by either by factorizing out common terms (eg "(A*B)+(A*C)"
515 /// -> "A*(B+C)") or expanding out if this results in simplifications (eg: "A
516 /// & (B | C) -> (A&B) | (A&C)" if this is a win). Returns the simplified
517 /// value, or null if it didn't simplify.
518 Value *foldUsingDistributiveLaws(BinaryOperator &I);
519
520 /// Tries to simplify add operations using the definition of remainder.
521 ///
522 /// The definition of remainder is X % C = X - (X / C ) * C. The add
523 /// expression X % C0 + (( X / C0 ) % C1) * C0 can be simplified to
524 /// X % (C0 * C1)
525 Value *SimplifyAddWithRemainder(BinaryOperator &I);
526
527 // Binary Op helper for select operations where the expression can be
528 // efficiently reorganized.
529 Value *SimplifySelectsFeedingBinaryOp(BinaryOperator &I, Value *LHS,
530 Value *RHS);
531
532 // If `I` has operand `(ctpop (not x))`, fold `I` with `(sub nuw nsw
533 // BitWidth(x), (ctpop x))`.
534 Instruction *tryFoldInstWithCtpopWithNot(Instruction *I);
535
536 // (Binop1 (Binop2 (logic_shift X, C), C1), (logic_shift Y, C))
537 // -> (logic_shift (Binop1 (Binop2 X, inv_logic_shift(C1, C)), Y), C)
538 // (Binop1 (Binop2 (logic_shift X, Amt), Mask), (logic_shift Y, Amt))
539 // -> (BinOp (logic_shift (BinOp X, Y)), Mask)
540 Instruction *foldBinOpShiftWithShift(BinaryOperator &I);
541
542 /// Tries to simplify binops of select and cast of the select condition.
543 ///
544 /// (Binop (cast C), (select C, T, F))
545 /// -> (select C, C0, C1)
546 Instruction *foldBinOpOfSelectAndCastOfSelectCondition(BinaryOperator &I);
547
548 /// This tries to simplify binary operations by factorizing out common terms
549 /// (e. g. "(A*B)+(A*C)" -> "A*(B+C)").
550 Value *tryFactorizationFolds(BinaryOperator &I);
551
552 /// Match a select chain which produces one of three values based on whether
553 /// the LHS is less than, equal to, or greater than RHS respectively.
554 /// Return true if we matched a three way compare idiom. The LHS, RHS, Less,
555 /// Equal and Greater values are saved in the matching process and returned to
556 /// the caller.
557 bool matchThreeWayIntCompare(SelectInst *SI, Value *&LHS, Value *&RHS,
558 ConstantInt *&Less, ConstantInt *&Equal,
559 ConstantInt *&Greater);
560
561 /// Attempts to replace I with a simpler value based on the demanded
562 /// bits.
563 Value *SimplifyDemandedUseBits(Instruction *I, const APInt &DemandedMask,
564 KnownBits &Known, const SimplifyQuery &Q,
565 unsigned Depth = 0);
567 bool SimplifyDemandedBits(Instruction *I, unsigned Op,
568 const APInt &DemandedMask, KnownBits &Known,
569 const SimplifyQuery &Q,
570 unsigned Depth = 0) override;
571
572 /// Helper routine of SimplifyDemandedUseBits. It computes KnownZero/KnownOne
573 /// bits. It also tries to handle simplifications that can be done based on
574 /// DemandedMask, but without modifying the Instruction.
575 Value *SimplifyMultipleUseDemandedBits(Instruction *I,
576 const APInt &DemandedMask,
577 KnownBits &Known,
578 const SimplifyQuery &Q,
579 unsigned Depth = 0);
580
581 /// Helper routine of SimplifyDemandedUseBits. It tries to simplify demanded
582 /// bit for "r1 = shr x, c1; r2 = shl r1, c2" instruction sequence.
583 Value *simplifyShrShlDemandedBits(
584 Instruction *Shr, const APInt &ShrOp1, Instruction *Shl,
585 const APInt &ShlOp1, const APInt &DemandedMask, KnownBits &Known);
586
587 /// Tries to simplify operands to an integer instruction based on its
588 /// demanded bits.
589 bool SimplifyDemandedInstructionBits(Instruction &Inst);
590 bool SimplifyDemandedInstructionBits(Instruction &Inst, KnownBits &Known);
591
592 Value *SimplifyDemandedVectorElts(Value *V, APInt DemandedElts,
593 APInt &PoisonElts, unsigned Depth = 0,
594 bool AllowMultipleUsers = false) override;
595
596 /// Attempts to replace V with a simpler value based on the demanded
597 /// floating-point classes
598 Value *SimplifyDemandedUseFPClass(Instruction *I, FPClassTest DemandedMask,
599 KnownFPClass &Known, const SimplifyQuery &Q,
600 unsigned Depth = 0);
601 Value *SimplifyMultipleUseDemandedFPClass(Instruction *I,
602 FPClassTest DemandedMask,
603 KnownFPClass &Known,
604 const SimplifyQuery &Q,
605 unsigned Depth);
606
607 bool SimplifyDemandedFPClass(Instruction *I, unsigned Op,
608 FPClassTest DemandedMask, KnownFPClass &Known,
609 unsigned Depth = 0);
610
611 bool SimplifyDemandedInstructionFPClass(Instruction &Inst);
612
613 /// Common transforms for add / disjoint or
614 Instruction *foldAddLikeCommutative(Value *LHS, Value *RHS, bool NSW,
615 bool NUW);
616
617 /// Canonicalize the position of binops relative to shufflevector.
618 Instruction *foldVectorBinop(BinaryOperator &Inst);
622 VectorType *NewCTy);
623
624 /// Given a binary operator, cast instruction, or select which has a PHI node
625 /// as operand #0, see if we can fold the instruction into the PHI (which is
626 /// only possible if all operands to the PHI are constants).
628 bool AllowMultipleUses = false);
629
630 /// Try to fold binary operators whose operands are simple interleaved
631 /// recurrences to a single recurrence. This is a common pattern in reduction
632 /// operations.
633 /// Example:
634 /// %phi1 = phi [init1, %BB1], [%op1, %BB2]
635 /// %phi2 = phi [init2, %BB1], [%op2, %BB2]
636 /// %op1 = binop %phi1, constant1
637 /// %op2 = binop %phi2, constant2
638 /// %rdx = binop %op1, %op2
639 /// -->
640 /// %phi_combined = phi [init_combined, %BB1], [%op_combined, %BB2]
641 /// %rdx_combined = binop %phi_combined, constant_combined
643
644 /// For a binary operator with 2 phi operands, try to hoist the binary
645 /// operation before the phi. This can result in fewer instructions in
646 /// patterns where at least one set of phi operands simplifies.
647 /// Example:
648 /// BB3: binop (phi [X, BB1], [C1, BB2]), (phi [Y, BB1], [C2, BB2])
649 /// -->
650 /// BB1: BO = binop X, Y
651 /// BB3: phi [BO, BB1], [(binop C1, C2), BB2]
653
654 /// Given an instruction with a select as one operand and a constant as the
655 /// other operand, try to fold the binary operator into the select arguments.
656 /// This also works for Cast instructions, which obviously do not have a
657 /// second operand.
659 bool FoldWithMultiUse = false,
660 bool SimplifyBothArms = false);
661
663
664 /// This is a convenience wrapper function for the above two functions.
666
668
671
672 /// Try to rotate an operation below a PHI node, using PHI nodes for
673 /// its operands.
682
683 /// If the phi is within a phi web, which is formed by the def-use chain
684 /// of phis and all the phis in the web are only used in the other phis.
685 /// In this case, these phis are dead and we will remove all of them.
686 bool foldDeadPhiWeb(PHINode &PN);
687
688 /// If an integer typed PHI has only one use which is an IntToPtr operation,
689 /// replace the PHI with an existing pointer typed PHI if it exists. Otherwise
690 /// insert a new pointer typed PHI and replace the original one.
692
693 /// Helper function for FoldPHIArgXIntoPHI() to set debug location for the
694 /// folded operation.
696
699 Instruction &I);
701 const ICmpInst &I);
702 bool foldAllocaCmp(AllocaInst *Alloca);
705 CmpInst &ICI,
706 ConstantInt *AndCst = nullptr);
708 Constant *RHSC);
712
721 const APInt &C);
724 Value *Z, CmpPredicate Pred);
730
732
734 const APInt &C);
736 ConstantInt *C);
738 const APInt &C);
740 const SimplifyQuery &Q);
742 const APInt &C);
744 const APInt &C);
746 const APInt &C);
748 const APInt &C);
750 const APInt &C);
752 const APInt &C);
754 const APInt &C);
756 const APInt &C);
758 const APInt &C);
760 const APInt &C);
762 const APInt &C);
764 const APInt &C1);
766 const APInt &C1, const APInt &C2);
768 const APInt &C);
770 const APInt &C2);
772 const APInt &C2);
773
775 BinaryOperator *BO,
776 const APInt &C);
778 BinaryOperator *BO,
779 const APInt &C);
781 const APInt &C);
783 const APInt &C);
787 ICmpInst &CxtI);
788
789 // Helpers of visitSelectInst().
798 Value *A, Value *B, Instruction &Outer,
802 Value *FalseVal);
805 unsigned Depth = 0);
806
807 Value *insertRangeTest(Value *V, const APInt &Lo, const APInt &Hi,
808 bool isSigned, bool Inside);
810
811 /// Given an initial instruction, check to see if it is the root of a
812 /// bswap/bitreverse idiom. If so, return the equivalent bswap/bitreverse
813 /// intrinsic.
815 bool MatchBitReversals);
816
819
820 Value *EvaluateInDifferentType(Value *V, Type *Ty, bool isSigned);
821
822 bool tryToSinkInstruction(Instruction *I, BasicBlock *DestBlock);
824 Instruction *I, BasicBlock::iterator InsertPos, BasicBlock *SrcBlock,
826
828 void addDeadEdge(BasicBlock *From, BasicBlock *To,
834 void freelyInvertAllUsersOf(Value *V, Value *IgnoredUser = nullptr);
835
836 /// Take the exact integer log2 of the value. If DoFold is true, create the
837 /// actual instructions, otherwise return a non-null dummy value. Return
838 /// nullptr on failure. Note, if DoFold is true the caller must ensure that
839 /// takeLog2 will succeed, otherwise it may create stray instructions.
840 Value *takeLog2(Value *Op, unsigned Depth, bool AssumeNonZero, bool DoFold);
841
842 Value *tryGetLog2(Value *Op, bool AssumeNonZero) {
843 if (takeLog2(Op, /*Depth=*/0, AssumeNonZero, /*DoFold=*/false))
844 return takeLog2(Op, /*Depth=*/0, AssumeNonZero, /*DoFold=*/true);
845 return nullptr;
846 }
847};
848
849class Negator final {
850 /// Top-to-bottom, def-to-use negated instruction tree we produced.
852
854 BuilderTy Builder;
855
856 const DominatorTree &DT;
857
858 const bool IsTrulyNegation;
859
860 SmallDenseMap<Value *, Value *> NegationsCache;
861
862 Negator(LLVMContext &C, const DataLayout &DL, const DominatorTree &DT,
863 bool IsTrulyNegation);
864
865#if LLVM_ENABLE_STATS
866 unsigned NumValuesVisitedInThisNegator = 0;
867 ~Negator();
868#endif
869
870 using Result = std::pair<ArrayRef<Instruction *> /*NewInstructions*/,
871 Value * /*NegatedRoot*/>;
872
873 std::array<Value *, 2> getSortedOperandsOfBinOp(Instruction *I);
874
875 [[nodiscard]] Value *visitImpl(Value *V, bool IsNSW, unsigned Depth);
876
877 [[nodiscard]] Value *negate(Value *V, bool IsNSW, unsigned Depth);
878
879 /// Recurse depth-first and attempt to sink the negation.
880 /// FIXME: use worklist?
881 [[nodiscard]] std::optional<Result> run(Value *Root, bool IsNSW);
882
883 Negator(const Negator &) = delete;
884 Negator(Negator &&) = delete;
885 Negator &operator=(const Negator &) = delete;
886 Negator &operator=(Negator &&) = delete;
887
888public:
889 /// Attempt to negate \p Root. Retuns nullptr if negation can't be performed,
890 /// otherwise returns negated value.
891 [[nodiscard]] static Value *Negate(bool LHSIsZero, bool IsNSW, Value *Root,
892 InstCombinerImpl &IC);
893};
894
896 /// Common base pointer.
897 Value *Ptr = nullptr;
898 /// LHS GEPs until common base.
900 /// RHS GEPs until common base.
902 /// LHS GEP NoWrapFlags until common base.
904 /// RHS GEP NoWrapFlags until common base.
906
908
909 /// Whether expanding the GEP chains is expensive.
910 bool isExpensive() const;
911};
912
913} // end namespace llvm
914
915#undef DEBUG_TYPE
916
917#endif // LLVM_LIB_TRANSFORMS_INSTCOMBINE_INSTCOMBINEINTERNAL_H
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
constexpr LLT S1
AMDGPU Register Bank Select
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static GCRegistry::Add< ShadowStackGC > C("shadow-stack", "Very portable GC for uncooperative code generators")
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static bool foldICmpWithDominatingICmp(CmpInst *Cmp, const TargetLowering &TLI)
For pattern like:
#define LLVM_LIBRARY_VISIBILITY
Definition Compiler.h:137
static bool willNotOverflow(BinaryOpIntrinsic *BO, LazyValueInfo *LVI)
#define DEBUG_TYPE
Hexagon Common GEP
IRTranslator LLVM IR MI
static constexpr unsigned NegatorMaxNodesSSO
static constexpr unsigned NegatorDefaultMaxDepth
This file provides the interface for the instcombine pass implementation.
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
uint64_t IntrinsicInst * II
StandardInstrumentations SI(Mod->getContext(), Debug, VerifyEach)
This file builds on the ADT/GraphTraits.h file to build a generic graph post order iterator.
This file contains the declarations for profiling metadata utility functions.
const SmallVectorImpl< MachineOperand > & Cond
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define LLVM_DEBUG(...)
Definition Debug.h:114
static TableGen::Emitter::Opt Y("gen-skeleton-entry", EmitSkeleton, "Generate example skeleton entry")
static TableGen::Emitter::OptClass< SkeletonEmitter > X("gen-skeleton-class", "Generate example skeleton class")
static OverflowResult computeOverflowForSignedAdd(const WithCache< const Value * > &LHS, const WithCache< const Value * > &RHS, const AddOperator *Add, const SimplifyQuery &SQ)
Value * RHS
Value * LHS
static const uint32_t IV[8]
Definition blake3_impl.h:83
Class for arbitrary precision integers.
Definition APInt.h:78
This class represents a conversion between pointers from one address space to another.
an instruction to allocate memory on the stack
This class represents any memset intrinsic.
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
A cache of @llvm.assume calls within a function.
an instruction that atomically reads a memory location, combines it with another value,...
LLVM Basic Block Representation.
Definition BasicBlock.h:62
InstListType::iterator iterator
Instruction iterators...
Definition BasicBlock.h:170
This class represents a no-op cast from one type to another.
BlockFrequencyInfo pass uses BlockFrequencyInfoImpl implementation to estimate IR basic block frequen...
Conditional or Unconditional Branch instruction.
Analysis providing branch probability information.
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
CallBr instruction, tracking function calls that may not return control but instead transfer it to a ...
This class represents a function call, abstracting a target machine's calling convention.
This is the base class for all instructions that perform data casts.
Definition InstrTypes.h:448
This class is the base class for the comparison instructions.
Definition InstrTypes.h:664
An abstraction over a floating-point predicate, and a pack of an integer predicate with samesign info...
This is the shared class of boolean and integer constants.
Definition Constants.h:87
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
This is an important base class in LLVM.
Definition Constant.h:43
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition Dominators.h:164
This instruction extracts a single (scalar) element from a VectorType value.
This instruction extracts a struct member or array element value from an aggregate value.
This instruction compares its operands according to the predicate given to the constructor.
This class represents a cast from floating point to signed integer.
This class represents a cast from floating point to unsigned integer.
This class represents a truncation of floating point types.
Convenience struct for specifying and reasoning about fast-math flags.
Definition FMF.h:23
An instruction for ordering other memory operations.
This class represents a freeze function that returns random concrete value if an operand is either a ...
Represents flags for the getelementptr instruction/expression.
static GEPNoWrapFlags all()
an instruction for type-safe pointer arithmetic to access elements of arrays and structs
This instruction compares its operands according to the predicate given to the constructor.
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition IRBuilder.h:2788
This instruction inserts a single (scalar) element into a VectorType value.
This instruction inserts a struct field of array element value into an aggregate value.
Instruction * visitMul(BinaryOperator &I)
Instruction * foldICmpShrConstant(ICmpInst &Cmp, BinaryOperator *Shr, const APInt &C)
Fold icmp ({al}shr X, Y), C.
Instruction * foldICmpWithZextOrSext(ICmpInst &ICmp)
Instruction * foldICmpSelectConstant(ICmpInst &Cmp, SelectInst *Select, ConstantInt *C)
Instruction * foldICmpSRemConstant(ICmpInst &Cmp, BinaryOperator *UDiv, const APInt &C)
Instruction * foldSelectToCmp(SelectInst &SI)
Instruction * visitAdd(BinaryOperator &I)
bool fmulByZeroIsZero(Value *MulVal, FastMathFlags FMF, const Instruction *CtxI) const
Check if fmul MulVal, +0.0 will yield +0.0 (or signed zero is ignorable).
Instruction * foldICmpBinOpWithConstant(ICmpInst &Cmp, BinaryOperator *BO, const APInt &C)
Fold an icmp with BinaryOp and constant operand: icmp Pred BO, C.
Instruction * foldICmpOrConstant(ICmpInst &Cmp, BinaryOperator *Or, const APInt &C)
Fold icmp (or X, Y), C.
Instruction * canonicalizeCondSignextOfHighBitExtractToSignextHighBitExtract(BinaryOperator &I)
Instruction * foldICmpTruncWithTruncOrExt(ICmpInst &Cmp, const SimplifyQuery &Q)
Fold icmp (trunc nuw/nsw X), (trunc nuw/nsw Y).
Instruction * visitLShr(BinaryOperator &I)
Instruction * foldBinOpIntoSelectOrPhi(BinaryOperator &I)
This is a convenience wrapper function for the above two functions.
Instruction * visitUDiv(BinaryOperator &I)
Instruction * visitOr(BinaryOperator &I)
Instruction * foldSignBitTest(ICmpInst &I)
Fold equality-comparison between zero and any (maybe truncated) right-shift by one-less-than-bitwidth...
Instruction * foldSelectEqualityTest(SelectInst &SI)
Instruction * visitZExt(ZExtInst &Zext)
Instruction * visitGEPOfGEP(GetElementPtrInst &GEP, GEPOperator *Src)
Instruction * foldSelectValueEquivalence(SelectInst &SI, CmpInst &CI)
Instruction * visitAddrSpaceCast(AddrSpaceCastInst &CI)
Instruction * foldPHIArgInsertValueInstructionIntoPHI(PHINode &PN)
If we have something like phi [insertvalue(a,b,0), insertvalue(c,d,0)], turn this into a phi[a,...
~InstCombinerImpl() override=default
Instruction * visitSExt(SExtInst &Sext)
Instruction * visitUnreachableInst(UnreachableInst &I)
Instruction * visitURem(BinaryOperator &I)
Instruction * foldSquareSumInt(BinaryOperator &I)
Instruction * foldOpIntoPhi(Instruction &I, PHINode *PN, bool AllowMultipleUses=false)
Given a binary operator, cast instruction, or select which has a PHI node as operand #0,...
InstCombinerImpl(InstructionWorklist &Worklist, BuilderTy &Builder, Function &F, AAResults *AA, AssumptionCache &AC, TargetLibraryInfo &TLI, TargetTransformInfo &TTI, DominatorTree &DT, OptimizationRemarkEmitter &ORE, BlockFrequencyInfo *BFI, BranchProbabilityInfo *BPI, ProfileSummaryInfo *PSI, const DataLayout &DL, ReversePostOrderTraversal< BasicBlock * > &RPOT)
Value * insertRangeTest(Value *V, const APInt &Lo, const APInt &Hi, bool isSigned, bool Inside)
Emit a computation of: (V >= Lo && V < Hi) if Inside is true, otherwise (V < Lo || V >= Hi).
void handleUnreachableFrom(Instruction *I, SmallVectorImpl< BasicBlock * > &Worklist)
Instruction * foldICmpBinOp(ICmpInst &Cmp, const SimplifyQuery &SQ)
Try to fold icmp (binop), X or icmp X, (binop).
Instruction * foldVectorSelect(SelectInst &Sel)
Instruction * foldCmpLoadFromIndexedGlobal(LoadInst *LI, GetElementPtrInst *GEP, CmpInst &ICI, ConstantInt *AndCst=nullptr)
This is called when we see this pattern: cmp pred (load (gep GV, ...)), cmpcst where GV is a global v...
Instruction * visitFreeze(FreezeInst &I)
Instruction * foldICmpSubConstant(ICmpInst &Cmp, BinaryOperator *Sub, const APInt &C)
Fold icmp (sub X, Y), C.
Instruction * foldSelectShuffle(ShuffleVectorInst &Shuf)
Try to fold shuffles that are the equivalent of a vector select.
Instruction * visitLoadInst(LoadInst &LI)
Value * takeLog2(Value *Op, unsigned Depth, bool AssumeNonZero, bool DoFold)
Take the exact integer log2 of the value.
Instruction * visitFPToSI(FPToSIInst &FI)
Instruction * foldICmpWithClamp(ICmpInst &Cmp, Value *X, MinMaxIntrinsic *Min)
Match and fold patterns like: icmp eq/ne X, min(max(X, Lo), Hi) which represents a range check and ca...
Instruction * foldICmpInstWithConstantNotInt(ICmpInst &Cmp)
Handle icmp with constant (but not simple integer constant) RHS.
Instruction * visitAtomicRMWInst(AtomicRMWInst &SI)
Instruction * visitSRem(BinaryOperator &I)
Instruction * foldSPFofSPF(Instruction *Inner, SelectPatternFlavor SPF1, Value *A, Value *B, Instruction &Outer, SelectPatternFlavor SPF2, Value *C)
Instruction * visitTrunc(TruncInst &CI)
Instruction * foldBinOpSelectBinOp(BinaryOperator &Op)
In some cases it is beneficial to fold a select into a binary operator.
Instruction * foldICmpShlConstConst(ICmpInst &I, Value *ShAmt, const APInt &C1, const APInt &C2)
Handle "(icmp eq/ne (shl AP2, A), AP1)" -> (icmp eq/ne A, TrailingZeros(AP1) - TrailingZeros(AP2)).
Instruction * foldSquareSumFP(BinaryOperator &I)
Value * reassociateShiftAmtsOfTwoSameDirectionShifts(BinaryOperator *Sh0, const SimplifyQuery &SQ, bool AnalyzeForSignBitExtraction=false)
Instruction * foldSelectOpOp(SelectInst &SI, Instruction *TI, Instruction *FI)
We have (select c, TI, FI), and we know that TI and FI have the same opcode.
Instruction * visitUIToFP(CastInst &CI)
Instruction * foldPHIArgBinOpIntoPHI(PHINode &PN)
If we have something like phi [add (a,b), add(a,c)] and if a/b/c and the adds all have a single user,...
void handlePotentiallyDeadBlocks(SmallVectorImpl< BasicBlock * > &Worklist)
bool sinkNotIntoLogicalOp(Instruction &I)
Instruction * foldICmpEqIntrinsicWithConstant(ICmpInst &ICI, IntrinsicInst *II, const APInt &C)
Fold an equality icmp with LLVM intrinsic and constant operand.
Instruction * visitPtrToInt(PtrToIntInst &CI)
bool prepareWorklist(Function &F)
Perform early cleanup and prepare the InstCombine worklist.
Instruction * foldSelectIntrinsic(SelectInst &SI)
This transforms patterns of the form: select cond, intrinsic(x, ...), intrinsic(y,...
std::optional< std::pair< Intrinsic::ID, SmallVector< Value *, 3 > > > convertOrOfShiftsToFunnelShift(Instruction &Or)
Instruction * visitFDiv(BinaryOperator &I)
Instruction * FoldOpIntoSelect(Instruction &Op, SelectInst *SI, bool FoldWithMultiUse=false, bool SimplifyBothArms=false)
Given an instruction with a select as one operand and a constant as the other operand,...
Instruction * SimplifyAnyMemSet(AnyMemSetInst *MI)
bool simplifyDivRemOfSelectWithZeroOp(BinaryOperator &I)
Fold a divide or remainder with a select instruction divisor when one of the select operands is zero.
Instruction * visitSIToFP(CastInst &CI)
Instruction * visitSub(BinaryOperator &I)
Instruction * visitAShr(BinaryOperator &I)
bool replaceInInstruction(Value *V, Value *Old, Value *New, unsigned Depth=0)
Instruction * visitFree(CallInst &FI, Value *FreedOp)
Instruction * visitInsertValueInst(InsertValueInst &IV)
Try to find redundant insertvalue instructions, like the following ones: %0 = insertvalue { i8,...
Instruction * visitAnd(BinaryOperator &I)
Value * foldMultiplicationOverflowCheck(ICmpInst &Cmp)
Fold (-1 u/ x) u< y ((x * y) ?
Instruction * visitCallBrInst(CallBrInst &CBI)
Instruction * visitExtractValueInst(ExtractValueInst &EV)
Instruction * visitInsertElementInst(InsertElementInst &IE)
void handlePotentiallyDeadSuccessors(BasicBlock *BB, BasicBlock *LiveSucc)
Instruction * visitUnconditionalBranchInst(BranchInst &BI)
Instruction * commonCastTransforms(CastInst &CI)
Implement the transforms common to all CastInst visitors.
Instruction * foldICmpWithConstant(ICmpInst &Cmp)
Fold icmp Pred X, C.
CmpInst * canonicalizeICmpPredicate(CmpInst &I)
If we have a comparison with a non-canonical predicate, if we can update all the users,...
Instruction * foldBinopWithRecurrence(BinaryOperator &BO)
Try to fold binary operators whose operands are simple interleaved recurrences to a single recurrence...
Instruction * eraseInstFromFunction(Instruction &I) override
Combiner aware instruction erasure.
Instruction * foldICmpWithZero(ICmpInst &Cmp)
Instruction * visitExtractElementInst(ExtractElementInst &EI)
Instruction * commonIDivRemTransforms(BinaryOperator &I)
Common integer divide/remainder transforms.
Value * foldReversedIntrinsicOperands(IntrinsicInst *II)
If all arguments of the intrinsic are reverses, try to pull the reverse after the intrinsic.
Instruction * visitPHINode(PHINode &PN)
Instruction * foldICmpCommutative(CmpPredicate Pred, Value *Op0, Value *Op1, ICmpInst &CxtI)
Instruction * foldICmpBinOpEqualityWithConstant(ICmpInst &Cmp, BinaryOperator *BO, const APInt &C)
Fold an icmp equality instruction with binary operator LHS and constant RHS: icmp eq/ne BO,...
Instruction * foldItoFPtoI(CastInst &FI)
fpto{s/u}i({u/s}itofp(X)) --> X or zext(X) or sext(X) or trunc(X) This is safe if the intermediate ty...
Instruction * foldPHIArgOpIntoPHI(PHINode &PN)
Try to rotate an operation below a PHI node, using PHI nodes for its operands.
Instruction * visitLandingPadInst(LandingPadInst &LI)
Instruction * foldICmpUsingBoolRange(ICmpInst &I)
If one operand of an icmp is effectively a bool (value range of {0,1}), then try to reduce patterns b...
Instruction * foldICmpWithTrunc(ICmpInst &Cmp)
Instruction * foldICmpIntrinsicWithConstant(ICmpInst &ICI, IntrinsicInst *II, const APInt &C)
Fold an icmp with LLVM intrinsic and constant operand: icmp Pred II, C.
Instruction * visitFPTrunc(FPTruncInst &CI)
Instruction * visitStoreInst(StoreInst &SI)
Value * tryGetLog2(Value *Op, bool AssumeNonZero)
Instruction * foldPHIArgZextsIntoPHI(PHINode &PN)
TODO: This function could handle other cast types, but then it might require special-casing a cast fr...
Instruction * foldSelectInstWithICmp(SelectInst &SI, ICmpInst *ICI)
Instruction * visitFenceInst(FenceInst &FI)
Value * foldPtrToIntOrAddrOfGEP(Type *IntTy, Value *Ptr)
Instruction * visitFCmpInst(FCmpInst &I)
Value * OptimizePointerDifference(Value *LHS, Value *RHS, Type *Ty, bool isNUW)
Optimize pointer differences into the same array into a size.
Instruction * visitBitCast(BitCastInst &CI)
Instruction * visitReturnInst(ReturnInst &RI)
bool sinkNotIntoOtherHandOfLogicalOp(Instruction &I)
Instruction * commonIDivTransforms(BinaryOperator &I)
This function implements the transforms common to both integer division instructions (udiv and sdiv).
Instruction * foldICmpUsingKnownBits(ICmpInst &Cmp)
Try to fold the comparison based on range information we can get by checking whether bits are known t...
Instruction * foldICmpDivConstant(ICmpInst &Cmp, BinaryOperator *Div, const APInt &C)
Fold icmp ({su}div X, Y), C.
Instruction * foldIRemByPowerOfTwoToBitTest(ICmpInst &I)
If we have: icmp eq/ne (urem/srem x, y), 0 iff y is a power-of-two, we can replace this with a bit te...
Instruction * foldFCmpIntToFPConst(FCmpInst &I, Instruction *LHSI, Constant *RHSC)
Fold fcmp ([us]itofp x, cst) if possible.
Instruction * visitShl(BinaryOperator &I)
Instruction * visitSwitchInst(SwitchInst &SI)
Instruction * foldICmpUDivConstant(ICmpInst &Cmp, BinaryOperator *UDiv, const APInt &C)
Fold icmp (udiv X, Y), C.
Instruction * visitFAdd(BinaryOperator &I)
Instruction * foldBinopWithPhiOperands(BinaryOperator &BO)
For a binary operator with 2 phi operands, try to hoist the binary operation before the phi.
Instruction * visitIntToPtr(IntToPtrInst &CI)
Instruction * foldICmpAddOpConst(Value *X, const APInt &C, CmpPredicate Pred)
Fold "icmp pred (X+C), X".
Instruction * foldICmpWithCastOp(ICmpInst &ICmp)
Handle icmp (cast x), (cast or constant).
Instruction * visitFPToUI(FPToUIInst &FI)
Instruction * foldICmpTruncConstant(ICmpInst &Cmp, TruncInst *Trunc, const APInt &C)
Fold icmp (trunc X), C.
bool mergeStoreIntoSuccessor(StoreInst &SI)
Try to transform: if () { *P = v1; } else { *P = v2 } or: *P = v1; if () { *P = v2; }...
Instruction * visitPtrToAddr(PtrToAddrInst &CI)
Instruction * visitInstruction(Instruction &I)
Specify what to return for unhandled instructions.
Instruction * foldSelectIntoOp(SelectInst &SI, Value *, Value *)
Try to fold the select into one of the operands to allow further optimization.
Instruction * foldShuffledIntrinsicOperands(IntrinsicInst *II)
If all arguments of the intrinsic are unary shuffles with the same mask, try to shuffle after the int...
Instruction * foldICmpAddConstant(ICmpInst &Cmp, BinaryOperator *Add, const APInt &C)
Fold icmp (add X, Y), C.
Instruction * foldICmpMulConstant(ICmpInst &Cmp, BinaryOperator *Mul, const APInt &C)
Fold icmp (mul X, Y), C.
Instruction * visitInvokeInst(InvokeInst &II)
Value * simplifyRangeCheck(ICmpInst *Cmp0, ICmpInst *Cmp1, bool Inverted)
Try to fold a signed range checked with lower bound 0 to an unsigned icmp.
Instruction * foldVariableSignZeroExtensionOfVariableHighBitExtract(BinaryOperator &OldAShr)
Instruction * commonShiftTransforms(BinaryOperator &I)
Instruction * visitFRem(BinaryOperator &I)
Instruction * foldPHIArgLoadIntoPHI(PHINode &PN)
Instruction * foldICmpXorConstant(ICmpInst &Cmp, BinaryOperator *Xor, const APInt &C)
Fold icmp (xor X, Y), C.
Instruction * FoldOrOfLogicalAnds(Value *Op0, Value *Op1)
Instruction * foldSelectICmp(CmpPredicate Pred, SelectInst *SI, Value *RHS, const ICmpInst &I)
bool foldIntegerTypedPHI(PHINode &PN)
If an integer typed PHI has only one use which is an IntToPtr operation, replace the PHI with an exis...
Instruction * foldICmpInstWithConstantAllowPoison(ICmpInst &Cmp, const APInt &C)
Try to fold integer comparisons with a constant operand: icmp Pred X, C where X is some kind of instr...
bool foldDeadPhiWeb(PHINode &PN)
If the phi is within a phi web, which is formed by the def-use chain of phis and all the phis in the ...
Instruction * foldIsMultipleOfAPowerOfTwo(ICmpInst &Cmp)
Fold icmp eq (num + mask) & ~mask, num to icmp eq (and num, mask), 0 Where mask is a low bit mask.
Instruction * visitXor(BinaryOperator &I)
Value * foldSelectWithConstOpToBinOp(ICmpInst *Cmp, Value *TrueVal, Value *FalseVal)
Value * EvaluateInDifferentType(Value *V, Type *Ty, bool isSigned)
Given an expression that CanEvaluateTruncated or CanEvaluateSExtd returns true for,...
Instruction * simplifyBinOpSplats(ShuffleVectorInst &SVI)
void CreateNonTerminatorUnreachable(Instruction *InsertAt)
Create and insert the idiom we use to indicate a block is unreachable without having to rewrite the C...
Instruction * foldICmpAndShift(ICmpInst &Cmp, BinaryOperator *And, const APInt &C1, const APInt &C2)
Fold icmp (and (sh X, Y), C2), C1.
Value * pushFreezeToPreventPoisonFromPropagating(FreezeInst &FI)
Instruction * foldICmpBinOpWithConstantViaTruthTable(ICmpInst &Cmp, BinaryOperator *BO, const APInt &C)
Instruction * foldICmpInstWithConstant(ICmpInst &Cmp)
Try to fold integer comparisons with a constant operand: icmp Pred X, C where X is some kind of instr...
Instruction * visitSelectInst(SelectInst &SI)
Instruction * foldICmpXorShiftConst(ICmpInst &Cmp, BinaryOperator *Xor, const APInt &C)
For power-of-2 C: ((X s>> ShiftC) ^ X) u< C --> (X + C) u< (C << 1) ((X s>> ShiftC) ^ X) u> (C - 1) -...
Instruction * foldPHIArgIntToPtrToPHI(PHINode &PN)
Instruction * visitFPExt(CastInst &CI)
Instruction * foldICmpShlConstant(ICmpInst &Cmp, BinaryOperator *Shl, const APInt &C)
Fold icmp (shl X, Y), C.
Instruction * visitFMul(BinaryOperator &I)
Instruction * foldSelectOfBools(SelectInst &SI)
Instruction * foldSelectExtConst(SelectInst &Sel)
Instruction * foldAddWithConstant(BinaryOperator &Add)
Instruction * foldICmpAndConstant(ICmpInst &Cmp, BinaryOperator *And, const APInt &C)
Fold icmp (and X, Y), C.
bool run()
Run the combiner over the entire worklist until it is empty.
Instruction * foldFMulReassoc(BinaryOperator &I)
Instruction * SliceUpIllegalIntegerPHI(PHINode &PN)
This is an integer PHI and we know that it has an illegal type: see if it is only used by trunc or tr...
Instruction * foldAggregateConstructionIntoAggregateReuse(InsertValueInst &OrigIVI)
Look for chain of insertvalue's that fully define an aggregate, and trace back the values inserted,...
Instruction * foldICmpEquality(ICmpInst &Cmp)
bool removeInstructionsBeforeUnreachable(Instruction &I)
Instruction * foldPHIArgGEPIntoPHI(PHINode &PN)
Instruction * foldICmpWithMinMax(Instruction &I, MinMaxIntrinsic *MinMax, Value *Z, CmpPredicate Pred)
Fold icmp Pred min|max(X, Y), Z.
Instruction * visitShuffleVectorInst(ShuffleVectorInst &SVI)
Instruction * FoldShiftByConstant(Value *Op0, Constant *Op1, BinaryOperator &I)
void tryToSinkInstructionDbgVariableRecords(Instruction *I, BasicBlock::iterator InsertPos, BasicBlock *SrcBlock, BasicBlock *DestBlock, SmallVectorImpl< DbgVariableRecord * > &DPUsers)
bool foldAllocaCmp(AllocaInst *Alloca)
void addDeadEdge(BasicBlock *From, BasicBlock *To, SmallVectorImpl< BasicBlock * > &Worklist)
void PHIArgMergedDebugLoc(Instruction *Inst, PHINode &PN)
Helper function for FoldPHIArgXIntoPHI() to set debug location for the folded operation.
Instruction * visitVAEndInst(VAEndInst &I)
Instruction * matchBSwapOrBitReverse(Instruction &I, bool MatchBSwaps, bool MatchBitReversals)
Given an initial instruction, check to see if it is the root of a bswap/bitreverse idiom.
Constant * unshuffleConstant(ArrayRef< int > ShMask, Constant *C, VectorType *NewCTy)
Find a constant NewC that has property: shuffle(NewC, ShMask) = C Returns nullptr if such a constant ...
Instruction * visitAllocSite(Instruction &FI)
Instruction * visitICmpInst(ICmpInst &I)
Instruction * SimplifyAnyMemTransfer(AnyMemTransferInst *MI)
Instruction * visitGetElementPtrInst(GetElementPtrInst &GEP)
Instruction * visitBranchInst(BranchInst &BI)
Instruction * foldPowiReassoc(BinaryOperator &I)
Instruction * foldFreezeIntoRecurrence(FreezeInst &I, PHINode *PN)
Instruction * visitSDiv(BinaryOperator &I)
bool tryToSinkInstruction(Instruction *I, BasicBlock *DestBlock)
Try to move the specified instruction from its current block into the beginning of DestBlock,...
Instruction * foldPHIArgExtractValueInstructionIntoPHI(PHINode &PN)
If we have something like phi [extractvalue(a,0), extractvalue(b,0)], turn this into a phi[a,...
Instruction * foldICmpShrConstConst(ICmpInst &I, Value *ShAmt, const APInt &C1, const APInt &C2)
Handle "(icmp eq/ne (ashr/lshr AP2, A), AP1)" -> (icmp eq/ne A, Log2(AP2/AP1)) -> (icmp eq/ne A,...
bool freezeOtherUses(FreezeInst &FI)
Instruction * visitFNeg(UnaryOperator &I)
void freelyInvertAllUsersOf(Value *V, Value *IgnoredUser=nullptr)
Freely adapt every user of V as-if V was changed to !V.
Instruction * commonIRemTransforms(BinaryOperator &I)
This function implements the transforms common to both integer remainder instructions (urem and srem)...
Instruction * visitAllocaInst(AllocaInst &AI)
Instruction * visitCallInst(CallInst &CI)
CallInst simplification.
Instruction * foldICmpAndConstConst(ICmpInst &Cmp, BinaryOperator *And, const APInt &C1)
Fold icmp (and X, C2), C1.
Instruction * visitFSub(BinaryOperator &I)
Instruction * foldICmpBitCast(ICmpInst &Cmp)
Instruction * foldGEPICmp(GEPOperator *GEPLHS, Value *RHS, CmpPredicate Cond, Instruction &I)
Fold comparisons between a GEP instruction and something else.
SimplifyQuery SQ
IRBuilder< TargetFolder, IRBuilderCallbackInserter > BuilderTy
An IRBuilder that automatically inserts new instructions into the worklist.
BlockFrequencyInfo * BFI
TargetLibraryInfo & TLI
InstructionWorklist & Worklist
A worklist of the instructions that need to be simplified.
Instruction * InsertNewInstWith(Instruction *New, BasicBlock::iterator Old)
Same as InsertNewInstBefore, but also sets the debug loc.
BranchProbabilityInfo * BPI
virtual bool SimplifyDemandedBits(Instruction *I, unsigned OpNo, const APInt &DemandedMask, KnownBits &Known, const SimplifyQuery &Q, unsigned Depth=0)=0
ReversePostOrderTraversal< BasicBlock * > & RPOT
const DataLayout & DL
DomConditionCache DC
AssumptionCache & AC
DominatorTree & DT
ProfileSummaryInfo * PSI
BuilderTy & Builder
OptimizationRemarkEmitter & ORE
InstCombiner(InstructionWorklist &Worklist, BuilderTy &Builder, Function &F, AAResults *AA, AssumptionCache &AC, TargetLibraryInfo &TLI, TargetTransformInfo &TTI, DominatorTree &DT, OptimizationRemarkEmitter &ORE, BlockFrequencyInfo *BFI, BranchProbabilityInfo *BPI, ProfileSummaryInfo *PSI, const DataLayout &DL, ReversePostOrderTraversal< BasicBlock * > &RPOT)
Base class for instruction visitors.
Definition InstVisitor.h:78
InstructionWorklist - This is the worklist management logic for InstCombine and other simplification ...
This class represents a cast from an integer to a pointer.
A wrapper class for inspecting calls to intrinsic functions.
Invoke instruction.
This is an important class for using LLVM in a threaded context.
Definition LLVMContext.h:68
The landingpad instruction holds all of the information necessary to generate correct exception handl...
An instruction for reading from memory.
This class represents min/max intrinsics.
static Value * Negate(bool LHSIsZero, bool IsNSW, Value *Root, InstCombinerImpl &IC)
Attempt to negate Root.
The optimization diagnostic interface.
static PointerType * getUnqual(Type *ElementType)
This constructs a pointer to an object of the specified type in the default address space (address sp...
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
Analysis providing profile information.
This class represents a cast from a pointer to an address (non-capturing ptrtoint).
This class represents a cast from a pointer to an integer.
Return a value (possibly void), from a function.
This class represents a sign extension of integer types.
This class represents the LLVM 'select' instruction.
This instruction constructs a fixed permutation of two input vectors.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
An instruction for storing to memory.
Multiway switch.
Provides information about what library functions are available for the current target.
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
This class represents a truncation of integer types.
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition Twine.h:82
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45
This function has undefined behavior.
This represents the llvm.va_end intrinsic.
LLVM Value Representation.
Definition Value.h:75
LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.h:259
Base class of all SIMD vector types.
This class represents zero extension of integer types.
self_iterator getIterator()
Definition ilist_node.h:123
CallInst * Call
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
friend class Instruction
Iterator for Instructions in a `BasicBlock.
Definition BasicBlock.h:73
This is an optimization pass for GlobalISel generic memory operations.
Definition Types.h:26
@ NeverOverflows
Never overflows.
LLVM_ABI void setExplicitlyUnknownBranchWeightsIfProfiled(Instruction &I, StringRef PassName, const Function *F=nullptr)
Like setExplicitlyUnknownBranchWeights(...), but only sets unknown branch weights in the new instruct...
LLVM_ABI void salvageDebugInfo(const MachineRegisterInfo &MRI, MachineInstr &MI)
Assuming the instruction MI is going to be deleted, attempt to salvage debug users of MI by writing t...
Definition Utils.cpp:1726
LLVM_ABI OverflowResult computeOverflowForUnsignedMul(const Value *LHS, const Value *RHS, const SimplifyQuery &SQ, bool IsNSW=false)
LLVM_ABI OverflowResult computeOverflowForSignedSub(const Value *LHS, const Value *RHS, const SimplifyQuery &SQ)
SelectPatternFlavor
Specific patterns of select instructions we can match.
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:207
LLVM_ABI OverflowResult computeOverflowForSignedMul(const Value *LHS, const Value *RHS, const SimplifyQuery &SQ)
TargetTransformInfo TTI
@ Mul
Product of integers.
@ Xor
Bitwise or logical XOR of integers.
@ Sub
Subtraction of integers.
@ Add
Sum of integers.
DWARFExpression::Operation Op
constexpr unsigned BitWidth
LLVM_ABI OverflowResult computeOverflowForUnsignedSub(const Value *LHS, const Value *RHS, const SimplifyQuery &SQ)
LLVM_ABI OverflowResult computeOverflowForUnsignedAdd(const WithCache< const Value * > &LHS, const WithCache< const Value * > &RHS, const SimplifyQuery &SQ)
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
Value * Ptr
Common base pointer.
SmallVector< GEPOperator * > RHSGEPs
RHS GEPs until common base.
GEPNoWrapFlags LHSNW
LHS GEP NoWrapFlags until common base.
GEPNoWrapFlags RHSNW
RHS GEP NoWrapFlags until common base.
SmallVector< GEPOperator * > LHSGEPs
LHS GEPs until common base.
bool isExpensive() const
Whether expanding the GEP chains is expensive.
static CommonPointerBase compute(Value *LHS, Value *RHS)
Matching combinators.