LLVM 22.0.0git
InstCombineInternal.h
Go to the documentation of this file.
1//===- InstCombineInternal.h - InstCombine pass internals -------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9/// \file
10///
11/// This file provides internal interfaces used to implement the InstCombine.
12//
13//===----------------------------------------------------------------------===//
14
15#ifndef LLVM_LIB_TRANSFORMS_INSTCOMBINE_INSTCOMBINEINTERNAL_H
16#define LLVM_LIB_TRANSFORMS_INSTCOMBINE_INSTCOMBINEINTERNAL_H
17
19#include "llvm/ADT/Statistic.h"
23#include "llvm/IR/IRBuilder.h"
24#include "llvm/IR/InstVisitor.h"
27#include "llvm/IR/Value.h"
28#include "llvm/Support/Debug.h"
33#include <cassert>
34
35#define DEBUG_TYPE "instcombine"
37
38// As a default, let's assume that we want to be aggressive,
39// and attempt to traverse with no limits in attempt to sink negation.
40static constexpr unsigned NegatorDefaultMaxDepth = ~0U;
41
42// Let's guesstimate that most often we will end up visiting/producing
43// fairly small number of new instructions.
44static constexpr unsigned NegatorMaxNodesSSO = 16;
45
46namespace llvm {
47
48class AAResults;
49class APInt;
50class AssumptionCache;
51class BlockFrequencyInfo;
52class DataLayout;
53class DominatorTree;
54class GEPOperator;
55class GlobalVariable;
56class OptimizationRemarkEmitter;
57class ProfileSummaryInfo;
58class TargetLibraryInfo;
59class User;
60
62 : public InstCombiner,
63 public InstVisitor<InstCombinerImpl, Instruction *> {
64public:
74
75 virtual ~InstCombinerImpl() = default;
76
77 /// Perform early cleanup and prepare the InstCombine worklist.
79
80 /// Run the combiner over the entire worklist until it is empty.
81 ///
82 /// \returns true if the IR is changed.
83 bool run();
84
85 // Visitation implementation - Implement instruction combining for different
86 // instruction types. The semantics are as follows:
87 // Return Value:
88 // null - No change was made
89 // I - Change was made, I is still valid, I may be dead though
90 // otherwise - Change was made, replace I with returned instruction
91 //
96 Value *LHS, Value *RHS, Type *Ty, bool isNUW);
113 Value *simplifyRangeCheck(ICmpInst *Cmp0, ICmpInst *Cmp1, bool Inverted);
121 BinaryOperator *Sh0, const SimplifyQuery &SQ,
122 bool AnalyzeForSignBitExtraction = false);
126 BinaryOperator &OldAShr);
157
164 Instruction *visitFree(CallInst &FI, Value *FreedOp);
185 bool freezeOtherUses(FreezeInst &FI);
188
189 /// Specify what to return for unhandled instructions.
191
192 /// True when DB dominates all uses of DI except UI.
193 /// UI must be in the same block as DI.
194 /// The routine checks that the DI parent and DB are different.
195 bool dominatesAllUses(const Instruction *DI, const Instruction *UI,
196 const BasicBlock *DB) const;
197
198 /// Try to replace select with select operand SIOpd in SI-ICmp sequence.
199 bool replacedSelectWithOperand(SelectInst *SI, const ICmpInst *Icmp,
200 const unsigned SIOpd);
201
202 LoadInst *combineLoadToNewType(LoadInst &LI, Type *NewTy,
203 const Twine &Suffix = "");
204
206 FPClassTest Interested = fcAllFlags,
207 const Instruction *CtxI = nullptr,
208 unsigned Depth = 0) const {
210 Val, FMF, Interested, getSimplifyQuery().getWithInstruction(CtxI),
211 Depth);
212 }
213
215 FPClassTest Interested = fcAllFlags,
216 const Instruction *CtxI = nullptr,
217 unsigned Depth = 0) const {
219 Val, Interested, getSimplifyQuery().getWithInstruction(CtxI), Depth);
220 }
221
222 /// Check if fmul \p MulVal, +0.0 will yield +0.0 (or signed zero is
223 /// ignorable).
225 const Instruction *CtxI) const;
226
227 std::optional<std::pair<Intrinsic::ID, SmallVector<Value *, 3>>>
229
230private:
231 bool annotateAnyAllocSite(CallBase &Call, const TargetLibraryInfo *TLI);
232 bool isDesirableIntType(unsigned BitWidth) const;
233 bool shouldChangeType(unsigned FromBitWidth, unsigned ToBitWidth) const;
234 bool shouldChangeType(Type *From, Type *To) const;
235 Value *dyn_castNegVal(Value *V) const;
236
237 /// Classify whether a cast is worth optimizing.
238 ///
239 /// This is a helper to decide whether the simplification of
240 /// logic(cast(A), cast(B)) to cast(logic(A, B)) should be performed.
241 ///
242 /// \param CI The cast we are interested in.
243 ///
244 /// \return true if this cast actually results in any code being generated and
245 /// if it cannot already be eliminated by some other transformation.
246 bool shouldOptimizeCast(CastInst *CI);
247
248 /// Try to optimize a sequence of instructions checking if an operation
249 /// on LHS and RHS overflows.
250 ///
251 /// If this overflow check is done via one of the overflow check intrinsics,
252 /// then CtxI has to be the call instruction calling that intrinsic. If this
253 /// overflow check is done by arithmetic followed by a compare, then CtxI has
254 /// to be the arithmetic instruction.
255 ///
256 /// If a simplification is possible, stores the simplified result of the
257 /// operation in OperationResult and result of the overflow check in
258 /// OverflowResult, and return true. If no simplification is possible,
259 /// returns false.
260 bool OptimizeOverflowCheck(Instruction::BinaryOps BinaryOp, bool IsSigned,
261 Value *LHS, Value *RHS,
262 Instruction &CtxI, Value *&OperationResult,
264
265 Instruction *visitCallBase(CallBase &Call);
266 Instruction *tryOptimizeCall(CallInst *CI);
267 bool transformConstExprCastCall(CallBase &Call);
268 Instruction *transformCallThroughTrampoline(CallBase &Call,
269 IntrinsicInst &Tramp);
270
271 /// Try to optimize a call to the result of a ptrauth intrinsic, potentially
272 /// into the ptrauth call bundle:
273 /// - call(ptrauth.resign(p)), ["ptrauth"()] -> call p, ["ptrauth"()]
274 /// - call(ptrauth.sign(p)), ["ptrauth"()] -> call p
275 /// as long as the key/discriminator are the same in sign and auth-bundle,
276 /// and we don't change the key in the bundle (to a potentially-invalid key.)
277 Instruction *foldPtrAuthIntrinsicCallee(CallBase &Call);
278
279 /// Try to optimize a call to a ptrauth constant, into its ptrauth bundle:
280 /// call(ptrauth(f)), ["ptrauth"()] -> call f
281 /// as long as the key/discriminator are the same in constant and bundle.
282 Instruction *foldPtrAuthConstantCallee(CallBase &Call);
283
284 // Return (a, b) if (LHS, RHS) is known to be (a, b) or (b, a).
285 // Otherwise, return std::nullopt
286 // Currently it matches:
287 // - LHS = (select c, a, b), RHS = (select c, b, a)
288 // - LHS = (phi [a, BB0], [b, BB1]), RHS = (phi [b, BB0], [a, BB1])
289 // - LHS = min(a, b), RHS = max(a, b)
290 std::optional<std::pair<Value *, Value *>> matchSymmetricPair(Value *LHS,
291 Value *RHS);
292
293 Value *simplifyMaskedLoad(IntrinsicInst &II);
294 Instruction *simplifyMaskedStore(IntrinsicInst &II);
295 Instruction *simplifyMaskedGather(IntrinsicInst &II);
296 Instruction *simplifyMaskedScatter(IntrinsicInst &II);
297
298 /// Transform (zext icmp) to bitwise / integer operations in order to
299 /// eliminate it.
300 ///
301 /// \param ICI The icmp of the (zext icmp) pair we are interested in.
302 /// \parem CI The zext of the (zext icmp) pair we are interested in.
303 ///
304 /// \return null if the transformation cannot be performed. If the
305 /// transformation can be performed the new instruction that replaces the
306 /// (zext icmp) pair will be returned.
307 Instruction *transformZExtICmp(ICmpInst *Cmp, ZExtInst &Zext);
308
309 Instruction *transformSExtICmp(ICmpInst *Cmp, SExtInst &Sext);
310
311 bool willNotOverflowSignedAdd(const WithCache<const Value *> &LHS,
313 const Instruction &CxtI) const {
314 return computeOverflowForSignedAdd(LHS, RHS, &CxtI) ==
316 }
317
318 bool willNotOverflowUnsignedAdd(const WithCache<const Value *> &LHS,
320 const Instruction &CxtI) const {
321 return computeOverflowForUnsignedAdd(LHS, RHS, &CxtI) ==
323 }
324
325 bool willNotOverflowAdd(const Value *LHS, const Value *RHS,
326 const Instruction &CxtI, bool IsSigned) const {
327 return IsSigned ? willNotOverflowSignedAdd(LHS, RHS, CxtI)
328 : willNotOverflowUnsignedAdd(LHS, RHS, CxtI);
329 }
330
331 bool willNotOverflowSignedSub(const Value *LHS, const Value *RHS,
332 const Instruction &CxtI) const {
333 return computeOverflowForSignedSub(LHS, RHS, &CxtI) ==
334 OverflowResult::NeverOverflows;
335 }
336
337 bool willNotOverflowUnsignedSub(const Value *LHS, const Value *RHS,
338 const Instruction &CxtI) const {
339 return computeOverflowForUnsignedSub(LHS, RHS, &CxtI) ==
340 OverflowResult::NeverOverflows;
341 }
342
343 bool willNotOverflowSub(const Value *LHS, const Value *RHS,
344 const Instruction &CxtI, bool IsSigned) const {
345 return IsSigned ? willNotOverflowSignedSub(LHS, RHS, CxtI)
346 : willNotOverflowUnsignedSub(LHS, RHS, CxtI);
347 }
348
349 bool willNotOverflowSignedMul(const Value *LHS, const Value *RHS,
350 const Instruction &CxtI) const {
351 return computeOverflowForSignedMul(LHS, RHS, &CxtI) ==
352 OverflowResult::NeverOverflows;
353 }
354
355 bool willNotOverflowUnsignedMul(const Value *LHS, const Value *RHS,
356 const Instruction &CxtI,
357 bool IsNSW = false) const {
358 return computeOverflowForUnsignedMul(LHS, RHS, &CxtI, IsNSW) ==
359 OverflowResult::NeverOverflows;
360 }
361
362 bool willNotOverflowMul(const Value *LHS, const Value *RHS,
363 const Instruction &CxtI, bool IsSigned) const {
364 return IsSigned ? willNotOverflowSignedMul(LHS, RHS, CxtI)
365 : willNotOverflowUnsignedMul(LHS, RHS, CxtI);
366 }
367
368 bool willNotOverflow(BinaryOperator::BinaryOps Opcode, const Value *LHS,
369 const Value *RHS, const Instruction &CxtI,
370 bool IsSigned) const {
371 switch (Opcode) {
372 case Instruction::Add: return willNotOverflowAdd(LHS, RHS, CxtI, IsSigned);
373 case Instruction::Sub: return willNotOverflowSub(LHS, RHS, CxtI, IsSigned);
374 case Instruction::Mul: return willNotOverflowMul(LHS, RHS, CxtI, IsSigned);
375 default: llvm_unreachable("Unexpected opcode for overflow query");
376 }
377 }
378
379 Value *EmitGEPOffset(GEPOperator *GEP, bool RewriteGEP = false);
380 /// Emit sum of multiple GEP offsets. The GEPs are processed in reverse
381 /// order.
382 Value *EmitGEPOffsets(ArrayRef<GEPOperator *> GEPs, GEPNoWrapFlags NW,
383 Type *IdxTy, bool RewriteGEPs);
384 Instruction *scalarizePHI(ExtractElementInst &EI, PHINode *PN);
385 Instruction *foldBitcastExtElt(ExtractElementInst &ExtElt);
386 Instruction *foldCastedBitwiseLogic(BinaryOperator &I);
387 Instruction *foldFBinOpOfIntCasts(BinaryOperator &I);
388 // Should only be called by `foldFBinOpOfIntCasts`.
389 Instruction *foldFBinOpOfIntCastsFromSign(
390 BinaryOperator &BO, bool OpsFromSigned, std::array<Value *, 2> IntOps,
391 Constant *Op1FpC, SmallVectorImpl<WithCache<const Value *>> &OpsKnown);
392 Instruction *foldBinopOfSextBoolToSelect(BinaryOperator &I);
393 Instruction *narrowBinOp(TruncInst &Trunc);
394 Instruction *narrowMaskedBinOp(BinaryOperator &And);
395 Instruction *narrowMathIfNoOverflow(BinaryOperator &I);
396 Instruction *narrowFunnelShift(TruncInst &Trunc);
397 Instruction *optimizeBitCastFromPhi(CastInst &CI, PHINode *PN);
398 Instruction *matchSAddSubSat(IntrinsicInst &MinMax1);
399 Instruction *foldNot(BinaryOperator &I);
400 Instruction *foldBinOpOfDisplacedShifts(BinaryOperator &I);
401
402 /// Determine if a pair of casts can be replaced by a single cast.
403 ///
404 /// \param CI1 The first of a pair of casts.
405 /// \param CI2 The second of a pair of casts.
406 ///
407 /// \return 0 if the cast pair cannot be eliminated, otherwise returns an
408 /// Instruction::CastOps value for a cast that can replace the pair, casting
409 /// CI1->getSrcTy() to CI2->getDstTy().
410 ///
411 /// \see CastInst::isEliminableCastPair
412 Instruction::CastOps isEliminableCastPair(const CastInst *CI1,
413 const CastInst *CI2);
414 Value *simplifyIntToPtrRoundTripCast(Value *Val);
415
416 Value *foldAndOrOfICmps(ICmpInst *LHS, ICmpInst *RHS, Instruction &I,
417 bool IsAnd, bool IsLogical = false);
418 Value *foldXorOfICmps(ICmpInst *LHS, ICmpInst *RHS, BinaryOperator &Xor);
419
420 Value *foldEqOfParts(Value *Cmp0, Value *Cmp1, bool IsAnd);
421
422 Value *foldAndOrOfICmpsUsingRanges(ICmpInst *ICmp1, ICmpInst *ICmp2,
423 bool IsAnd);
424
425 /// Optimize (fcmp)&(fcmp) or (fcmp)|(fcmp).
426 /// NOTE: Unlike most of instcombine, this returns a Value which should
427 /// already be inserted into the function.
428 Value *foldLogicOfFCmps(FCmpInst *LHS, FCmpInst *RHS, bool IsAnd,
429 bool IsLogicalSelect = false);
430
431 Instruction *foldLogicOfIsFPClass(BinaryOperator &Operator, Value *LHS,
432 Value *RHS);
433
434 Value *foldBooleanAndOr(Value *LHS, Value *RHS, Instruction &I, bool IsAnd,
435 bool IsLogical);
436
437 Value *reassociateBooleanAndOr(Value *LHS, Value *X, Value *Y, Instruction &I,
438 bool IsAnd, bool RHSIsLogical);
439
440 Value *foldDisjointOr(Value *LHS, Value *RHS);
441
442 Value *reassociateDisjointOr(Value *LHS, Value *RHS);
443
445 canonicalizeConditionalNegationViaMathToSelect(BinaryOperator &i);
446
447 Value *matchSelectFromAndOr(Value *A, Value *B, Value *C, Value *D,
448 bool InvertFalseVal = false);
449 Value *getSelectCondition(Value *A, Value *B, bool ABIsTheSame);
450
451 Instruction *foldLShrOverflowBit(BinaryOperator &I);
452 Instruction *foldExtractOfOverflowIntrinsic(ExtractValueInst &EV);
453 Instruction *foldIntrinsicWithOverflowCommon(IntrinsicInst *II);
454 Instruction *foldIntrinsicIsFPClass(IntrinsicInst &II);
455 Instruction *foldFPSignBitOps(BinaryOperator &I);
456 Instruction *foldFDivConstantDivisor(BinaryOperator &I);
457
458 // Optimize one of these forms:
459 // and i1 Op, SI / select i1 Op, i1 SI, i1 false (if IsAnd = true)
460 // or i1 Op, SI / select i1 Op, i1 true, i1 SI (if IsAnd = false)
461 // into simplier select instruction using isImpliedCondition.
462 Instruction *foldAndOrOfSelectUsingImpliedCond(Value *Op, SelectInst &SI,
463 bool IsAnd);
464
465 Instruction *hoistFNegAboveFMulFDiv(Value *FNegOp, Instruction &FMFSource);
466
467 /// Simplify \p V given that it is known to be non-null.
468 /// Returns the simplified value if possible, otherwise returns nullptr.
469 /// If \p HasDereferenceable is true, the simplification will not perform
470 /// same object checks.
471 Value *simplifyNonNullOperand(Value *V, bool HasDereferenceable,
472 unsigned Depth = 0);
473
474public:
475 /// Create `select C, S1, S2`. Use only when the profile cannot be calculated
476 /// from existing profile metadata: if the Function has profiles, this will
477 /// set the profile of this select to "unknown".
478 SelectInst *
480 const Twine &NameStr = "",
481 InsertPosition InsertBefore = nullptr) {
482 auto *Sel = SelectInst::Create(C, S1, S2, NameStr, InsertBefore, nullptr);
484 return Sel;
485 }
486
487 /// Create and insert the idiom we use to indicate a block is unreachable
488 /// without having to rewrite the CFG from within InstCombine.
490 auto &Ctx = InsertAt->getContext();
491 auto *SI = new StoreInst(ConstantInt::getTrue(Ctx),
493 /*isVolatile*/ false, Align(1));
494 InsertNewInstWith(SI, InsertAt->getIterator());
495 }
496
497 /// Combiner aware instruction erasure.
498 ///
499 /// When dealing with an instruction that has side effects or produces a void
500 /// value, we can't rely on DCE to delete the instruction. Instead, visit
501 /// methods should return the value returned by this function.
503 LLVM_DEBUG(dbgs() << "IC: ERASE " << I << '\n');
504 assert(I.use_empty() && "Cannot erase instruction that is used!");
506
507 // Make sure that we reprocess all operands now that we reduced their
508 // use counts.
509 SmallVector<Value *> Ops(I.operands());
510 Worklist.remove(&I);
511 DC.removeValue(&I);
512 I.eraseFromParent();
513 for (Value *Op : Ops)
514 Worklist.handleUseCountDecrement(Op);
515 MadeIRChange = true;
516 return nullptr; // Don't do anything with FI
517 }
518
519 OverflowResult computeOverflow(
520 Instruction::BinaryOps BinaryOp, bool IsSigned,
521 Value *LHS, Value *RHS, Instruction *CxtI) const;
522
523 /// Performs a few simplifications for operators which are associative
524 /// or commutative.
525 bool SimplifyAssociativeOrCommutative(BinaryOperator &I);
526
527 /// Tries to simplify binary operations which some other binary
528 /// operation distributes over.
529 ///
530 /// It does this by either by factorizing out common terms (eg "(A*B)+(A*C)"
531 /// -> "A*(B+C)") or expanding out if this results in simplifications (eg: "A
532 /// & (B | C) -> (A&B) | (A&C)" if this is a win). Returns the simplified
533 /// value, or null if it didn't simplify.
534 Value *foldUsingDistributiveLaws(BinaryOperator &I);
535
536 /// Tries to simplify add operations using the definition of remainder.
537 ///
538 /// The definition of remainder is X % C = X - (X / C ) * C. The add
539 /// expression X % C0 + (( X / C0 ) % C1) * C0 can be simplified to
540 /// X % (C0 * C1)
541 Value *SimplifyAddWithRemainder(BinaryOperator &I);
542
543 // Binary Op helper for select operations where the expression can be
544 // efficiently reorganized.
545 Value *SimplifySelectsFeedingBinaryOp(BinaryOperator &I, Value *LHS,
546 Value *RHS);
547
548 // If `I` has operand `(ctpop (not x))`, fold `I` with `(sub nuw nsw
549 // BitWidth(x), (ctpop x))`.
550 Instruction *tryFoldInstWithCtpopWithNot(Instruction *I);
551
552 // (Binop1 (Binop2 (logic_shift X, C), C1), (logic_shift Y, C))
553 // -> (logic_shift (Binop1 (Binop2 X, inv_logic_shift(C1, C)), Y), C)
554 // (Binop1 (Binop2 (logic_shift X, Amt), Mask), (logic_shift Y, Amt))
555 // -> (BinOp (logic_shift (BinOp X, Y)), Mask)
556 Instruction *foldBinOpShiftWithShift(BinaryOperator &I);
557
558 /// Tries to simplify binops of select and cast of the select condition.
559 ///
560 /// (Binop (cast C), (select C, T, F))
561 /// -> (select C, C0, C1)
562 Instruction *foldBinOpOfSelectAndCastOfSelectCondition(BinaryOperator &I);
563
564 /// This tries to simplify binary operations by factorizing out common terms
565 /// (e. g. "(A*B)+(A*C)" -> "A*(B+C)").
566 Value *tryFactorizationFolds(BinaryOperator &I);
567
568 /// Match a select chain which produces one of three values based on whether
569 /// the LHS is less than, equal to, or greater than RHS respectively.
570 /// Return true if we matched a three way compare idiom. The LHS, RHS, Less,
571 /// Equal and Greater values are saved in the matching process and returned to
572 /// the caller.
573 bool matchThreeWayIntCompare(SelectInst *SI, Value *&LHS, Value *&RHS,
574 ConstantInt *&Less, ConstantInt *&Equal,
575 ConstantInt *&Greater);
576
577 /// Attempts to replace I with a simpler value based on the demanded
578 /// bits.
579 Value *SimplifyDemandedUseBits(Instruction *I, const APInt &DemandedMask,
580 KnownBits &Known, const SimplifyQuery &Q,
581 unsigned Depth = 0);
583 bool SimplifyDemandedBits(Instruction *I, unsigned Op,
584 const APInt &DemandedMask, KnownBits &Known,
585 const SimplifyQuery &Q,
586 unsigned Depth = 0) override;
587
588 /// Helper routine of SimplifyDemandedUseBits. It computes KnownZero/KnownOne
589 /// bits. It also tries to handle simplifications that can be done based on
590 /// DemandedMask, but without modifying the Instruction.
591 Value *SimplifyMultipleUseDemandedBits(Instruction *I,
592 const APInt &DemandedMask,
593 KnownBits &Known,
594 const SimplifyQuery &Q,
595 unsigned Depth = 0);
596
597 /// Helper routine of SimplifyDemandedUseBits. It tries to simplify demanded
598 /// bit for "r1 = shr x, c1; r2 = shl r1, c2" instruction sequence.
599 Value *simplifyShrShlDemandedBits(
600 Instruction *Shr, const APInt &ShrOp1, Instruction *Shl,
601 const APInt &ShlOp1, const APInt &DemandedMask, KnownBits &Known);
602
603 /// Tries to simplify operands to an integer instruction based on its
604 /// demanded bits.
605 bool SimplifyDemandedInstructionBits(Instruction &Inst);
606 bool SimplifyDemandedInstructionBits(Instruction &Inst, KnownBits &Known);
607
608 Value *SimplifyDemandedVectorElts(Value *V, APInt DemandedElts,
609 APInt &PoisonElts, unsigned Depth = 0,
610 bool AllowMultipleUsers = false) override;
611
612 /// Attempts to replace V with a simpler value based on the demanded
613 /// floating-point classes
614 Value *SimplifyDemandedUseFPClass(Value *V, FPClassTest DemandedMask,
615 KnownFPClass &Known, Instruction *CxtI,
616 unsigned Depth = 0);
617 bool SimplifyDemandedFPClass(Instruction *I, unsigned Op,
618 FPClassTest DemandedMask, KnownFPClass &Known,
619 unsigned Depth = 0);
620
621 /// Common transforms for add / disjoint or
622 Instruction *foldAddLikeCommutative(Value *LHS, Value *RHS, bool NSW,
623 bool NUW);
624
625 /// Canonicalize the position of binops relative to shufflevector.
626 Instruction *foldVectorBinop(BinaryOperator &Inst);
630 VectorType *NewCTy);
631
632 /// Given a binary operator, cast instruction, or select which has a PHI node
633 /// as operand #0, see if we can fold the instruction into the PHI (which is
634 /// only possible if all operands to the PHI are constants).
636 bool AllowMultipleUses = false);
637
638 /// Try to fold binary operators whose operands are simple interleaved
639 /// recurrences to a single recurrence. This is a common pattern in reduction
640 /// operations.
641 /// Example:
642 /// %phi1 = phi [init1, %BB1], [%op1, %BB2]
643 /// %phi2 = phi [init2, %BB1], [%op2, %BB2]
644 /// %op1 = binop %phi1, constant1
645 /// %op2 = binop %phi2, constant2
646 /// %rdx = binop %op1, %op2
647 /// -->
648 /// %phi_combined = phi [init_combined, %BB1], [%op_combined, %BB2]
649 /// %rdx_combined = binop %phi_combined, constant_combined
651
652 /// For a binary operator with 2 phi operands, try to hoist the binary
653 /// operation before the phi. This can result in fewer instructions in
654 /// patterns where at least one set of phi operands simplifies.
655 /// Example:
656 /// BB3: binop (phi [X, BB1], [C1, BB2]), (phi [Y, BB1], [C2, BB2])
657 /// -->
658 /// BB1: BO = binop X, Y
659 /// BB3: phi [BO, BB1], [(binop C1, C2), BB2]
661
662 /// Given an instruction with a select as one operand and a constant as the
663 /// other operand, try to fold the binary operator into the select arguments.
664 /// This also works for Cast instructions, which obviously do not have a
665 /// second operand.
667 bool FoldWithMultiUse = false);
668
669 /// This is a convenience wrapper function for the above two functions.
671
673
676
677 /// Try to rotate an operation below a PHI node, using PHI nodes for
678 /// its operands.
687
688 /// If the phi is within a phi web, which is formed by the def-use chain
689 /// of phis and all the phis in the web are only used in the other phis.
690 /// In this case, these phis are dead and we will remove all of them.
691 bool foldDeadPhiWeb(PHINode &PN);
692
693 /// If an integer typed PHI has only one use which is an IntToPtr operation,
694 /// replace the PHI with an existing pointer typed PHI if it exists. Otherwise
695 /// insert a new pointer typed PHI and replace the original one.
697
698 /// Helper function for FoldPHIArgXIntoPHI() to set debug location for the
699 /// folded operation.
701
704 Instruction &I);
706 const ICmpInst &I);
707 bool foldAllocaCmp(AllocaInst *Alloca);
710 CmpInst &ICI,
711 ConstantInt *AndCst = nullptr);
713 Constant *RHSC);
717
726 const APInt &C);
729 Value *Z, CmpPredicate Pred);
735
737
739 const APInt &C);
741 ConstantInt *C);
743 const APInt &C);
745 const SimplifyQuery &Q);
747 const APInt &C);
749 const APInt &C);
751 const APInt &C);
753 const APInt &C);
755 const APInt &C);
757 const APInt &C);
759 const APInt &C);
761 const APInt &C);
763 const APInt &C);
765 const APInt &C);
767 const APInt &C);
769 const APInt &C1);
771 const APInt &C1, const APInt &C2);
773 const APInt &C);
775 const APInt &C2);
777 const APInt &C2);
778
780 BinaryOperator *BO,
781 const APInt &C);
783 BinaryOperator *BO,
784 const APInt &C);
786 const APInt &C);
788 const APInt &C);
792 ICmpInst &CxtI);
793
794 // Helpers of visitSelectInst().
802 Value *A, Value *B, Instruction &Outer,
806 Value *FalseVal);
809 unsigned Depth = 0);
810
811 Value *insertRangeTest(Value *V, const APInt &Lo, const APInt &Hi,
812 bool isSigned, bool Inside);
814
815 /// Given an initial instruction, check to see if it is the root of a
816 /// bswap/bitreverse idiom. If so, return the equivalent bswap/bitreverse
817 /// intrinsic.
819 bool MatchBitReversals);
820
823
825
826 bool tryToSinkInstruction(Instruction *I, BasicBlock *DestBlock);
828 Instruction *I, BasicBlock::iterator InsertPos, BasicBlock *SrcBlock,
830
832 void addDeadEdge(BasicBlock *From, BasicBlock *To,
838 void freelyInvertAllUsersOf(Value *V, Value *IgnoredUser = nullptr);
839
840 /// Take the exact integer log2 of the value. If DoFold is true, create the
841 /// actual instructions, otherwise return a non-null dummy value. Return
842 /// nullptr on failure. Note, if DoFold is true the caller must ensure that
843 /// takeLog2 will succeed, otherwise it may create stray instructions.
844 Value *takeLog2(Value *Op, unsigned Depth, bool AssumeNonZero, bool DoFold);
845
846 Value *tryGetLog2(Value *Op, bool AssumeNonZero) {
847 if (takeLog2(Op, /*Depth=*/0, AssumeNonZero, /*DoFold=*/false))
848 return takeLog2(Op, /*Depth=*/0, AssumeNonZero, /*DoFold=*/true);
849 return nullptr;
850 }
851};
852
853class Negator final {
854 /// Top-to-bottom, def-to-use negated instruction tree we produced.
856
858 BuilderTy Builder;
859
860 const DominatorTree &DT;
861
862 const bool IsTrulyNegation;
863
864 SmallDenseMap<Value *, Value *> NegationsCache;
865
866 Negator(LLVMContext &C, const DataLayout &DL, const DominatorTree &DT,
867 bool IsTrulyNegation);
868
869#if LLVM_ENABLE_STATS
870 unsigned NumValuesVisitedInThisNegator = 0;
871 ~Negator();
872#endif
873
874 using Result = std::pair<ArrayRef<Instruction *> /*NewInstructions*/,
875 Value * /*NegatedRoot*/>;
876
877 std::array<Value *, 2> getSortedOperandsOfBinOp(Instruction *I);
878
879 [[nodiscard]] Value *visitImpl(Value *V, bool IsNSW, unsigned Depth);
880
881 [[nodiscard]] Value *negate(Value *V, bool IsNSW, unsigned Depth);
882
883 /// Recurse depth-first and attempt to sink the negation.
884 /// FIXME: use worklist?
885 [[nodiscard]] std::optional<Result> run(Value *Root, bool IsNSW);
886
887 Negator(const Negator &) = delete;
888 Negator(Negator &&) = delete;
889 Negator &operator=(const Negator &) = delete;
890 Negator &operator=(Negator &&) = delete;
891
892public:
893 /// Attempt to negate \p Root. Retuns nullptr if negation can't be performed,
894 /// otherwise returns negated value.
895 [[nodiscard]] static Value *Negate(bool LHSIsZero, bool IsNSW, Value *Root,
896 InstCombinerImpl &IC);
897};
898
900 /// Common base pointer.
901 Value *Ptr = nullptr;
902 /// LHS GEPs until common base.
904 /// RHS GEPs until common base.
906 /// LHS GEP NoWrapFlags until common base.
908 /// RHS GEP NoWrapFlags until common base.
910
912
913 /// Whether expanding the GEP chains is expensive.
914 bool isExpensive() const;
915};
916
917} // end namespace llvm
918
919#undef DEBUG_TYPE
920
921#endif // LLVM_LIB_TRANSFORMS_INSTCOMBINE_INSTCOMBINEINTERNAL_H
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
constexpr LLT S1
AMDGPU Register Bank Select
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static GCRegistry::Add< ShadowStackGC > C("shadow-stack", "Very portable GC for uncooperative code generators")
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static bool foldICmpWithDominatingICmp(CmpInst *Cmp, const TargetLowering &TLI)
For pattern like:
#define LLVM_LIBRARY_VISIBILITY
Definition Compiler.h:137
static bool willNotOverflow(BinaryOpIntrinsic *BO, LazyValueInfo *LVI)
static bool isSigned(unsigned int Opcode)
#define DEBUG_TYPE
Hexagon Common GEP
IRTranslator LLVM IR MI
static constexpr unsigned NegatorMaxNodesSSO
static constexpr unsigned NegatorDefaultMaxDepth
This file provides the interface for the instcombine pass implementation.
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
#define I(x, y, z)
Definition MD5.cpp:58
uint64_t IntrinsicInst * II
StandardInstrumentations SI(Mod->getContext(), Debug, VerifyEach)
This file builds on the ADT/GraphTraits.h file to build a generic graph post order iterator.
This file contains the declarations for profiling metadata utility functions.
const SmallVectorImpl< MachineOperand > & Cond
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define LLVM_DEBUG(...)
Definition Debug.h:114
static TableGen::Emitter::Opt Y("gen-skeleton-entry", EmitSkeleton, "Generate example skeleton entry")
static TableGen::Emitter::OptClass< SkeletonEmitter > X("gen-skeleton-class", "Generate example skeleton class")
static OverflowResult computeOverflowForSignedAdd(const WithCache< const Value * > &LHS, const WithCache< const Value * > &RHS, const AddOperator *Add, const SimplifyQuery &SQ)
Value * RHS
Value * LHS
static const uint32_t IV[8]
Definition blake3_impl.h:83
Class for arbitrary precision integers.
Definition APInt.h:78
This class represents a conversion between pointers from one address space to another.
an instruction to allocate memory on the stack
This class represents any memset intrinsic.
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:41
A cache of @llvm.assume calls within a function.
an instruction that atomically reads a memory location, combines it with another value,...
LLVM Basic Block Representation.
Definition BasicBlock.h:62
InstListType::iterator iterator
Instruction iterators...
Definition BasicBlock.h:170
This class represents a no-op cast from one type to another.
BlockFrequencyInfo pass uses BlockFrequencyInfoImpl implementation to estimate IR basic block frequen...
Conditional or Unconditional Branch instruction.
Analysis providing branch probability information.
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
CallBr instruction, tracking function calls that may not return control but instead transfer it to a ...
This class represents a function call, abstracting a target machine's calling convention.
This is the base class for all instructions that perform data casts.
Definition InstrTypes.h:448
This class is the base class for the comparison instructions.
Definition InstrTypes.h:664
An abstraction over a floating-point predicate, and a pack of an integer predicate with samesign info...
This is the shared class of boolean and integer constants.
Definition Constants.h:87
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
This is an important base class in LLVM.
Definition Constant.h:43
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:63
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition Dominators.h:165
This instruction extracts a single (scalar) element from a VectorType value.
This instruction extracts a struct member or array element value from an aggregate value.
This instruction compares its operands according to the predicate given to the constructor.
This class represents a cast from floating point to signed integer.
This class represents a cast from floating point to unsigned integer.
This class represents a truncation of floating point types.
Convenience struct for specifying and reasoning about fast-math flags.
Definition FMF.h:22
An instruction for ordering other memory operations.
This class represents a freeze function that returns random concrete value if an operand is either a ...
Represents flags for the getelementptr instruction/expression.
static GEPNoWrapFlags all()
an instruction for type-safe pointer arithmetic to access elements of arrays and structs
This instruction compares its operands according to the predicate given to the constructor.
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition IRBuilder.h:2783
This instruction inserts a single (scalar) element into a VectorType value.
This instruction inserts a struct field of array element value into an aggregate value.
Instruction * visitMul(BinaryOperator &I)
Instruction * foldICmpShrConstant(ICmpInst &Cmp, BinaryOperator *Shr, const APInt &C)
Fold icmp ({al}shr X, Y), C.
Instruction * FoldOpIntoSelect(Instruction &Op, SelectInst *SI, bool FoldWithMultiUse=false)
Given an instruction with a select as one operand and a constant as the other operand,...
Instruction * foldICmpWithZextOrSext(ICmpInst &ICmp)
Instruction * foldICmpSelectConstant(ICmpInst &Cmp, SelectInst *Select, ConstantInt *C)
Instruction * foldICmpSRemConstant(ICmpInst &Cmp, BinaryOperator *UDiv, const APInt &C)
Instruction * foldSelectToCmp(SelectInst &SI)
Instruction * visitAdd(BinaryOperator &I)
bool fmulByZeroIsZero(Value *MulVal, FastMathFlags FMF, const Instruction *CtxI) const
Check if fmul MulVal, +0.0 will yield +0.0 (or signed zero is ignorable).
Instruction * foldICmpBinOpWithConstant(ICmpInst &Cmp, BinaryOperator *BO, const APInt &C)
Fold an icmp with BinaryOp and constant operand: icmp Pred BO, C.
Instruction * foldICmpOrConstant(ICmpInst &Cmp, BinaryOperator *Or, const APInt &C)
Fold icmp (or X, Y), C.
Instruction * canonicalizeCondSignextOfHighBitExtractToSignextHighBitExtract(BinaryOperator &I)
virtual ~InstCombinerImpl()=default
Instruction * foldICmpTruncWithTruncOrExt(ICmpInst &Cmp, const SimplifyQuery &Q)
Fold icmp (trunc nuw/nsw X), (trunc nuw/nsw Y).
KnownFPClass computeKnownFPClass(Value *Val, FastMathFlags FMF, FPClassTest Interested=fcAllFlags, const Instruction *CtxI=nullptr, unsigned Depth=0) const
Instruction * visitLShr(BinaryOperator &I)
Instruction * foldBinOpIntoSelectOrPhi(BinaryOperator &I)
This is a convenience wrapper function for the above two functions.
Instruction * visitUDiv(BinaryOperator &I)
Instruction * visitOr(BinaryOperator &I)
Instruction * foldSignBitTest(ICmpInst &I)
Fold equality-comparison between zero and any (maybe truncated) right-shift by one-less-than-bitwidth...
Instruction * foldSelectEqualityTest(SelectInst &SI)
Instruction * visitZExt(ZExtInst &Zext)
Instruction * visitGEPOfGEP(GetElementPtrInst &GEP, GEPOperator *Src)
Instruction * foldSelectValueEquivalence(SelectInst &SI, CmpInst &CI)
Instruction * visitAddrSpaceCast(AddrSpaceCastInst &CI)
Instruction * foldPHIArgInsertValueInstructionIntoPHI(PHINode &PN)
If we have something like phi [insertvalue(a,b,0), insertvalue(c,d,0)], turn this into a phi[a,...
Instruction * visitSExt(SExtInst &Sext)
Instruction * visitUnreachableInst(UnreachableInst &I)
Instruction * visitURem(BinaryOperator &I)
Instruction * foldSquareSumInt(BinaryOperator &I)
Instruction * foldOpIntoPhi(Instruction &I, PHINode *PN, bool AllowMultipleUses=false)
Given a binary operator, cast instruction, or select which has a PHI node as operand #0,...
InstCombinerImpl(InstructionWorklist &Worklist, BuilderTy &Builder, Function &F, AAResults *AA, AssumptionCache &AC, TargetLibraryInfo &TLI, TargetTransformInfo &TTI, DominatorTree &DT, OptimizationRemarkEmitter &ORE, BlockFrequencyInfo *BFI, BranchProbabilityInfo *BPI, ProfileSummaryInfo *PSI, const DataLayout &DL, ReversePostOrderTraversal< BasicBlock * > &RPOT)
Value * insertRangeTest(Value *V, const APInt &Lo, const APInt &Hi, bool isSigned, bool Inside)
Emit a computation of: (V >= Lo && V < Hi) if Inside is true, otherwise (V < Lo || V >= Hi).
void handleUnreachableFrom(Instruction *I, SmallVectorImpl< BasicBlock * > &Worklist)
Instruction * foldICmpBinOp(ICmpInst &Cmp, const SimplifyQuery &SQ)
Try to fold icmp (binop), X or icmp X, (binop).
Instruction * foldVectorSelect(SelectInst &Sel)
Instruction * foldCmpLoadFromIndexedGlobal(LoadInst *LI, GetElementPtrInst *GEP, CmpInst &ICI, ConstantInt *AndCst=nullptr)
This is called when we see this pattern: cmp pred (load (gep GV, ...)), cmpcst where GV is a global v...
Instruction * visitFreeze(FreezeInst &I)
Instruction * foldICmpSubConstant(ICmpInst &Cmp, BinaryOperator *Sub, const APInt &C)
Fold icmp (sub X, Y), C.
Instruction * foldSelectShuffle(ShuffleVectorInst &Shuf)
Try to fold shuffles that are the equivalent of a vector select.
Instruction * visitLoadInst(LoadInst &LI)
Value * takeLog2(Value *Op, unsigned Depth, bool AssumeNonZero, bool DoFold)
Take the exact integer log2 of the value.
Instruction * visitFPToSI(FPToSIInst &FI)
Instruction * foldICmpWithClamp(ICmpInst &Cmp, Value *X, MinMaxIntrinsic *Min)
Match and fold patterns like: icmp eq/ne X, min(max(X, Lo), Hi) which represents a range check and ca...
Instruction * foldICmpInstWithConstantNotInt(ICmpInst &Cmp)
Handle icmp with constant (but not simple integer constant) RHS.
Instruction * visitAtomicRMWInst(AtomicRMWInst &SI)
Instruction * visitSRem(BinaryOperator &I)
Instruction * foldSPFofSPF(Instruction *Inner, SelectPatternFlavor SPF1, Value *A, Value *B, Instruction &Outer, SelectPatternFlavor SPF2, Value *C)
Instruction * visitTrunc(TruncInst &CI)
Instruction * foldICmpShlConstConst(ICmpInst &I, Value *ShAmt, const APInt &C1, const APInt &C2)
Handle "(icmp eq/ne (shl AP2, A), AP1)" -> (icmp eq/ne A, TrailingZeros(AP1) - TrailingZeros(AP2)).
SelectInst * createSelectInstWithUnknownProfile(Value *C, Value *S1, Value *S2, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Create select C, S1, S2.
Instruction * foldSquareSumFP(BinaryOperator &I)
Value * reassociateShiftAmtsOfTwoSameDirectionShifts(BinaryOperator *Sh0, const SimplifyQuery &SQ, bool AnalyzeForSignBitExtraction=false)
Instruction * foldSelectOpOp(SelectInst &SI, Instruction *TI, Instruction *FI)
We have (select c, TI, FI), and we know that TI and FI have the same opcode.
Instruction * visitUIToFP(CastInst &CI)
Instruction * foldPHIArgBinOpIntoPHI(PHINode &PN)
If we have something like phi [add (a,b), add(a,c)] and if a/b/c and the adds all have a single user,...
void handlePotentiallyDeadBlocks(SmallVectorImpl< BasicBlock * > &Worklist)
bool sinkNotIntoLogicalOp(Instruction &I)
Instruction * foldICmpEqIntrinsicWithConstant(ICmpInst &ICI, IntrinsicInst *II, const APInt &C)
Fold an equality icmp with LLVM intrinsic and constant operand.
Instruction * visitPtrToInt(PtrToIntInst &CI)
bool prepareWorklist(Function &F)
Perform early cleanup and prepare the InstCombine worklist.
std::optional< std::pair< Intrinsic::ID, SmallVector< Value *, 3 > > > convertOrOfShiftsToFunnelShift(Instruction &Or)
Instruction * visitFDiv(BinaryOperator &I)
Instruction * SimplifyAnyMemSet(AnyMemSetInst *MI)
bool simplifyDivRemOfSelectWithZeroOp(BinaryOperator &I)
Fold a divide or remainder with a select instruction divisor when one of the select operands is zero.
Instruction * visitSIToFP(CastInst &CI)
Instruction * visitSub(BinaryOperator &I)
Instruction * visitAShr(BinaryOperator &I)
bool replaceInInstruction(Value *V, Value *Old, Value *New, unsigned Depth=0)
Instruction * visitFree(CallInst &FI, Value *FreedOp)
Instruction * visitInsertValueInst(InsertValueInst &IV)
Try to find redundant insertvalue instructions, like the following ones: %0 = insertvalue { i8,...
Instruction * visitAnd(BinaryOperator &I)
Value * foldMultiplicationOverflowCheck(ICmpInst &Cmp)
Fold (-1 u/ x) u< y ((x * y) ?
Instruction * visitCallBrInst(CallBrInst &CBI)
Instruction * visitExtractValueInst(ExtractValueInst &EV)
Instruction * visitInsertElementInst(InsertElementInst &IE)
void handlePotentiallyDeadSuccessors(BasicBlock *BB, BasicBlock *LiveSucc)
Value * foldPtrToIntOfGEP(Type *IntTy, Value *Ptr)
Instruction * visitUnconditionalBranchInst(BranchInst &BI)
Instruction * commonCastTransforms(CastInst &CI)
Implement the transforms common to all CastInst visitors.
Instruction * foldICmpWithConstant(ICmpInst &Cmp)
Fold icmp Pred X, C.
CmpInst * canonicalizeICmpPredicate(CmpInst &I)
If we have a comparison with a non-canonical predicate, if we can update all the users,...
Instruction * foldBinopWithRecurrence(BinaryOperator &BO)
Try to fold binary operators whose operands are simple interleaved recurrences to a single recurrence...
Instruction * eraseInstFromFunction(Instruction &I) override
Combiner aware instruction erasure.
Instruction * foldICmpWithZero(ICmpInst &Cmp)
Instruction * visitExtractElementInst(ExtractElementInst &EI)
Instruction * commonIDivRemTransforms(BinaryOperator &I)
Common integer divide/remainder transforms.
Value * foldReversedIntrinsicOperands(IntrinsicInst *II)
If all arguments of the intrinsic are reverses, try to pull the reverse after the intrinsic.
Instruction * visitPHINode(PHINode &PN)
Instruction * foldICmpCommutative(CmpPredicate Pred, Value *Op0, Value *Op1, ICmpInst &CxtI)
Instruction * foldICmpBinOpEqualityWithConstant(ICmpInst &Cmp, BinaryOperator *BO, const APInt &C)
Fold an icmp equality instruction with binary operator LHS and constant RHS: icmp eq/ne BO,...
Instruction * foldItoFPtoI(CastInst &FI)
fpto{s/u}i({u/s}itofp(X)) --> X or zext(X) or sext(X) or trunc(X) This is safe if the intermediate ty...
Instruction * foldPHIArgOpIntoPHI(PHINode &PN)
Try to rotate an operation below a PHI node, using PHI nodes for its operands.
Instruction * visitLandingPadInst(LandingPadInst &LI)
Instruction * foldICmpUsingBoolRange(ICmpInst &I)
If one operand of an icmp is effectively a bool (value range of {0,1}), then try to reduce patterns b...
Instruction * foldICmpWithTrunc(ICmpInst &Cmp)
Instruction * foldICmpIntrinsicWithConstant(ICmpInst &ICI, IntrinsicInst *II, const APInt &C)
Fold an icmp with LLVM intrinsic and constant operand: icmp Pred II, C.
Instruction * visitFPTrunc(FPTruncInst &CI)
Instruction * visitStoreInst(StoreInst &SI)
Value * tryGetLog2(Value *Op, bool AssumeNonZero)
Instruction * foldPHIArgZextsIntoPHI(PHINode &PN)
TODO: This function could handle other cast types, but then it might require special-casing a cast fr...
Instruction * foldSelectInstWithICmp(SelectInst &SI, ICmpInst *ICI)
Instruction * visitFenceInst(FenceInst &FI)
Instruction * visitFCmpInst(FCmpInst &I)
Value * OptimizePointerDifference(Value *LHS, Value *RHS, Type *Ty, bool isNUW)
Optimize pointer differences into the same array into a size.
Instruction * visitBitCast(BitCastInst &CI)
Instruction * visitReturnInst(ReturnInst &RI)
bool sinkNotIntoOtherHandOfLogicalOp(Instruction &I)
Instruction * commonIDivTransforms(BinaryOperator &I)
This function implements the transforms common to both integer division instructions (udiv and sdiv).
Instruction * foldICmpUsingKnownBits(ICmpInst &Cmp)
Try to fold the comparison based on range information we can get by checking whether bits are known t...
Instruction * foldICmpDivConstant(ICmpInst &Cmp, BinaryOperator *Div, const APInt &C)
Fold icmp ({su}div X, Y), C.
Instruction * foldIRemByPowerOfTwoToBitTest(ICmpInst &I)
If we have: icmp eq/ne (urem/srem x, y), 0 iff y is a power-of-two, we can replace this with a bit te...
Instruction * foldFCmpIntToFPConst(FCmpInst &I, Instruction *LHSI, Constant *RHSC)
Fold fcmp ([us]itofp x, cst) if possible.
Instruction * visitShl(BinaryOperator &I)
Instruction * visitSwitchInst(SwitchInst &SI)
Instruction * foldICmpUDivConstant(ICmpInst &Cmp, BinaryOperator *UDiv, const APInt &C)
Fold icmp (udiv X, Y), C.
Instruction * visitFAdd(BinaryOperator &I)
Instruction * foldBinopWithPhiOperands(BinaryOperator &BO)
For a binary operator with 2 phi operands, try to hoist the binary operation before the phi.
Instruction * visitIntToPtr(IntToPtrInst &CI)
Instruction * foldICmpAddOpConst(Value *X, const APInt &C, CmpPredicate Pred)
Fold "icmp pred (X+C), X".
Instruction * foldICmpWithCastOp(ICmpInst &ICmp)
Handle icmp (cast x), (cast or constant).
Instruction * visitFPToUI(FPToUIInst &FI)
Instruction * foldICmpTruncConstant(ICmpInst &Cmp, TruncInst *Trunc, const APInt &C)
Fold icmp (trunc X), C.
bool mergeStoreIntoSuccessor(StoreInst &SI)
Try to transform: if () { *P = v1; } else { *P = v2 } or: *P = v1; if () { *P = v2; }...
Instruction * visitPtrToAddr(PtrToAddrInst &CI)
Instruction * visitInstruction(Instruction &I)
Specify what to return for unhandled instructions.
Instruction * foldSelectIntoOp(SelectInst &SI, Value *, Value *)
Try to fold the select into one of the operands to allow further optimization.
Instruction * foldShuffledIntrinsicOperands(IntrinsicInst *II)
If all arguments of the intrinsic are unary shuffles with the same mask, try to shuffle after the int...
Instruction * foldICmpAddConstant(ICmpInst &Cmp, BinaryOperator *Add, const APInt &C)
Fold icmp (add X, Y), C.
Instruction * foldICmpMulConstant(ICmpInst &Cmp, BinaryOperator *Mul, const APInt &C)
Fold icmp (mul X, Y), C.
Instruction * visitInvokeInst(InvokeInst &II)
Value * simplifyRangeCheck(ICmpInst *Cmp0, ICmpInst *Cmp1, bool Inverted)
Try to fold a signed range checked with lower bound 0 to an unsigned icmp.
KnownFPClass computeKnownFPClass(Value *Val, FPClassTest Interested=fcAllFlags, const Instruction *CtxI=nullptr, unsigned Depth=0) const
Instruction * foldVariableSignZeroExtensionOfVariableHighBitExtract(BinaryOperator &OldAShr)
Instruction * commonShiftTransforms(BinaryOperator &I)
Instruction * visitFRem(BinaryOperator &I)
Instruction * foldPHIArgLoadIntoPHI(PHINode &PN)
Instruction * foldICmpXorConstant(ICmpInst &Cmp, BinaryOperator *Xor, const APInt &C)
Fold icmp (xor X, Y), C.
Instruction * foldSelectICmp(CmpPredicate Pred, SelectInst *SI, Value *RHS, const ICmpInst &I)
bool foldIntegerTypedPHI(PHINode &PN)
If an integer typed PHI has only one use which is an IntToPtr operation, replace the PHI with an exis...
Instruction * foldICmpInstWithConstantAllowPoison(ICmpInst &Cmp, const APInt &C)
Try to fold integer comparisons with a constant operand: icmp Pred X, C where X is some kind of instr...
bool foldDeadPhiWeb(PHINode &PN)
If the phi is within a phi web, which is formed by the def-use chain of phis and all the phis in the ...
Instruction * foldIsMultipleOfAPowerOfTwo(ICmpInst &Cmp)
Fold icmp eq (num + mask) & ~mask, num to icmp eq (and num, mask), 0 Where mask is a low bit mask.
Instruction * visitXor(BinaryOperator &I)
Value * foldSelectWithConstOpToBinOp(ICmpInst *Cmp, Value *TrueVal, Value *FalseVal)
Value * EvaluateInDifferentType(Value *V, Type *Ty, bool isSigned)
Given an expression that CanEvaluateTruncated or CanEvaluateSExtd returns true for,...
Instruction * simplifyBinOpSplats(ShuffleVectorInst &SVI)
void CreateNonTerminatorUnreachable(Instruction *InsertAt)
Create and insert the idiom we use to indicate a block is unreachable without having to rewrite the C...
Instruction * foldICmpAndShift(ICmpInst &Cmp, BinaryOperator *And, const APInt &C1, const APInt &C2)
Fold icmp (and (sh X, Y), C2), C1.
Value * pushFreezeToPreventPoisonFromPropagating(FreezeInst &FI)
Instruction * foldICmpBinOpWithConstantViaTruthTable(ICmpInst &Cmp, BinaryOperator *BO, const APInt &C)
Instruction * foldICmpInstWithConstant(ICmpInst &Cmp)
Try to fold integer comparisons with a constant operand: icmp Pred X, C where X is some kind of instr...
Instruction * visitSelectInst(SelectInst &SI)
Instruction * foldICmpXorShiftConst(ICmpInst &Cmp, BinaryOperator *Xor, const APInt &C)
For power-of-2 C: ((X s>> ShiftC) ^ X) u< C --> (X + C) u< (C << 1) ((X s>> ShiftC) ^ X) u> (C - 1) -...
Instruction * foldPHIArgIntToPtrToPHI(PHINode &PN)
Instruction * visitFPExt(CastInst &CI)
Instruction * foldICmpShlConstant(ICmpInst &Cmp, BinaryOperator *Shl, const APInt &C)
Fold icmp (shl X, Y), C.
Instruction * visitFMul(BinaryOperator &I)
Instruction * foldSelectOfBools(SelectInst &SI)
Instruction * foldSelectExtConst(SelectInst &Sel)
Instruction * foldAddWithConstant(BinaryOperator &Add)
Instruction * foldICmpAndConstant(ICmpInst &Cmp, BinaryOperator *And, const APInt &C)
Fold icmp (and X, Y), C.
bool run()
Run the combiner over the entire worklist until it is empty.
Instruction * foldFMulReassoc(BinaryOperator &I)
Instruction * SliceUpIllegalIntegerPHI(PHINode &PN)
This is an integer PHI and we know that it has an illegal type: see if it is only used by trunc or tr...
Instruction * foldAggregateConstructionIntoAggregateReuse(InsertValueInst &OrigIVI)
Look for chain of insertvalue's that fully define an aggregate, and trace back the values inserted,...
Instruction * foldICmpEquality(ICmpInst &Cmp)
bool removeInstructionsBeforeUnreachable(Instruction &I)
Instruction * foldPHIArgGEPIntoPHI(PHINode &PN)
Instruction * foldICmpWithMinMax(Instruction &I, MinMaxIntrinsic *MinMax, Value *Z, CmpPredicate Pred)
Fold icmp Pred min|max(X, Y), Z.
Instruction * visitShuffleVectorInst(ShuffleVectorInst &SVI)
Instruction * FoldShiftByConstant(Value *Op0, Constant *Op1, BinaryOperator &I)
void tryToSinkInstructionDbgVariableRecords(Instruction *I, BasicBlock::iterator InsertPos, BasicBlock *SrcBlock, BasicBlock *DestBlock, SmallVectorImpl< DbgVariableRecord * > &DPUsers)
bool foldAllocaCmp(AllocaInst *Alloca)
void addDeadEdge(BasicBlock *From, BasicBlock *To, SmallVectorImpl< BasicBlock * > &Worklist)
void PHIArgMergedDebugLoc(Instruction *Inst, PHINode &PN)
Helper function for FoldPHIArgXIntoPHI() to set debug location for the folded operation.
Instruction * visitVAEndInst(VAEndInst &I)
Instruction * matchBSwapOrBitReverse(Instruction &I, bool MatchBSwaps, bool MatchBitReversals)
Given an initial instruction, check to see if it is the root of a bswap/bitreverse idiom.
Constant * unshuffleConstant(ArrayRef< int > ShMask, Constant *C, VectorType *NewCTy)
Find a constant NewC that has property: shuffle(NewC, ShMask) = C Returns nullptr if such a constant ...
Instruction * visitAllocSite(Instruction &FI)
Instruction * visitICmpInst(ICmpInst &I)
Instruction * SimplifyAnyMemTransfer(AnyMemTransferInst *MI)
Instruction * visitGetElementPtrInst(GetElementPtrInst &GEP)
Instruction * visitBranchInst(BranchInst &BI)
Instruction * foldPowiReassoc(BinaryOperator &I)
Instruction * foldFreezeIntoRecurrence(FreezeInst &I, PHINode *PN)
Instruction * visitSDiv(BinaryOperator &I)
bool tryToSinkInstruction(Instruction *I, BasicBlock *DestBlock)
Try to move the specified instruction from its current block into the beginning of DestBlock,...
Instruction * foldPHIArgExtractValueInstructionIntoPHI(PHINode &PN)
If we have something like phi [extractvalue(a,0), extractvalue(b,0)], turn this into a phi[a,...
Instruction * foldICmpShrConstConst(ICmpInst &I, Value *ShAmt, const APInt &C1, const APInt &C2)
Handle "(icmp eq/ne (ashr/lshr AP2, A), AP1)" -> (icmp eq/ne A, Log2(AP2/AP1)) -> (icmp eq/ne A,...
bool freezeOtherUses(FreezeInst &FI)
Instruction * visitFNeg(UnaryOperator &I)
void freelyInvertAllUsersOf(Value *V, Value *IgnoredUser=nullptr)
Freely adapt every user of V as-if V was changed to !V.
Instruction * commonIRemTransforms(BinaryOperator &I)
This function implements the transforms common to both integer remainder instructions (urem and srem)...
Instruction * visitAllocaInst(AllocaInst &AI)
Instruction * visitCallInst(CallInst &CI)
CallInst simplification.
Instruction * foldICmpAndConstConst(ICmpInst &Cmp, BinaryOperator *And, const APInt &C1)
Fold icmp (and X, C2), C1.
Instruction * visitFSub(BinaryOperator &I)
Instruction * foldICmpBitCast(ICmpInst &Cmp)
Instruction * foldGEPICmp(GEPOperator *GEPLHS, Value *RHS, CmpPredicate Cond, Instruction &I)
Fold comparisons between a GEP instruction and something else.
SimplifyQuery SQ
IRBuilder< TargetFolder, IRBuilderCallbackInserter > BuilderTy
An IRBuilder that automatically inserts new instructions into the worklist.
BlockFrequencyInfo * BFI
TargetLibraryInfo & TLI
InstructionWorklist & Worklist
A worklist of the instructions that need to be simplified.
Instruction * InsertNewInstWith(Instruction *New, BasicBlock::iterator Old)
Same as InsertNewInstBefore, but also sets the debug loc.
BranchProbabilityInfo * BPI
virtual bool SimplifyDemandedBits(Instruction *I, unsigned OpNo, const APInt &DemandedMask, KnownBits &Known, const SimplifyQuery &Q, unsigned Depth=0)=0
ReversePostOrderTraversal< BasicBlock * > & RPOT
const DataLayout & DL
DomConditionCache DC
AssumptionCache & AC
DominatorTree & DT
ProfileSummaryInfo * PSI
BuilderTy & Builder
OptimizationRemarkEmitter & ORE
InstCombiner(InstructionWorklist &Worklist, BuilderTy &Builder, Function &F, AAResults *AA, AssumptionCache &AC, TargetLibraryInfo &TLI, TargetTransformInfo &TTI, DominatorTree &DT, OptimizationRemarkEmitter &ORE, BlockFrequencyInfo *BFI, BranchProbabilityInfo *BPI, ProfileSummaryInfo *PSI, const DataLayout &DL, ReversePostOrderTraversal< BasicBlock * > &RPOT)
const SimplifyQuery & getSimplifyQuery() const
Base class for instruction visitors.
Definition InstVisitor.h:78
InstructionWorklist - This is the worklist management logic for InstCombine and other simplification ...
This class represents a cast from an integer to a pointer.
A wrapper class for inspecting calls to intrinsic functions.
Invoke instruction.
This is an important class for using LLVM in a threaded context.
Definition LLVMContext.h:68
The landingpad instruction holds all of the information necessary to generate correct exception handl...
An instruction for reading from memory.
This class represents min/max intrinsics.
static Value * Negate(bool LHSIsZero, bool IsNSW, Value *Root, InstCombinerImpl &IC)
Attempt to negate Root.
The optimization diagnostic interface.
static PointerType * getUnqual(Type *ElementType)
This constructs a pointer to an object of the specified type in the default address space (address sp...
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
Analysis providing profile information.
This class represents a cast from a pointer to an address (non-capturing ptrtoint).
This class represents a cast from a pointer to an integer.
Return a value (possibly void), from a function.
This class represents a sign extension of integer types.
This class represents the LLVM 'select' instruction.
static SelectInst * Create(Value *C, Value *S1, Value *S2, const Twine &NameStr="", InsertPosition InsertBefore=nullptr, const Instruction *MDFrom=nullptr)
This instruction constructs a fixed permutation of two input vectors.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
An instruction for storing to memory.
Multiway switch.
Provides information about what library functions are available for the current target.
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
This class represents a truncation of integer types.
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition Twine.h:82
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45
This function has undefined behavior.
This represents the llvm.va_end intrinsic.
LLVM Value Representation.
Definition Value.h:75
LLVM_ABI LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.cpp:1099
Base class of all SIMD vector types.
This class represents zero extension of integer types.
self_iterator getIterator()
Definition ilist_node.h:123
CallInst * Call
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
friend class Instruction
Iterator for Instructions in a `BasicBlock.
Definition BasicBlock.h:73
This is an optimization pass for GlobalISel generic memory operations.
@ NeverOverflows
Never overflows.
LLVM_ABI KnownFPClass computeKnownFPClass(const Value *V, const APInt &DemandedElts, FPClassTest InterestedClasses, const SimplifyQuery &SQ, unsigned Depth=0)
Determine which floating-point classes are valid for V, and return them in KnownFPClass bit sets.
LLVM_ABI void salvageDebugInfo(const MachineRegisterInfo &MRI, MachineInstr &MI)
Assuming the instruction MI is going to be deleted, attempt to salvage debug users of MI by writing t...
Definition Utils.cpp:1725
LLVM_ABI void setExplicitlyUnknownBranchWeightsIfProfiled(Instruction &I, Function &F, StringRef PassName)
Like setExplicitlyUnknownBranchWeights(...), but only sets unknown branch weights in the new instruct...
LLVM_ABI OverflowResult computeOverflowForUnsignedMul(const Value *LHS, const Value *RHS, const SimplifyQuery &SQ, bool IsNSW=false)
LLVM_ABI OverflowResult computeOverflowForSignedSub(const Value *LHS, const Value *RHS, const SimplifyQuery &SQ)
SelectPatternFlavor
Specific patterns of select instructions we can match.
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:207
LLVM_ABI OverflowResult computeOverflowForSignedMul(const Value *LHS, const Value *RHS, const SimplifyQuery &SQ)
TargetTransformInfo TTI
@ Mul
Product of integers.
@ Xor
Bitwise or logical XOR of integers.
@ Sub
Subtraction of integers.
@ Add
Sum of integers.
DWARFExpression::Operation Op
constexpr unsigned BitWidth
LLVM_ABI OverflowResult computeOverflowForUnsignedSub(const Value *LHS, const Value *RHS, const SimplifyQuery &SQ)
LLVM_ABI OverflowResult computeOverflowForUnsignedAdd(const WithCache< const Value * > &LHS, const WithCache< const Value * > &RHS, const SimplifyQuery &SQ)
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
Value * Ptr
Common base pointer.
SmallVector< GEPOperator * > RHSGEPs
RHS GEPs until common base.
GEPNoWrapFlags LHSNW
LHS GEP NoWrapFlags until common base.
GEPNoWrapFlags RHSNW
RHS GEP NoWrapFlags until common base.
SmallVector< GEPOperator * > LHSGEPs
LHS GEPs until common base.
bool isExpensive() const
Whether expanding the GEP chains is expensive.
static CommonPointerBase compute(Value *LHS, Value *RHS)
Matching combinators.