doxygen/InstCombineCalls_8cpp_source.html

//===- InstCombineCalls.cpp -----------------------------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file implements the visitCall, visitInvoke, and visitCallBr functions.

//

//===----------------------------------------------------------------------===//


#include "InstCombineInternal.h"

#include "llvm/ADT/APFloat.h"

#include "llvm/ADT/APInt.h"

#include "llvm/ADT/APSInt.h"

#include "llvm/ADT/ArrayRef.h"

#include "llvm/ADT/STLFunctionalExtras.h"

#include "llvm/ADT/SmallBitVector.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/ADT/Statistic.h"

#include "llvm/Analysis/AliasAnalysis.h"

#include "llvm/Analysis/AssumeBundleQueries.h"

#include "llvm/Analysis/AssumptionCache.h"

#include "llvm/Analysis/InstructionSimplify.h"

#include "llvm/Analysis/Loads.h"

#include "llvm/Analysis/MemoryBuiltins.h"

#include "llvm/Analysis/ValueTracking.h"

#include "llvm/Analysis/VectorUtils.h"

#include "llvm/IR/AttributeMask.h"

#include "llvm/IR/Attributes.h"

#include "llvm/IR/BasicBlock.h"

#include "llvm/IR/Constant.h"

#include "llvm/IR/Constants.h"

#include "llvm/IR/DataLayout.h"

#include "llvm/IR/DebugInfo.h"

#include "llvm/IR/DerivedTypes.h"

#include "llvm/IR/Function.h"

#include "llvm/IR/GlobalVariable.h"

#include "llvm/IR/InlineAsm.h"

#include "llvm/IR/InstrTypes.h"

#include "llvm/IR/Instruction.h"

#include "llvm/IR/Instructions.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/Intrinsics.h"

#include "llvm/IR/IntrinsicsAArch64.h"

#include "llvm/IR/IntrinsicsAMDGPU.h"

#include "llvm/IR/IntrinsicsARM.h"

#include "llvm/IR/IntrinsicsHexagon.h"

#include "llvm/IR/LLVMContext.h"

#include "llvm/IR/Metadata.h"

#include "llvm/IR/PatternMatch.h"

#include "llvm/IR/Statepoint.h"

#include "llvm/IR/Type.h"

#include "llvm/IR/User.h"

#include "llvm/IR/Value.h"

#include "llvm/IR/ValueHandle.h"

#include "llvm/Support/AtomicOrdering.h"

#include "llvm/Support/Casting.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Support/Compiler.h"

#include "llvm/Support/Debug.h"

#include "llvm/Support/ErrorHandling.h"

#include "llvm/Support/KnownBits.h"

#include "llvm/Support/MathExtras.h"

#include "llvm/Support/raw_ostream.h"

#include "llvm/Transforms/InstCombine/InstCombiner.h"

#include "llvm/Transforms/Utils/AssumeBundleBuilder.h"

#include "llvm/Transforms/Utils/Local.h"

#include "llvm/Transforms/Utils/SimplifyLibCalls.h"

#include <algorithm>

#include <cassert>

#include <cstdint>

#include <optional>

#include <utility>

#include <vector>


#define DEBUG_TYPE "instcombine"

#include "llvm/Transforms/Utils/InstructionWorklist.h"


using namespace llvm;

using namespace PatternMatch;


// Pass statistic counter; its description string reads "Number of library
// calls simplified".
STATISTIC(NumSimplified, "Number of library calls simplified");


// Command-line knob "instcombine-guard-widening-window" (unsigned, default 3).
// Per its description it bounds how many instructions may be bypassed while
// looking for another guard.
static cl::opt<unsigned> GuardWideningWindow(

    "instcombine-guard-widening-window",

    cl::init(3),

    cl::desc("How wide an instruction window to bypass looking for "

             "another guard"));


/// Return \p Ty promoted the way it would be when passed through a va_arg
/// area: integer types narrower than 32 bits become i32, every other type is
/// returned unchanged.
static Type *getPromotedType(Type *Ty) {
  auto *IntTy = dyn_cast<IntegerType>(Ty);
  const bool NeedsWidening = IntTy && IntTy->getBitWidth() < 32;
  if (!NeedsWidening)
    return Ty;
  return Type::getInt32Ty(Ty->getContext());
}


/// Recognize a memcpy/memmove whose source is a trivially otherwise unused
/// alloca.
///
/// Walks from the raw source pointer of \p MI up through GEP and bitcast
/// instructions, requiring each of them to have exactly one use, and reports
/// whether the walk ends at a single-use alloca.
///
/// TODO: This should probably be integrated with visitAllocSites, but that
/// requires a deeper change to allow either unread or unwritten objects.
static bool hasUndefSource(AnyMemTransferInst *MI) {
  Value *Cur = MI->getRawSource();
  for (;;) {
    const bool IsAddressComputation =
        isa<GetElementPtrInst>(Cur) || isa<BitCastInst>(Cur);
    if (!IsAddressComputation)
      break;
    // Any additional user could observe the memory, so give up.
    if (!Cur->hasOneUse())
      return false;
    Cur = cast<Instruction>(Cur)->getOperand(0);
  }
  return isa<AllocaInst>(Cur) && Cur->hasOneUse();
}


/// Simplify a memory transfer intrinsic \p MI (atomic or non-atomic).
///
/// Tried in order, returning as soon as one step changes \p MI:
///  1. Raise the recorded destination alignment to the provable one.
///  2. Raise the recorded source alignment to the provable one.
///  3. Zero the length when the destination is known not to be modifiable.
///  4. Zero the length when the source is an otherwise unused alloca and the
///     transfer is not volatile.
///  5. Replace a constant 1/2/4/8-byte transfer with one integer load+store.
///
/// \returns \p MI if it was changed (a zero-length transfer is deleted on the
/// next iteration), nullptr otherwise.
Instruction *InstCombinerImpl::SimplifyAnyMemTransfer(AnyMemTransferInst *MI) {
  // Set the size of the copy to 0, it will be deleted on the next iteration.
  auto ZeroOutLength = [MI]() -> Instruction * {
    MI->setLength(Constant::getNullValue(MI->getLength()->getType()));
    return MI;
  };

  const Align ProvenDstAlign =
      getKnownAlignment(MI->getRawDest(), DL, MI, &AC, &DT);
  const MaybeAlign StatedDstAlign = MI->getDestAlign();
  if (!StatedDstAlign || *StatedDstAlign < ProvenDstAlign) {
    MI->setDestAlignment(ProvenDstAlign);
    return MI;
  }

  const Align ProvenSrcAlign =
      getKnownAlignment(MI->getRawSource(), DL, MI, &AC, &DT);
  const MaybeAlign StatedSrcAlign = MI->getSourceAlign();
  if (!StatedSrcAlign || *StatedSrcAlign < ProvenSrcAlign) {
    MI->setSourceAlignment(ProvenSrcAlign);
    return MI;
  }

  // If we have a store to a location which is known constant, we can conclude
  // that the store must be storing the constant value (else the memory
  // wouldn't be constant), and this must be a noop.
  if (!isModSet(AA->getModRefInfoMask(MI->getDest())))
    return ZeroOutLength();

  // If the source is provably undef, the memcpy/memmove doesn't do anything
  // (unless the transfer is volatile).
  if (hasUndefSource(MI) && !MI->isVolatile())
    return ZeroOutLength();

  // Only transfers of a constant 1/2/4/8 bytes are turned into load/store.
  auto *LenC = dyn_cast<ConstantInt>(MI->getLength());
  if (!LenC)
    return nullptr;

  // Source and destination pointer types are always "i8*" for intrinsic.  See
  // if the size is something we can handle with a single primitive load/store.
  // A single load+store correctly handles overlapping memory in the memmove
  // case.
  const uint64_t NumBytes = LenC->getLimitedValue();
  assert(NumBytes && "0-sized memory transferring should be removed already.");

  const bool IsPowerOfTwo = (NumBytes & (NumBytes - 1)) == 0;
  if (NumBytes > 8 || !IsPowerOfTwo)
    return nullptr; // If not 1/2/4/8 bytes, exit.

  // If it is an atomic and alignment is less than the size then we will
  // introduce the unaligned memory access which will be later transformed
  // into libcall in CodeGen. This is not evident performance gain so disable
  // it now.
  const bool IsAtomic = isa<AtomicMemTransferInst>(MI);
  if (IsAtomic &&
      (*StatedDstAlign < NumBytes || *StatedSrcAlign < NumBytes))
    return nullptr;

  // Use an integer load+store unless we can find something better.
  IntegerType *CopyTy = IntegerType::get(MI->getContext(), NumBytes << 3);

  // If the memcpy has metadata describing the members, see if we can get the
  // TBAA tag describing our copy.
  const AAMDNodes CopyAAMD = MI->getAAMetadata().adjustForAccess(NumBytes);

  Value *SrcPtr = MI->getArgOperand(1);
  Value *DstPtr = MI->getArgOperand(0);

  LoadInst *Ld = Builder.CreateLoad(CopyTy, SrcPtr);
  // Alignment from the mem intrinsic will be better, so use it.
  Ld->setAlignment(*StatedSrcAlign);
  Ld->setAAMetadata(CopyAAMD);

  // Loop-parallelism metadata attached to the intrinsic is forwarded to both
  // new memory accesses.
  MDNode *ParallelLoopMD =
      MI->getMetadata(LLVMContext::MD_mem_parallel_loop_access);
  MDNode *AccessGroupMD = MI->getMetadata(LLVMContext::MD_access_group);
  auto ForwardLoopMD = [ParallelLoopMD, AccessGroupMD](Instruction *Access) {
    if (ParallelLoopMD)
      Access->setMetadata(LLVMContext::MD_mem_parallel_loop_access,
                          ParallelLoopMD);
    if (AccessGroupMD)
      Access->setMetadata(LLVMContext::MD_access_group, AccessGroupMD);
  };
  ForwardLoopMD(Ld);

  StoreInst *St = Builder.CreateStore(Ld, DstPtr);
  // Alignment from the mem intrinsic will be better, so use it.
  St->setAlignment(*StatedDstAlign);
  St->setAAMetadata(CopyAAMD);
  ForwardLoopMD(St);
  St->copyMetadata(*MI, LLVMContext::MD_DIAssignID);

  if (auto *Plain = dyn_cast<MemTransferInst>(MI)) {
    // non-atomics can be volatile
    Ld->setVolatile(Plain->isVolatile());
    St->setVolatile(Plain->isVolatile());
  }
  if (IsAtomic) {
    // atomics have to be unordered
    Ld->setOrdering(AtomicOrdering::Unordered);
    St->setOrdering(AtomicOrdering::Unordered);
  }

  return ZeroOutLength();
}


/// Simplify a memset intrinsic \p MI (atomic or non-atomic).
///
/// Tried in order, returning as soon as one step changes \p MI:
///  1. Raise the recorded destination alignment to the provable one.
///  2. Zero the length when the destination is known not to be modifiable.
///  3. Zero the length when the fill value is undef.
///  4. Replace a constant 1/2/4/8-byte memset of a constant i8 with a single
///     integer store.
///
/// \returns \p MI if it was changed (a zero-length memset is deleted on the
/// next iteration), nullptr otherwise.
Instruction *InstCombinerImpl::SimplifyAnyMemSet(AnyMemSetInst *MI) {
  // Set the size of the copy to 0, it will be deleted on the next iteration.
  auto ZeroOutLength = [MI]() -> Instruction * {
    MI->setLength(Constant::getNullValue(MI->getLength()->getType()));
    return MI;
  };

  const Align ProvenAlign = getKnownAlignment(MI->getDest(), DL, MI, &AC, &DT);
  const MaybeAlign StatedAlign = MI->getDestAlign();
  if (!StatedAlign || *StatedAlign < ProvenAlign) {
    MI->setDestAlignment(ProvenAlign);
    return MI;
  }

  // If we have a store to a location which is known constant, we can conclude
  // that the store must be storing the constant value (else the memory
  // wouldn't be constant), and this must be a noop.
  if (!isModSet(AA->getModRefInfoMask(MI->getDest())))
    return ZeroOutLength();

  // Remove memset with an undef value.
  // FIXME: This is technically incorrect because it might overwrite a poison
  // value. Change to PoisonValue once #52930 is resolved.
  if (isa<UndefValue>(MI->getValue()))
    return ZeroOutLength();

  // Extract the length and alignment and fill if they are constant.
  auto *LenC = dyn_cast<ConstantInt>(MI->getLength());
  auto *FillC = dyn_cast<ConstantInt>(MI->getValue());
  const bool HasConstantByteFill =
      LenC && FillC && FillC->getType()->isIntegerTy(8);
  if (!HasConstantByteFill)
    return nullptr;

  const uint64_t Len = LenC->getLimitedValue();
  assert(Len && "0-sized memory setting should be removed already.");
  const Align Alignment = MI->getDestAlign().valueOrOne();

  // If it is an atomic and alignment is less than the size then we will
  // introduce the unaligned memory access which will be later transformed
  // into libcall in CodeGen. This is not evident performance gain so disable
  // it now.
  const bool IsAtomic = isa<AtomicMemSetInst>(MI);
  if (IsAtomic && Alignment < Len)
    return nullptr;

  // memset(s,c,n) -> store s, c (for n=1,2,4,8)
  if (Len > 8 || !isPowerOf2_32(static_cast<uint32_t>(Len)))
    return nullptr;

  Type *StoreTy = IntegerType::get(MI->getContext(), Len * 8); // n=1 -> i8.
  Value *DstPtr = MI->getDest();

  // Replicate the fill byte into every byte of a 64-bit pattern and store it
  // as an integer of the width chosen above.
  const uint64_t Pattern = FillC->getZExtValue() * 0x0101010101010101ULL;
  Constant *PatternC = ConstantInt::get(StoreTy, Pattern);
  StoreInst *St = Builder.CreateStore(PatternC, DstPtr, MI->isVolatile());
  St->copyMetadata(*MI, LLVMContext::MD_DIAssignID);

  // Assignment markers that referenced the i8 fill constant are switched to
  // the widened constant that is actually stored.
  auto RetargetMarker = [FillC, PatternC](auto *Marker) {
    if (llvm::is_contained(Marker->location_ops(), FillC))
      Marker->replaceVariableLocationOp(FillC, PatternC);
  };
  for (auto *Marker : at::getAssignmentMarkers(St))
    RetargetMarker(Marker);
  for (auto *Record : at::getDVRAssignmentMarkers(St))
    RetargetMarker(Record);

  St->setAlignment(Alignment);
  if (IsAtomic)
    St->setOrdering(AtomicOrdering::Unordered);

  return ZeroOutLength();
}


// Simplify a masked load intrinsic: an all-ones/undef mask gives a plain
// aligned load, and a pointer that is dereferenceable for the whole result
// type gives an unconditional load followed by a select against the
// pass-through operand. Returns nullptr when neither applies.
//
// TODO, Obvious Missing Transforms:
// * Narrow width by halves excluding zero/undef lanes
Value *InstCombinerImpl::simplifyMaskedLoad(IntrinsicInst &II) {
  Value *Ptr = II.getArgOperand(0);
  const Align Alignment =
      cast<ConstantInt>(II.getArgOperand(1))->getAlignValue();
  Value *Mask = II.getArgOperand(2);

  // Both folds start from the same full-width load carrying II's metadata.
  auto EmitUnmaskedLoad = [&]() -> LoadInst * {
    LoadInst *Ld = Builder.CreateAlignedLoad(II.getType(), Ptr, Alignment,
                                             "unmaskedload");
    Ld->copyMetadata(II);
    return Ld;
  };

  // If the mask is all ones or undefs, this is a plain vector load of the 1st
  // argument.
  if (maskIsAllOneOrUndef(Mask))
    return EmitUnmaskedLoad();

  // If we can unconditionally load from this address, replace with a
  // load/select idiom. TODO: use DT for context sensitive query
  if (!isDereferenceablePointer(Ptr, II.getType(),
                                II.getModule()->getDataLayout(), &II, &AC))
    return nullptr;

  LoadInst *Ld = EmitUnmaskedLoad();
  return Builder.CreateSelect(Mask, Ld, II.getArgOperand(3));
}


// Simplify a masked store intrinsic with a constant mask: an all-zero mask
// erases the call, an all-ones mask becomes a plain aligned store, and for
// other fixed-width masks the stored value is simplified using only the lanes
// the mask may enable. Returns nullptr when nothing changes.
//
// TODO, Obvious Missing Transforms:
// * Single constant active lane -> store
// * Narrow width by halves excluding zero/undef lanes
Instruction *InstCombinerImpl::simplifyMaskedStore(IntrinsicInst &II) {
  auto *Mask = dyn_cast<Constant>(II.getArgOperand(3));
  if (!Mask)
    return nullptr;

  // If the mask is all zeros, this instruction does nothing.
  if (Mask->isNullValue())
    return eraseInstFromFunction(II);

  // If the mask is all ones, this is a plain vector store of the 1st argument.
  if (Mask->isAllOnesValue()) {
    Value *Ptr = II.getArgOperand(1);
    const Align Alignment =
        cast<ConstantInt>(II.getArgOperand(2))->getAlignValue();
    auto *PlainStore = new StoreInst(II.getArgOperand(0), Ptr,
                                     /*isVolatile=*/false, Alignment);
    PlainStore->copyMetadata(II);
    return PlainStore;
  }

  // The per-lane analysis below is skipped for scalable vectors.
  if (isa<ScalableVectorType>(Mask->getType()))
    return nullptr;

  // Use masked off lanes to simplify operands via SimplifyDemandedVectorElts
  const APInt LiveLanes = possiblyDemandedEltsInMask(Mask);
  APInt PoisonLanes(LiveLanes.getBitWidth(), 0);
  Value *Simplified =
      SimplifyDemandedVectorElts(II.getOperand(0), LiveLanes, PoisonLanes);
  if (!Simplified)
    return nullptr;
  return replaceOperand(II, 0, Simplified);
}


// Simplify a masked gather intrinsic. The only fold implemented here: with a
// constant all-ones mask and a splat pointer vector, load the scalar once and
// broadcast it. Returns nullptr otherwise.
//
// TODO, Obvious Missing Transforms:
// * Single constant active lane load -> load
// * Dereferenceable address & few lanes -> scalarize speculative load/selects
// * Adjacent vector addresses -> masked.load
// * Narrow width by halves excluding zero/undef lanes
// * Vector incrementing address -> vector masked load
Instruction *InstCombinerImpl::simplifyMaskedGather(IntrinsicInst &II) {
  auto *Mask = dyn_cast<Constant>(II.getArgOperand(2));
  if (!Mask || !Mask->isAllOnesValue())
    return nullptr;

  // Vector splat address w/known mask -> scalar load
  // Fold the gather to load the source vector first lane
  // because it is reloading the same value each time
  Value *CommonPtr = getSplatValue(II.getArgOperand(0));
  if (!CommonPtr)
    return nullptr;

  auto *ResultTy = cast<VectorType>(II.getType());
  const Align Alignment =
      cast<ConstantInt>(II.getArgOperand(1))->getAlignValue();
  LoadInst *Scalar = Builder.CreateAlignedLoad(
      ResultTy->getElementType(), CommonPtr, Alignment, "load.scalar");
  Value *Broadcast = Builder.CreateVectorSplat(ResultTy->getElementCount(),
                                               Scalar, "broadcast");
  return replaceInstUsesWith(II, cast<Instruction>(Broadcast));
}


// Simplify a masked scatter intrinsic with a constant mask: an all-zero mask
// erases the call, a splat pointer vector can collapse to one scalar store,
// and for other fixed-width masks the value and pointer operands are
// simplified using only the lanes the mask may enable. Returns nullptr when
// nothing changes.
//
// TODO, Obvious Missing Transforms:
// * Single constant active lane -> store
// * Adjacent vector addresses -> masked.store
// * Narrow store width by halves excluding zero/undef lanes
// * Vector incrementing address -> vector masked store
Instruction *InstCombinerImpl::simplifyMaskedScatter(IntrinsicInst &II) {
  auto *Mask = dyn_cast<Constant>(II.getArgOperand(3));
  if (!Mask)
    return nullptr;

  // If the mask is all zeros, a scatter does nothing.
  if (Mask->isNullValue())
    return eraseInstFromFunction(II);

  // Vector splat address -> scalar store
  if (Value *CommonPtr = getSplatValue(II.getArgOperand(1))) {
    // Build the (not yet inserted) scalar store shared by both folds below.
    auto MakeScalarStore = [&](Value *Val) -> Instruction * {
      const Align Alignment =
          cast<ConstantInt>(II.getArgOperand(2))->getAlignValue();
      auto *St =
          new StoreInst(Val, CommonPtr, /*IsVolatile=*/false, Alignment);
      St->copyMetadata(II);
      return St;
    };

    // scatter(splat(value), splat(ptr), non-zero-mask) -> store value, ptr
    Value *CommonVal = getSplatValue(II.getArgOperand(0));
    if (CommonVal && maskContainsAllOneOrUndef(Mask))
      return MakeScalarStore(CommonVal);

    // scatter(vector, splat(ptr), splat(true)) -> store extract(vector,
    // lastlane), ptr
    if (Mask->isAllOnesValue()) {
      auto *PtrVecTy = cast<VectorType>(II.getArgOperand(1)->getType());
      const ElementCount NumLanes = PtrVecTy->getElementCount();
      Value *RuntimeLanes =
          Builder.CreateElementCount(Builder.getInt32Ty(), NumLanes);
      Value *LastIdx = Builder.CreateSub(RuntimeLanes, Builder.getInt32(1));
      Value *LastVal =
          Builder.CreateExtractElement(II.getArgOperand(0), LastIdx);
      return MakeScalarStore(LastVal);
    }
  }

  // The per-lane analysis below is skipped for scalable vectors.
  if (isa<ScalableVectorType>(Mask->getType()))
    return nullptr;

  // Use masked off lanes to simplify operands via SimplifyDemandedVectorElts
  // (value operand first, then the pointer operand).
  const APInt LiveLanes = possiblyDemandedEltsInMask(Mask);
  APInt PoisonLanes(LiveLanes.getBitWidth(), 0);
  for (unsigned OpIdx : {0u, 1u})
    if (Value *Simplified = SimplifyDemandedVectorElts(
            II.getOperand(OpIdx), LiveLanes, PoisonLanes))
      return replaceOperand(II, OpIdx, Simplified);

  return nullptr;
}


/// Collapse chains of launder.invariant.group / strip.invariant.group calls
/// feeding \p II so that only the outermost operation remains:
///   launder(launder(%x)) -> launder(%x)     (the result is not the argument)
///   launder(strip(%x))   -> launder(%x)
///   strip(strip(%x))     -> strip(%x)       (the result is not the argument)
///   strip(launder(%x))   -> strip(%x)
/// This is legal because it preserves the most recent information about
/// the presence or absence of invariant.group.
///
/// \returns the replacement instruction built with \p IC's builder, or
/// nullptr when the argument of \p II is not itself a launder/strip call.
static Instruction *simplifyInvariantGroupIntrinsic(IntrinsicInst &II,
                                                    InstCombinerImpl &IC) {
  Value *Outermost = II.getArgOperand(0)->stripPointerCasts();

  auto IsInvariantGroupCall = [](const IntrinsicInst *Call) {
    switch (Call->getIntrinsicID()) {
    case Intrinsic::launder_invariant_group:
    case Intrinsic::strip_invariant_group:
      return true;
    default:
      return false;
    }
  };

  // Peel launder/strip calls (looking through pointer casts) until something
  // else is reached.
  Value *Innermost = Outermost;
  for (auto *Call = dyn_cast<IntrinsicInst>(Innermost);
       Call && IsInvariantGroupCall(Call);
       Call = dyn_cast<IntrinsicInst>(Innermost))
    Innermost = Call->getArgOperand(0)->stripPointerCasts();

  if (Innermost == Outermost)
    return nullptr; // No launders/strips to remove.

  Value *Replacement = nullptr;
  switch (II.getIntrinsicID()) {
  case Intrinsic::launder_invariant_group:
    Replacement = IC.Builder.CreateLaunderInvariantGroup(Innermost);
    break;
  case Intrinsic::strip_invariant_group:
    Replacement = IC.Builder.CreateStripInvariantGroup(Innermost);
    break;
  default:
    llvm_unreachable(
        "simplifyInvariantGroupIntrinsic only handles launder and strip");
  }

  // Looking through casts may have changed the address space; cast back to
  // the type II produced.
  const unsigned WantedAS = II.getType()->getPointerAddressSpace();
  if (Replacement->getType()->getPointerAddressSpace() != WantedAS)
    Replacement = IC.Builder.CreateAddrSpaceCast(Replacement, II.getType());

  return cast<Instruction>(Replacement);
}


/// Fold a call to llvm.cttz or llvm.ctlz.
///
/// The folds are tried strictly in the order written; the first that applies
/// decides the result. Operand 0 is the value being counted, operand 1 is the
/// flag the comments below call 'ZeroIsPoison'.
///
/// \returns the instruction produced by the fold that fired (which may be
/// \p II itself when it was updated in place), or nullptr if none applied.
static Instruction *foldCttzCtlz(IntrinsicInst &II, InstCombinerImpl &IC) {
  assert((II.getIntrinsicID() == Intrinsic::cttz ||
          II.getIntrinsicID() == Intrinsic::ctlz) &&
         "Expected cttz or ctlz intrinsic");
  const bool CountsTrailing = II.getIntrinsicID() == Intrinsic::cttz;
  Value *Src = II.getArgOperand(0);
  Value *ZeroIsPoison = II.getArgOperand(1);
  Type *ResTy = II.getType();
  auto &B = IC.Builder;

  // The flag operand is inspected by many folds; classify it once.
  const bool FlagIsZero = match(ZeroIsPoison, m_Zero());
  const bool FlagIsOne = match(ZeroIsPoison, m_One());

  Value *X;
  // ctlz(bitreverse(x)) -> cttz(x)
  // cttz(bitreverse(x)) -> ctlz(x)
  if (match(Src, m_BitReverse(m_Value(X)))) {
    const Intrinsic::ID Mirrored =
        CountsTrailing ? Intrinsic::ctlz : Intrinsic::cttz;
    Function *Decl = Intrinsic::getDeclaration(II.getModule(), Mirrored, ResTy);
    return CallInst::Create(Decl, {X, ZeroIsPoison});
  }

  if (ResTy->isIntOrIntVectorTy(1)) {
    // ctlz/cttz i1 Op0 --> not Op0
    if (FlagIsZero)
      return BinaryOperator::CreateNot(Src);
    // If zero is poison, then the input can be assumed to be "true", so the
    // instruction simplifies to "false".
    assert(match(ZeroIsPoison, m_One()) &&
           "Expected ctlz/cttz operand to be 0 or 1");
    return IC.replaceInstUsesWith(II, ConstantInt::getNullValue(ResTy));
  }

  // If ctlz/cttz is only used as a shift amount, set is_zero_poison to true.
  if (II.hasOneUse() && FlagIsZero &&
      match(II.user_back(), m_Shift(m_Value(), m_Specific(&II))))
    return IC.replaceOperand(II, 1, B.getTrue());

  Constant *ShiftedC;

  if (CountsTrailing) {
    // cttz(-x) -> cttz(x)
    if (match(Src, m_Neg(m_Value(X))))
      return IC.replaceOperand(II, 0, X);

    // cttz(-x & x) -> cttz(x)
    if (match(Src, m_c_And(m_Neg(m_Value(X)), m_Deferred(X))))
      return IC.replaceOperand(II, 0, X);

    // cttz(sext(x)) -> cttz(zext(x))
    if (match(Src, m_OneUse(m_SExt(m_Value(X))))) {
      Value *Widened = B.CreateZExt(X, ResTy);
      Value *NewCttz =
          B.CreateBinaryIntrinsic(Intrinsic::cttz, Widened, ZeroIsPoison);
      return IC.replaceInstUsesWith(II, NewCttz);
    }

    // Zext doesn't change the number of trailing zeros, so narrow:
    // cttz(zext(x)) -> zext(cttz(x)) if the 'ZeroIsPoison' parameter is 'true'.
    if (match(Src, m_OneUse(m_ZExt(m_Value(X)))) && FlagIsOne) {
      Value *NarrowCttz =
          B.CreateBinaryIntrinsic(Intrinsic::cttz, X, B.getTrue());
      Value *Widened = B.CreateZExt(NarrowCttz, ResTy);
      return IC.replaceInstUsesWith(II, Widened);
    }

    // cttz(abs(x)) -> cttz(x)
    // cttz(nabs(x)) -> cttz(x)
    Value *Y;
    const SelectPatternFlavor Flavor = matchSelectPattern(Src, X, Y).Flavor;
    if (Flavor == SPF_ABS || Flavor == SPF_NABS)
      return IC.replaceOperand(II, 0, X);

    if (match(Src, m_Intrinsic<Intrinsic::abs>(m_Value(X))))
      return IC.replaceOperand(II, 0, X);

    // cttz(shl(%const, %val), 1) --> add(cttz(%const, 1), %val)
    if (match(Src, m_Shl(m_ImmConstant(ShiftedC), m_Value(X))) && FlagIsOne) {
      Value *BaseCount =
          B.CreateBinaryIntrinsic(Intrinsic::cttz, ShiftedC, ZeroIsPoison);
      return BinaryOperator::CreateAdd(BaseCount, X);
    }

    // cttz(lshr exact (%const, %val), 1) --> sub(cttz(%const, 1), %val)
    if (match(Src, m_Exact(m_LShr(m_ImmConstant(ShiftedC), m_Value(X)))) &&
        FlagIsOne) {
      Value *BaseCount =
          B.CreateBinaryIntrinsic(Intrinsic::cttz, ShiftedC, ZeroIsPoison);
      return BinaryOperator::CreateSub(BaseCount, X);
    }

    // cttz(add(lshr(UINT_MAX, %val), 1)) --> sub(width, %val)
    if (match(Src, m_Add(m_LShr(m_AllOnes(), m_Value(X)), m_One()))) {
      Value *Width = ConstantInt::get(ResTy, ResTy->getScalarSizeInBits());
      return BinaryOperator::CreateSub(Width, X);
    }
  } else {
    // ctlz(lshr(%const, %val), 1) --> add(ctlz(%const, 1), %val)
    if (match(Src, m_LShr(m_ImmConstant(ShiftedC), m_Value(X))) && FlagIsOne) {
      Value *BaseCount =
          B.CreateBinaryIntrinsic(Intrinsic::ctlz, ShiftedC, ZeroIsPoison);
      return BinaryOperator::CreateAdd(BaseCount, X);
    }

    // ctlz(shl nuw (%const, %val), 1) --> sub(ctlz(%const, 1), %val)
    if (match(Src, m_NUWShl(m_ImmConstant(ShiftedC), m_Value(X))) &&
        FlagIsOne) {
      Value *BaseCount =
          B.CreateBinaryIntrinsic(Intrinsic::ctlz, ShiftedC, ZeroIsPoison);
      return BinaryOperator::CreateSub(BaseCount, X);
    }
  }

  const KnownBits Known = IC.computeKnownBits(Src, 0, &II);

  // Bounds on the count: the bits above (ctlz) or below (cttz) the first
  // known one.
  const unsigned MaxZeros = CountsTrailing ? Known.countMaxTrailingZeros()
                                           : Known.countMaxLeadingZeros();
  const unsigned MinZeros = CountsTrailing ? Known.countMinTrailingZeros()
                                           : Known.countMinLeadingZeros();

  // If all bits above (ctlz) or below (cttz) the first known one are known
  // zero, this value is constant.
  // FIXME: This should be in InstSimplify because we're replacing an
  // instruction with a constant.
  if (MaxZeros == MinZeros) {
    Constant *Count = ConstantInt::get(Src->getType(), MinZeros);
    return IC.replaceInstUsesWith(II, Count);
  }

  // If the input to cttz/ctlz is known to be non-zero,
  // then change the 'ZeroIsPoison' parameter to 'true'
  // because we know the zero behavior can't affect the result.
  if (!Known.One.isZero() ||
      isKnownNonZero(Src, IC.getSimplifyQuery().getWithInstruction(&II))) {
    if (!FlagIsOne)
      return IC.replaceOperand(II, 1, B.getTrue());
  }

  // Add range attribute since known bits can't completely reflect what we know.
  const unsigned BitWidth = Src->getType()->getScalarSizeInBits();
  const bool AlreadyRanged = II.hasRetAttr(Attribute::Range) ||
                             II.getMetadata(LLVMContext::MD_range);
  if (BitWidth == 1 || AlreadyRanged)
    return nullptr;

  const ConstantRange Range(APInt(BitWidth, MinZeros),
                            APInt(BitWidth, MaxZeros + 1));
  II.addRangeRetAttr(Range);
  return &II;
}


/// Fold a call to llvm.ctpop.
///
/// The folds are tried strictly in the order written; the first that applies
/// decides the result.
///
/// \returns the instruction produced by the fold that fired (which may be
/// \p II itself when it was updated in place), or nullptr if none applied.
static Instruction *foldCtpop(IntrinsicInst &II, InstCombinerImpl &IC) {
  assert(II.getIntrinsicID() == Intrinsic::ctpop &&
         "Expected ctpop intrinsic");
  Type *ResTy = II.getType();
  const unsigned NumBits = ResTy->getScalarSizeInBits();
  Value *Src = II.getArgOperand(0);
  auto &B = IC.Builder;
  Value *X, *Y;

  // Declaration of llvm.cttz for the result type; used by two folds below.
  auto GetCttzDecl = [&]() -> Function * {
    return Intrinsic::getDeclaration(II.getModule(), Intrinsic::cttz, ResTy);
  };

  // ctpop(bitreverse(x)) -> ctpop(x)
  // ctpop(bswap(x)) -> ctpop(x)
  if (match(Src, m_BitReverse(m_Value(X))) || match(Src, m_BSwap(m_Value(X))))
    return IC.replaceOperand(II, 0, X);

  // ctpop(rot(x)) -> ctpop(x)
  // A funnel shift whose two data operands are the same value is a rotate.
  const bool IsFunnelShift =
      match(Src, m_FShl(m_Value(X), m_Value(Y), m_Value())) ||
      match(Src, m_FShr(m_Value(X), m_Value(Y), m_Value()));
  if (IsFunnelShift && X == Y)
    return IC.replaceOperand(II, 0, X);

  // ctpop(x | -x) -> bitwidth - cttz(x, false)
  if (Src->hasOneUse() &&
      match(Src, m_c_Or(m_Value(X), m_Neg(m_Deferred(X))))) {
    Value *Cttz = B.CreateCall(GetCttzDecl(), {X, B.getFalse()});
    Constant *Width = ConstantInt::get(ResTy, APInt(NumBits, NumBits));
    return IC.replaceInstUsesWith(II, B.CreateSub(Width, Cttz));
  }

  // ctpop(~x & (x - 1)) -> cttz(x, false)
  if (match(Src,
            m_c_And(m_Not(m_Value(X)), m_Add(m_Deferred(X), m_AllOnes()))))
    return CallInst::Create(GetCttzDecl(), {X, B.getFalse()});

  // Zext doesn't change the number of set bits, so narrow:
  // ctpop (zext X) --> zext (ctpop X)
  if (match(Src, m_OneUse(m_ZExt(m_Value(X))))) {
    Value *NarrowPop = B.CreateUnaryIntrinsic(Intrinsic::ctpop, X);
    return CastInst::Create(Instruction::ZExt, NarrowPop, ResTy);
  }

  KnownBits Known(NumBits);
  IC.computeKnownBits(Src, Known, 0, &II);

  // If all bits are zero except for exactly one fixed bit, then the result
  // must be 0 or 1, and we can get that answer by shifting to LSB:
  // ctpop (X & 32) --> (X & 32) >> 5
  // TODO: Investigate removing this as it's likely unnecessary given the below
  // `isKnownToBeAPowerOfTwo` check.
  const APInt PossiblySet = ~Known.Zero;
  if (PossiblySet.isPowerOf2())
    return BinaryOperator::CreateLShr(
        Src, ConstantInt::get(ResTy, PossiblySet.exactLogBase2()));

  // More generally we can also handle non-constant power of 2 patterns such as
  // shl/shr(Pow2, X), (X & -X), etc... by transforming:
  // ctpop(Pow2OrZero) --> icmp ne X, 0
  if (IC.isKnownToBeAPowerOfTwo(Src, /* OrZero */ true)) {
    Value *IsNonZero =
        B.CreateICmp(ICmpInst::ICMP_NE, Src, Constant::getNullValue(ResTy));
    return CastInst::Create(Instruction::ZExt, IsNonZero, ResTy);
  }

  // Add range attribute since known bits can't completely reflect what we know.
  const bool AlreadyRanged = II.hasRetAttr(Attribute::Range) ||
                             II.getMetadata(LLVMContext::MD_range);
  if (NumBits == 1 || AlreadyRanged)
    return nullptr;

  const ConstantRange Range(APInt(NumBits, Known.countMinPopulation()),
                            APInt(NumBits, Known.countMaxPopulation() + 1));
  II.addRangeRetAttr(Range);
  return &II;
}


/// Convert a table lookup to shufflevector if the mask is constant.
/// This could benefit tbl1 if the mask is { 7,6,5,4,3,2,1,0 }, in
/// which case we could lower the shufflevector with rev64 instructions
/// as it's actually a byte reverse.
///
/// \param II      the table-lookup intrinsic call; operand 0 is the table and
///                operand 1 the index mask.
/// \param Builder builder used to create the shufflevector.
/// \returns the shufflevector value, or nullptr when the mask is not a
/// constant, the result is not an <8 x i8> vector, or any mask lane is not a
/// constant integer in the range [0, 8).
static Value *simplifyNeonTbl1(const IntrinsicInst &II,
                               InstCombiner::BuilderTy &Builder) {
  // Bail out if the mask is not a constant.
  auto *MaskC = dyn_cast<Constant>(II.getArgOperand(1));
  if (!MaskC)
    return nullptr;

  auto *VecTy = cast<FixedVectorType>(II.getType());
  const unsigned NumElts = VecTy->getNumElements();

  // Only perform this transformation for <8 x i8> vector types.
  if (!VecTy->getElementType()->isIntegerTy(8) || NumElts != 8)
    return nullptr;

  int Indexes[8];

  for (unsigned I = 0; I < NumElts; ++I) {
    // A missing lane or a lane that is not a plain integer constant (e.g.
    // undef) cannot be turned into a shuffle index.
    auto *IdxC = dyn_cast_or_null<ConstantInt>(MaskC->getAggregateElement(I));
    if (!IdxC)
      return nullptr;

    // Make sure the mask indices are in range. The check is done on the
    // full-width value, before narrowing to int, so that a large index can
    // never be truncated into one that looks valid.
    const uint64_t Idx = IdxC->getLimitedValue();
    if (Idx >= NumElts)
      return nullptr;

    Indexes[I] = static_cast<int>(Idx);
  }

  // All indices select from the first shuffle operand; the second operand is
  // a zero vector of the same type.
  auto *V1 = II.getArgOperand(0);
  auto *V2 = Constant::getNullValue(V1->getType());
  return Builder.CreateShuffleVector(V1, V2, ArrayRef(Indexes));
}


// Returns true iff the 2 intrinsics have the same operands, limiting the

// comparison to the first NumOperands.

static bool haveSameOperands(const IntrinsicInst &I, const IntrinsicInst &E,

                             unsigned NumOperands) {

  assert(I.arg_size() >= NumOperands && "Not enough operands");

  assert(E.arg_size() >= NumOperands && "Not enough operands");

  for (unsigned i = 0; i < NumOperands; i++)

    if (I.getArgOperand(i) != E.getArgOperand(i))

      return false;

  return true;

}


// Remove trivially empty start/end intrinsic ranges, i.e. a start
// immediately followed by an end (ignoring debuginfo or other
// start/end intrinsics in between). As this handles only the most trivial
// cases, tracking the nesting level is not needed:
//
//   call @llvm.foo.start(i1 0)
//   call @llvm.foo.start(i1 0) ; This one won't be skipped: it will be removed
//   call @llvm.foo.end(i1 0)
//   call @llvm.foo.end(i1 0) ; &I
//
// IsStart tells whether an intrinsic opens a range that EndI can close.
// Returns true when a matching start was found, in which case both that start
// and EndI have been erased through IC; returns false otherwise.
static bool
removeTriviallyEmptyRange(IntrinsicInst &EndI, InstCombinerImpl &IC,
                          std::function<bool(const IntrinsicInst &)> IsStart) {
  // We start from the end intrinsic and scan backwards, so that InstCombine
  // has already processed (and potentially removed) all the instructions
  // before the end intrinsic.
  BasicBlock::reverse_iterator Cursor(EndI);
  const BasicBlock::reverse_iterator Stop = EndI.getParent()->rend();
  for (; Cursor != Stop; ++Cursor) {
    // Any non-intrinsic instruction means the range is not trivially empty.
    auto *Candidate = dyn_cast<IntrinsicInst>(&*Cursor);
    if (!Candidate)
      return false;

    // Debug/pseudo intrinsics and other end intrinsics of the same kind
    // (including EndI itself, where the scan begins) are stepped over.
    if (Candidate->isDebugOrPseudoInst() ||
        Candidate->getIntrinsicID() == EndI.getIntrinsicID())
      continue;

    // Any other intrinsic that is not a start also ends the search.
    if (!IsStart(*Candidate))
      return false;

    // Skip start intrinsics that don't pair with this end intrinsic.
    if (!haveSameOperands(EndI, *Candidate, EndI.arg_size()))
      continue;

    IC.eraseInstFromFunction(*Candidate);
    IC.eraseInstFromFunction(EndI);
    return true;
  }

  return false;
}


/// Visit a va_end call: if it directly closes a matching va_start or va_copy
/// (as determined by removeTriviallyEmptyRange), both calls are erased.
/// Always returns nullptr.
Instruction *InstCombinerImpl::visitVAEndInst(VAEndInst &I) {
  // Intrinsics that open a range a va_end can close.
  const auto OpensVAList = [](const IntrinsicInst &Candidate) {
    const Intrinsic::ID ID = Candidate.getIntrinsicID();
    return ID == Intrinsic::vastart || ID == Intrinsic::vacopy;
  };
  removeTriviallyEmptyRange(I, *this, OpensVAList);
  return nullptr;
}


/// Swap arguments 0 and 1 of \p Call when argument 0 is a Constant and
/// argument 1 is not, so that the constant ends up in the second slot.
/// \returns \p Call if the arguments were swapped, nullptr if nothing changed.
/// This helper does not check that the swap is legal for the callee.
static CallInst *canonicalizeConstantArg0ToArg1(CallInst &Call) {
  assert(Call.arg_size() > 1 && "Need at least 2 args to swap");

  Value *First = Call.getArgOperand(0);
  Value *Second = Call.getArgOperand(1);

  // Already canonical unless exactly the first argument is the constant one.
  if (!isa<Constant>(First) || isa<Constant>(Second))
    return nullptr;

  Call.setArgOperand(0, Second);
  Call.setArgOperand(1, First);
  return &Call;
}


/// Build the {result, overflow-bit} aggregate for the overflow intrinsic
/// \p II from a (possibly non-constant) \p Result and a constant \p Overflow.
/// The returned insertvalue instruction is created without an insertion
/// point; it writes \p Result into field 0 of a constant struct whose field 0
/// is poison and whose field 1 is \p Overflow.
static Instruction *createOverflowTuple(IntrinsicInst *II, Value *Result,
                                        Constant *Overflow) {
  Constant *Fields[] = {PoisonValue::get(Result->getType()), Overflow};
  auto *TupleTy = cast<StructType>(II->getType());
  return InsertValueInst::Create(ConstantStruct::get(TupleTy, Fields), Result,
                                 0);
}


/// Common fold for the *.with.overflow intrinsics: if OptimizeOverflowCheck
/// succeeds for the operation performed by \p II, replace the call with the
/// result tuple it produced. \returns the new instruction, or nullptr when
/// no fold applies.
Instruction *
InstCombinerImpl::foldIntrinsicWithOverflowCommon(IntrinsicInst *II) {
  auto *WO = cast<WithOverflowInst>(II);

  // Filled in by OptimizeOverflowCheck on success.
  Value *OperationResult = nullptr;
  Constant *OverflowResult = nullptr;
  const bool Folded =
      OptimizeOverflowCheck(WO->getBinaryOp(), WO->isSigned(), WO->getLHS(),
                            WO->getRHS(), *WO, OperationResult, OverflowResult);
  if (!Folded)
    return nullptr;

  return createOverflowTuple(WO, OperationResult, OverflowResult);
}


static bool inputDenormalIsIEEE(const Function &F, const Type *Ty) {

  Ty = Ty->getScalarType();

  return F.getDenormalMode(Ty->getFltSemantics()).Input == DenormalMode::IEEE;

}


static bool inputDenormalIsDAZ(const Function &F, const Type *Ty) {

  Ty = Ty->getScalarType();

  return F.getDenormalMode(Ty->getFltSemantics()).inputsAreZero();

}


/// \returns the ordered compare predicate P such that the test performed by
/// llvm.is.fpclass(x, \p Mask) is equivalent to `fcmp P x, 0.0` under the
/// input denormal mode that \p F uses for type \p Ty, or
/// FCmpInst::BAD_FCMP_PREDICATE if \p Mask is not one of the recognized
/// patterns or the denormal mode does not match the pattern's requirement.
static FCmpInst::Predicate fpclassTestIsFCmp0(FPClassTest Mask,
                                              const Function &F, Type *Ty) {
  // Every recognized mask is tied to one input denormal mode. These helpers
  // hand back the predicate when that mode is in effect and the failure
  // value otherwise.
  auto IfIEEE = [&](FCmpInst::Predicate Pred) -> FCmpInst::Predicate {
    return inputDenormalIsIEEE(F, Ty) ? Pred : FCmpInst::BAD_FCMP_PREDICATE;
  };
  auto IfDAZ = [&](FCmpInst::Predicate Pred) -> FCmpInst::Predicate {
    return inputDenormalIsDAZ(F, Ty) ? Pred : FCmpInst::BAD_FCMP_PREDICATE;
  };

  switch (static_cast<unsigned>(Mask)) {
  // x == 0
  case fcZero:
    return IfIEEE(FCmpInst::FCMP_OEQ);
  case fcZero | fcSubnormal:
    return IfDAZ(FCmpInst::FCMP_OEQ);

  // x >= 0
  case fcPositive | fcNegZero:
    return IfIEEE(FCmpInst::FCMP_OGE);
  case fcPositive | fcNegZero | fcNegSubnormal:
    return IfDAZ(FCmpInst::FCMP_OGE);

  // x > 0
  case fcPosSubnormal | fcPosNormal | fcPosInf:
    return IfIEEE(FCmpInst::FCMP_OGT);
  case fcPosNormal | fcPosInf:
    return IfDAZ(FCmpInst::FCMP_OGT);

  // x <= 0
  case fcNegative | fcPosZero:
    return IfIEEE(FCmpInst::FCMP_OLE);
  case fcNegative | fcPosZero | fcPosSubnormal:
    return IfDAZ(FCmpInst::FCMP_OLE);

  // x < 0
  case fcNegSubnormal | fcNegNormal | fcNegInf:
    return IfIEEE(FCmpInst::FCMP_OLT);
  case fcNegNormal | fcNegInf:
    return IfDAZ(FCmpInst::FCMP_OLT);

  // x != 0 (and not NaN)
  case ~fcZero & ~fcNan:
    return IfIEEE(FCmpInst::FCMP_ONE);
  case ~(fcZero | fcSubnormal) & ~fcNan:
    return IfDAZ(FCmpInst::FCMP_ONE);

  default:
    return FCmpInst::BAD_FCMP_PREDICATE;
  }
}


/// Try to simplify a call to llvm.is.fpclass.
///
/// The folds are attempted in this order, and the first one that applies
/// wins:
///   1. Look through fneg/fabs on the tested value by adjusting the mask.
///   2. Rewrite infinity tests as an fcmp against +/-inf.
///   3. Rewrite pure NaN / not-NaN tests as fcmp uno / fcmp ord.
///   4. Rewrite tests that fpclassTestIsFCmp0 recognizes as an fcmp with 0.0.
///   5. Use computeKnownFPClass to drop impossible mask bits or fold to true.
/// The fcmp rewrites (2-4) are skipped when the enclosing function has the
/// strictfp attribute.
///
/// \returns the replacement/modified instruction, or nullptr if nothing
/// changed.
Instruction *InstCombinerImpl::foldIntrinsicIsFPClass(IntrinsicInst &II) {
  Value *Src0 = II.getArgOperand(0);
  Value *Src1 = II.getArgOperand(1);
  const ConstantInt *CMask = cast<ConstantInt>(Src1);
  FPClassTest Mask = static_cast<FPClassTest>(CMask->getZExtValue());
  // "Unordered" means the mask accepts every NaN, "ordered" means it accepts
  // no NaN. A mask with only some of the fcNan bits set is neither, and the
  // fcmp-based folds below do not apply to it.
  const bool IsUnordered = (Mask & fcNan) == fcNan;
  const bool IsOrdered = (Mask & fcNan) == fcNone;
  // The mask without its NaN bits, and the non-NaN classes it rejects.
  const FPClassTest OrderedMask = Mask & ~fcNan;
  const FPClassTest OrderedInvertedMask = ~OrderedMask & ~fcNan;

  const bool IsStrict =
      II.getFunction()->getAttributes().hasFnAttr(Attribute::StrictFP);

  Value *FNegSrc;
  if (match(Src0, m_FNeg(m_Value(FNegSrc)))) {
    // is.fpclass (fneg x), mask -> is.fpclass x, (fneg mask)

    II.setArgOperand(1, ConstantInt::get(Src1->getType(), fneg(Mask)));
    return replaceOperand(II, 0, FNegSrc);
  }

  Value *FAbsSrc;
  if (match(Src0, m_FAbs(m_Value(FAbsSrc)))) {
    // is.fpclass (fabs x), mask -> is.fpclass x, (inverse_fabs mask)
    II.setArgOperand(1, ConstantInt::get(Src1->getType(), inverse_fabs(Mask)));
    return replaceOperand(II, 0, FAbsSrc);
  }

  if ((OrderedMask == fcInf || OrderedInvertedMask == fcInf) &&
      (IsOrdered || IsUnordered) && !IsStrict) {
    // is.fpclass(x, fcInf) -> fcmp oeq fabs(x), +inf
    // is.fpclass(x, ~(fcInf|fcNan)) -> fcmp one fabs(x), +inf
    // is.fpclass(x, fcInf|fcNan) -> fcmp ueq fabs(x), +inf
    // is.fpclass(x, ~fcInf) -> fcmp une fabs(x), +inf
    Constant *Inf = ConstantFP::getInfinity(Src0->getType());
    FCmpInst::Predicate Pred =
        IsUnordered ? FCmpInst::FCMP_UEQ : FCmpInst::FCMP_OEQ;
    // The mask selects "everything but infinity": use the negated predicate.
    if (OrderedInvertedMask == fcInf)
      Pred = IsUnordered ? FCmpInst::FCMP_UNE : FCmpInst::FCMP_ONE;

    Value *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, Src0);
    Value *CmpInf = Builder.CreateFCmp(Pred, Fabs, Inf);
    CmpInf->takeName(&II);
    return replaceInstUsesWith(II, CmpInf);
  }

  if ((OrderedMask == fcPosInf || OrderedMask == fcNegInf) &&
      (IsOrdered || IsUnordered) && !IsStrict) {
    // is.fpclass(x, fcPosInf) -> fcmp oeq x, +inf
    // is.fpclass(x, fcNegInf) -> fcmp oeq x, -inf
    // is.fpclass(x, fcPosInf|fcNan) -> fcmp ueq x, +inf
    // is.fpclass(x, fcNegInf|fcNan) -> fcmp ueq x, -inf
    Constant *Inf =
        ConstantFP::getInfinity(Src0->getType(), OrderedMask == fcNegInf);
    Value *EqInf = IsUnordered ? Builder.CreateFCmpUEQ(Src0, Inf)
                               : Builder.CreateFCmpOEQ(Src0, Inf);

    EqInf->takeName(&II);
    return replaceInstUsesWith(II, EqInf);
  }

  if ((OrderedInvertedMask == fcPosInf || OrderedInvertedMask == fcNegInf) &&
      (IsOrdered || IsUnordered) && !IsStrict) {
    // is.fpclass(x, ~(fcPosInf|fcNan)) -> fcmp one x, +inf
    // is.fpclass(x, ~(fcNegInf|fcNan)) -> fcmp one x, -inf
    // is.fpclass(x, ~fcPosInf) -> fcmp une x, +inf
    // is.fpclass(x, ~fcNegInf) -> fcmp une x, -inf
    Constant *Inf = ConstantFP::getInfinity(Src0->getType(),
                                            OrderedInvertedMask == fcNegInf);
    Value *NeInf = IsUnordered ? Builder.CreateFCmpUNE(Src0, Inf)
                               : Builder.CreateFCmpONE(Src0, Inf);
    NeInf->takeName(&II);
    return replaceInstUsesWith(II, NeInf);
  }

  if (Mask == fcNan && !IsStrict) {
    // Equivalent of isnan. Replace with standard fcmp if we don't care about FP
    // exceptions.
    Value *IsNan =
        Builder.CreateFCmpUNO(Src0, ConstantFP::getZero(Src0->getType()));
    IsNan->takeName(&II);
    return replaceInstUsesWith(II, IsNan);
  }

  if (Mask == (~fcNan & fcAllFlags) && !IsStrict) {
    // Equivalent of !isnan. Replace with standard fcmp.
    Value *FCmp =
        Builder.CreateFCmpORD(Src0, ConstantFP::getZero(Src0->getType()));
    FCmp->takeName(&II);
    return replaceInstUsesWith(II, FCmp);
  }

  FCmpInst::Predicate PredType = FCmpInst::BAD_FCMP_PREDICATE;

  // Try to replace with an fcmp with 0
  //
  // is.fpclass(x, fcZero) -> fcmp oeq x, 0.0
  // is.fpclass(x, fcZero | fcNan) -> fcmp ueq x, 0.0
  // is.fpclass(x, ~fcZero & ~fcNan) -> fcmp one x, 0.0
  // is.fpclass(x, ~fcZero) -> fcmp une x, 0.0
  //
  // is.fpclass(x, fcPosSubnormal | fcPosNormal | fcPosInf) -> fcmp ogt x, 0.0
  // is.fpclass(x, fcPositive | fcNegZero) -> fcmp oge x, 0.0
  //
  // is.fpclass(x, fcNegSubnormal | fcNegNormal | fcNegInf) -> fcmp olt x, 0.0
  // is.fpclass(x, fcNegative | fcPosZero) -> fcmp ole x, 0.0
  //
  // The exact masks accepted depend on the function's input denormal mode;
  // see fpclassTestIsFCmp0.
  if (!IsStrict && (IsOrdered || IsUnordered) &&
      (PredType = fpclassTestIsFCmp0(OrderedMask, *II.getFunction(),
                                     Src0->getType())) !=
          FCmpInst::BAD_FCMP_PREDICATE) {
    Constant *Zero = ConstantFP::getZero(Src0->getType());
    // Compare against zero with the predicate found above, switched to its
    // unordered form when the mask also accepts NaN.
    Value *FCmp = Builder.CreateFCmp(
        IsUnordered ? FCmpInst::getUnorderedPredicate(PredType) : PredType,
        Src0, Zero);

    FCmp->takeName(&II);
    return replaceInstUsesWith(II, FCmp);
  }

  // NOTE(review): presumably Known.KnownFPClasses is the set of classes the
  // source value may still belong to -- confirm against computeKnownFPClass.
  KnownFPClass Known = computeKnownFPClass(Src0, Mask, &II);

  // Clear test bits we know must be false from the source value.
  // fp_class (nnan x), qnan|snan|other -> fp_class (nnan x), other
  // fp_class (ninf x), ninf|pinf|other -> fp_class (ninf x), other
  if ((Mask & Known.KnownFPClasses) != Mask) {
    II.setArgOperand(
        1, ConstantInt::get(Src1->getType(), Mask & Known.KnownFPClasses));
    return &II;
  }

  // If none of the tests which can return false are possible, fold to true.
  // fp_class (nnan x), ~(qnan|snan) -> true
  // fp_class (ninf x), ~(ninf|pinf) -> true
  if (Mask == Known.KnownFPClasses)
    return replaceInstUsesWith(II, ConstantInt::get(II.getType(), true));

  return nullptr;
}


/// Try to determine the sign of \p Op at \p CxtI.
/// \returns false if known bits prove \p Op non-negative, true if they prove
/// it negative. Otherwise the answer comes from dominating conditions: for
/// an nsw `X - Y` whether `X <s Y` is implied, else whether `Op <s 0` is
/// implied (whatever isImpliedByDomCondition reports, which may be "unknown").
static std::optional<bool> getKnownSign(Value *Op, Instruction *CxtI,
                                        const DataLayout &DL,
                                        AssumptionCache *AC,
                                        DominatorTree *DT) {
  const KnownBits Bits = computeKnownBits(Op, DL, 0, AC, CxtI, DT);
  if (Bits.isNonNegative())
    return false;
  if (Bits.isNegative())
    return true;

  // sub nsw X, Y is negative exactly when X <s Y.
  Value *Minuend, *Subtrahend;
  if (match(Op, m_NSWSub(m_Value(Minuend), m_Value(Subtrahend))))
    return isImpliedByDomCondition(ICmpInst::ICMP_SLT, Minuend, Subtrahend,
                                   CxtI, DL);

  Constant *Zero = Constant::getNullValue(Op->getType());
  return isImpliedByDomCondition(ICmpInst::ICMP_SLT, Op, Zero, CxtI, DL);
}


/// Like getKnownSign, but when that query is inconclusive and \p Op is an
/// nsw `X - Y`, additionally ask whether `X <=s Y` is implied by a
/// dominating condition. \returns std::nullopt when nothing can be concluded.
static std::optional<bool> getKnownSignOrZero(Value *Op, Instruction *CxtI,
                                              const DataLayout &DL,
                                              AssumptionCache *AC,
                                              DominatorTree *DT) {
  const std::optional<bool> StrictSign = getKnownSign(Op, CxtI, DL, AC, DT);
  if (StrictSign.has_value())
    return StrictSign;

  Value *Minuend, *Subtrahend;
  if (!match(Op, m_NSWSub(m_Value(Minuend), m_Value(Subtrahend))))
    return std::nullopt;

  return isImpliedByDomCondition(ICmpInst::ICMP_SLE, Minuend, Subtrahend, CxtI,
                                 DL);
}


/// Return true if the signs of both \p Op0 and \p Op1 can be determined with
/// getKnownSign and they agree. An undetermined sign on either side yields
/// false.
static bool signBitMustBeTheSame(Value *Op0, Value *Op1, Instruction *CxtI,
                                 const DataLayout &DL, AssumptionCache *AC,
                                 DominatorTree *DT) {
  // Query Op1 first; Op0 is only analyzed when Op1's sign is known.
  const std::optional<bool> Sign1 = getKnownSign(Op1, CxtI, DL, AC, DT);
  if (!Sign1.has_value())
    return false;

  const std::optional<bool> Sign0 = getKnownSign(Op0, CxtI, DL, AC, DT);
  return Sign0.has_value() && *Sign0 == *Sign1;
}


/// Try to canonicalize min/max(X + C0, C1) as min/max(X, C1 - C0) + C0. This
/// can trigger other combines.
///
/// The add must have a single use and carry the no-wrap flag matching the
/// signedness of the min/max (nsw for smin/smax, nuw for umin/umax).
/// \returns the new add (not yet inserted), or nullptr if the pattern does
/// not match.
static Instruction *moveAddAfterMinMax(IntrinsicInst *II,
                                       InstCombiner::BuilderTy &Builder) {
  const Intrinsic::ID MinMaxID = II->getIntrinsicID();
  assert((MinMaxID == Intrinsic::smax || MinMaxID == Intrinsic::smin ||
          MinMaxID == Intrinsic::umax || MinMaxID == Intrinsic::umin) &&
         "Expected a min or max intrinsic");

  // TODO: Match vectors with undef elements, but undef may not propagate.
  Value *AddOp = II->getArgOperand(0);
  Value *LimitOp = II->getArgOperand(1);
  Value *X;
  const APInt *C0, *C1;
  if (!match(AddOp, m_OneUse(m_Add(m_Value(X), m_APInt(C0)))) ||
      !match(LimitOp, m_APInt(C1)))
    return nullptr;

  // The add needs the no-wrap flag that corresponds to the min/max flavor.
  const bool IsSigned =
      MinMaxID == Intrinsic::smax || MinMaxID == Intrinsic::smin;
  auto *Add = cast<BinaryOperator>(AddOp);
  const bool HasMatchingNoWrap =
      IsSigned ? Add->hasNoSignedWrap() : Add->hasNoUnsignedWrap();
  if (!HasMatchingNoWrap)
    return nullptr;

  // If the constant difference overflows, then instsimplify should reduce the
  // min/max to the add or C1.
  bool Overflow;
  APInt CDiff =
      IsSigned ? C1->ssub_ov(*C0, Overflow) : C1->usub_ov(*C0, Overflow);
  assert(!Overflow && "Expected simplify of min/max");

  // min/max (add X, C0), C1 --> add (min/max X, C1 - C0), C0
  // Note: the "mismatched" no-overflow setting does not propagate.
  Constant *NewMinMaxC = ConstantInt::get(II->getType(), CDiff);
  Value *NewMinMax = Builder.CreateBinaryIntrinsic(MinMaxID, X, NewMinMaxC);
  Value *AddC = Add->getOperand(1);
  if (IsSigned)
    return BinaryOperator::CreateNSWAdd(NewMinMax, AddC);
  return BinaryOperator::CreateNUWAdd(NewMinMax, AddC);
}

/// Match a sadd_sat or ssub_sat which is using min/max to clamp the value.
///
/// \p MinMax1 is the outer smin/smax. On success the add/sub is redone as a
/// saturating intrinsic in a narrower type and the (not yet inserted) sext
/// back to the original type is returned; otherwise nullptr.
Instruction *InstCombinerImpl::matchSAddSubSat(IntrinsicInst &MinMax1) {
  Type *Ty = MinMax1.getType();

  // We are looking for a tree of:
  // max(INT_MIN, min(INT_MAX, add(sext(A), sext(B))))
  // Where the min and max could be reversed
  Instruction *MinMax2;
  BinaryOperator *AddSub;
  const APInt *MinValue, *MaxValue;
  bool IsClampTree = false;
  if (match(&MinMax1, m_SMin(m_Instruction(MinMax2), m_APInt(MaxValue))))
    IsClampTree = match(MinMax2, m_SMax(m_BinOp(AddSub), m_APInt(MinValue)));
  else if (match(&MinMax1, m_SMax(m_Instruction(MinMax2), m_APInt(MinValue))))
    IsClampTree = match(MinMax2, m_SMin(m_BinOp(AddSub), m_APInt(MaxValue)));
  if (!IsClampTree)
    return nullptr;

  // Check that the constants clamp a saturate, and that the new type would be
  // sensible to convert to: the bounds must be [-2^k, 2^k - 1].
  const APInt MaxPlusOne = *MaxValue + 1;
  if (!MaxPlusOne.isPowerOf2() || -*MinValue != MaxPlusOne)
    return nullptr;

  // In what bitwidth can this be treated as saturating arithmetics?
  const unsigned NewBitWidth = MaxPlusOne.logBase2() + 1;

  // FIXME: This isn't quite right for vectors, but using the scalar type is a
  // good first approximation for what should be done there.
  const unsigned OldBitWidth = Ty->getScalarType()->getIntegerBitWidth();
  if (!shouldChangeType(OldBitWidth, NewBitWidth))
    return nullptr;

  // Also make sure that the inner min/max and the add/sub have one use.
  if (!MinMax2->hasOneUse() || !AddSub->hasOneUse())
    return nullptr;

  // Create the new type (which can be a vector type)
  Type *NewTy = Ty->getWithNewBitWidth(NewBitWidth);

  Intrinsic::ID IntrinsicID;
  switch (AddSub->getOpcode()) {
  case Instruction::Add:
    IntrinsicID = Intrinsic::sadd_sat;
    break;
  case Instruction::Sub:
    IntrinsicID = Intrinsic::ssub_sat;
    break;
  default:
    return nullptr;
  }

  // The two operands of the add/sub must be nsw-truncatable to the NewTy. This
  // is usually achieved via a sext from a smaller type.
  Value *LHS = AddSub->getOperand(0);
  Value *RHS = AddSub->getOperand(1);
  auto NeedsMoreBits = [&](Value *V) {
    return ComputeMaxSignificantBits(V, 0, AddSub) > NewBitWidth;
  };
  if (NeedsMoreBits(LHS) || NeedsMoreBits(RHS))
    return nullptr;

  // Finally create and return the sat intrinsic, truncated to the new type
  Function *F =
      Intrinsic::getDeclaration(MinMax1.getModule(), IntrinsicID, NewTy);
  Value *AT = Builder.CreateTrunc(LHS, NewTy);
  Value *BT = Builder.CreateTrunc(RHS, NewTy);
  Value *Sat = Builder.CreateCall(F, {AT, BT});
  return CastInst::Create(Instruction::SExt, Sat, Ty);
}


/// If we have a clamp pattern like max (min X, 42), 41 -- where the output
/// can only be one of two possible constant values -- turn that into a select
/// of constants.
///
/// The inner min/max must have a single use. \returns the new select (not yet
/// inserted), or nullptr if the pattern does not match.
static Instruction *foldClampRangeOfTwo(IntrinsicInst *II,
                                        InstCombiner::BuilderTy &Builder) {
  Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);
  const APInt *C0, *C1;
  if (!match(I1, m_APInt(C1)) || !I0->hasOneUse())
    return nullptr;

  // For each outer op, require the opposite inner op with a constant exactly
  // one step away from the outer constant, and note the compare that picks
  // the inner constant.
  Value *X;
  bool IsRangeOfTwo = false;
  CmpInst::Predicate Pred = CmpInst::BAD_ICMP_PREDICATE;
  switch (II->getIntrinsicID()) {
  case Intrinsic::smax:
    IsRangeOfTwo =
        match(I0, m_SMin(m_Value(X), m_APInt(C0))) && *C0 == *C1 + 1;
    Pred = ICmpInst::ICMP_SGT;
    break;
  case Intrinsic::smin:
    IsRangeOfTwo =
        match(I0, m_SMax(m_Value(X), m_APInt(C0))) && *C1 == *C0 + 1;
    Pred = ICmpInst::ICMP_SLT;
    break;
  case Intrinsic::umax:
    IsRangeOfTwo =
        match(I0, m_UMin(m_Value(X), m_APInt(C0))) && *C0 == *C1 + 1;
    Pred = ICmpInst::ICMP_UGT;
    break;
  case Intrinsic::umin:
    IsRangeOfTwo =
        match(I0, m_UMax(m_Value(X), m_APInt(C0))) && *C1 == *C0 + 1;
    Pred = ICmpInst::ICMP_ULT;
    break;
  default:
    llvm_unreachable("Expected min/max intrinsic");
  }
  if (!IsRangeOfTwo)
    return nullptr;

  // max (min X, 42), 41 --> X > 41 ? 42 : 41
  // min (max X, 42), 43 --> X < 43 ? 42 : 43
  Value *Cmp = Builder.CreateICmp(Pred, X, I1);
  Constant *InnerC = ConstantInt::get(II->getType(), *C0);
  return SelectInst::Create(Cmp, InnerC, I1);
}


/// If this min/max has a constant operand and an operand that is a matching
/// min/max with a constant operand, constant-fold the 2 constant operands.
///
/// \returns the new min/max created through \p Builder, or nullptr if the
/// pattern does not match.
static Value *reassociateMinMaxWithConstants(IntrinsicInst *II,
                                             IRBuilderBase &Builder,
                                             const SimplifyQuery &SQ) {
  auto *Inner = dyn_cast<MinMaxIntrinsic>(II->getArgOperand(0));
  if (!Inner)
    return nullptr;

  Constant *C0, *C1;
  if (!match(Inner->getArgOperand(1), m_ImmConstant(C0)) ||
      !match(II->getArgOperand(1), m_ImmConstant(C1)))
    return nullptr;

  // max (max X, C0), C1 --> max X, (max C0, C1)
  // min (min X, C0), C1 --> min X, (min C0, C1)
  // umax (smax X, nneg C0), nneg C1 --> smax X, (umax C0, C1)
  // smin (umin X, nneg C0), nneg C1 --> umin X, (smin C0, C1)
  const Intrinsic::ID OuterID = II->getIntrinsicID();
  const Intrinsic::ID InnerID = Inner->getIntrinsicID();
  if (InnerID != OuterID) {
    // Differing ops are only accepted for the two mixed-sign pairs above, and
    // only when both constants are known non-negative.
    const bool IsMixedSignPair =
        (OuterID == Intrinsic::umax && InnerID == Intrinsic::smax) ||
        (OuterID == Intrinsic::smin && InnerID == Intrinsic::umin);
    if (!IsMixedSignPair || !isKnownNonNegative(C0, SQ) ||
        !isKnownNonNegative(C1, SQ))
      return nullptr;
  }

  // Combine the two constants with the outer operation, expressed as
  // icmp + select, and apply the inner operation to X and the result.
  const ICmpInst::Predicate Pred = MinMaxIntrinsic::getPredicate(OuterID);
  Value *PickC0 = Builder.CreateICmp(Pred, C0, C1);
  Value *FoldedC = Builder.CreateSelect(PickC0, C0, C1);
  return Builder.CreateIntrinsic(InnerID, II->getType(),
                                 {Inner->getArgOperand(0), FoldedC});
}


/// If this min/max has a matching min/max operand with a constant, try to push
/// the constant operand into this instruction. This can enable more folds.
///
/// \returns the new outer call (not yet inserted), or nullptr if the pattern
/// does not match.
static Instruction *
reassociateMinMaxWithConstantInOperand(IntrinsicInst *II,
                                       InstCombiner::BuilderTy &Builder) {
  // Match and capture a single-use min/max operand with a constant, in either
  // operand position of II.
  Value *X, *Y;
  Constant *C;
  Instruction *Inner;
  if (!match(II,
             m_c_MaxOrMin(m_OneUse(m_CombineAnd(
                              m_Instruction(Inner),
                              m_MaxOrMin(m_Value(X), m_ImmConstant(C)))),
                          m_Value(Y))))
    return nullptr;

  // The inner op must be the same intrinsic as the outer one.
  const Intrinsic::ID MinMaxID = II->getIntrinsicID();
  auto *InnerMM = dyn_cast<IntrinsicInst>(Inner);
  if (!InnerMM || InnerMM->getIntrinsicID() != MinMaxID)
    return nullptr;

  // Check for constants to avoid infinite loops.
  if (match(X, m_ImmConstant()) || match(Y, m_ImmConstant()))
    return nullptr;

  // max (max X, C), Y --> max (max X, Y), C
  Function *MinMax =
      Intrinsic::getDeclaration(II->getModule(), MinMaxID, II->getType());
  Value *NewInner = Builder.CreateBinaryIntrinsic(MinMaxID, X, Y);
  NewInner->takeName(Inner);
  return CallInst::Create(MinMax, {NewInner, C});
}


/// Reduce a sequence of min/max intrinsics with a common operand.
///
/// Given op(op(A, B), op(C, D)) where the two inner calls share an operand
/// and at least one of them has a single use, reuse one inner call and
/// combine it with the remaining non-shared operand of the other.
/// \returns the new call (not yet inserted), or nullptr if no fold applies.
static Instruction *factorizeMinMaxTree(IntrinsicInst *II) {
  // Match 3 of the same min/max ops. Example: umin(umin(), umin()).
  auto *LHS = dyn_cast<IntrinsicInst>(II->getArgOperand(0));
  auto *RHS = dyn_cast<IntrinsicInst>(II->getArgOperand(1));
  const Intrinsic::ID MinMaxID = II->getIntrinsicID();
  if (!LHS || !RHS || LHS->getIntrinsicID() != MinMaxID ||
      RHS->getIntrinsicID() != MinMaxID ||
      (!LHS->hasOneUse() && !RHS->hasOneUse()))
    return nullptr;

  Value *A = LHS->getArgOperand(0);
  Value *B = LHS->getArgOperand(1);
  Value *C = RHS->getArgOperand(0);
  Value *D = RHS->getArgOperand(1);

  // Look for a common operand and pick the operand that is left over.
  //
  // If the LHS is only used in this chain, reuse the RHS min/max because
  // that will eliminate the LHS (the RHS may be used outside of the chain).
  // Otherwise the RHS is the single-use one: reuse the LHS and eliminate
  // the RHS.
  const bool ReuseRHS = LHS->hasOneUse();
  assert((ReuseRHS || RHS->hasOneUse()) && "Expected one-use operand");

  Value *ThirdOp = nullptr;
  if (ReuseRHS) {
    if (D == A || C == A) {
      // min(min(a, b), min(c, a)) --> min(min(c, a), b)
      // min(min(a, b), min(a, d)) --> min(min(a, d), b)
      ThirdOp = B;
    } else if (D == B || C == B) {
      // min(min(a, b), min(c, b)) --> min(min(c, b), a)
      // min(min(a, b), min(b, d)) --> min(min(b, d), a)
      ThirdOp = A;
    }
  } else {
    if (D == A || D == B) {
      // min(min(a, b), min(c, a)) --> min(min(a, b), c)
      // min(min(a, b), min(c, b)) --> min(min(a, b), c)
      ThirdOp = C;
    } else if (C == A || C == B) {
      // min(min(a, b), min(a, d)) --> min(min(a, b), d)
      // min(min(a, b), min(b, d)) --> min(min(a, b), d)
      ThirdOp = D;
    }
  }

  // No shared operand was found.
  if (!ThirdOp)
    return nullptr;

  Value *MinMaxOp = ReuseRHS ? RHS : LHS;
  Function *MinMax =
      Intrinsic::getDeclaration(II->getModule(), MinMaxID, II->getType());
  return CallInst::Create(MinMax, {MinMaxOp, ThirdOp});
}


/// If all arguments of the intrinsic are unary shuffles with the same mask,
/// try to shuffle after the intrinsic.
///
/// \returns the new shuffle (not yet inserted), or nullptr if the intrinsic
/// is not supported or the operands do not match.
static Instruction *
foldShuffledIntrinsicOperands(IntrinsicInst *II,
                              InstCombiner::BuilderTy &Builder) {
  // TODO: This should be extended to handle other intrinsics like ctpop,
  //       etc. Use llvm::isTriviallyVectorizable() and related to determine
  //       which intrinsics are safe to shuffle?
  const Intrinsic::ID IID = II->getIntrinsicID();
  switch (IID) {
  case Intrinsic::smax:
  case Intrinsic::smin:
  case Intrinsic::umax:
  case Intrinsic::umin:
  case Intrinsic::fma:
  case Intrinsic::fshl:
  case Intrinsic::fshr:
    break;
  default:
    return nullptr;
  }

  // The first argument fixes the mask every other argument must use.
  Value *FirstSrc;
  ArrayRef<int> Mask;
  if (!match(II->getArgOperand(0),
             m_Shuffle(m_Value(FirstSrc), m_Undef(), m_Mask(Mask))))
    return nullptr;

  // At least 1 operand must have 1 use because we are creating 2 instructions.
  if (none_of(II->args(), [](Value *V) { return V->hasOneUse(); }))
    return nullptr;

  // See if all arguments are shuffled with the same mask, from sources of the
  // same type as the first one.
  const unsigned NumArgs = II->arg_size();
  Type *SrcTy = FirstSrc->getType();
  SmallVector<Value *, 4> NewArgs;
  NewArgs.reserve(NumArgs);
  NewArgs.push_back(FirstSrc);
  for (unsigned Idx = 1; Idx < NumArgs; ++Idx) {
    Value *Src;
    if (!match(II->getArgOperand(Idx),
               m_Shuffle(m_Value(Src), m_Undef(), m_SpecificMask(Mask))) ||
        Src->getType() != SrcTy)
      return nullptr;
    NewArgs.push_back(Src);
  }

  // intrinsic (shuf X, M), (shuf Y, M), ... --> shuf (intrinsic X, Y, ...), M
  // For FP operations, pass the original call along as the FMF source.
  Instruction *FPI = isa<FPMathOperator>(II) ? II : nullptr;
  Value *NewIntrinsic = Builder.CreateIntrinsic(IID, SrcTy, NewArgs, FPI);
  return new ShuffleVectorInst(NewIntrinsic, Mask);
}


/// Fold the following cases and accepts bswap and bitreverse intrinsics:
///   bswap(logic_op(bswap(x), y)) --> logic_op(x, bswap(y))
///   bswap(logic_op(bswap(x), bswap(y))) --> logic_op(x, y) (ignores multiuse)
///
/// \p V is the operand of the outer bswap/bitreverse. \returns the new logic
/// op (not yet inserted), or nullptr if no fold applies.
template <Intrinsic::ID IntrID>
static Instruction *foldBitOrderCrossLogicOp(Value *V,
                                             InstCombiner::BuilderTy &Builder) {
  static_assert(IntrID == Intrinsic::bswap || IntrID == Intrinsic::bitreverse,
                "This helper only supports BSWAP and BITREVERSE intrinsics");

  // Find a single-use bitwise logic op. Check that it is a BinaryOperator
  // explicitly so we don't match ConstantExpr that aren't meaningful for this
  // transform.
  Value *X, *Y;
  if (!match(V, m_OneUse(m_BitwiseLogic(m_Value(X), m_Value(Y)))) ||
      !isa<BinaryOperator>(V))
    return nullptr;

  const BinaryOperator::BinaryOps Op = cast<BinaryOperator>(V)->getOpcode();
  Value *OldReorderX, *OldReorderY;

  // If both X and Y are bswap/bitreverse, the transform reduces the number
  // of instructions even if there's multiuse.
  if (match(X, m_Intrinsic<IntrID>(m_Value(OldReorderX))) &&
      match(Y, m_Intrinsic<IntrID>(m_Value(OldReorderY))))
    return BinaryOperator::Create(Op, OldReorderX, OldReorderY);

  // If only one operand is bswap/bitreverse, that operand must have only one
  // use, because a new bswap/bitreverse is created for the other operand.
  if (match(X, m_OneUse(m_Intrinsic<IntrID>(m_Value(OldReorderX))))) {
    Value *ReorderedY = Builder.CreateUnaryIntrinsic(IntrID, Y);
    return BinaryOperator::Create(Op, OldReorderX, ReorderedY);
  }

  if (match(Y, m_OneUse(m_Intrinsic<IntrID>(m_Value(OldReorderY))))) {
    Value *ReorderedX = Builder.CreateUnaryIntrinsic(IntrID, X);
    return BinaryOperator::Create(Op, ReorderedX, OldReorderY);
  }

  return nullptr;
}


/// CallInst simplification. This mostly only handles folding of intrinsic

/// instructions. For normal calls, it allows visitCallBase to do the heavy

/// lifting.

Instruction *InstCombinerImpl::visitCallInst(CallInst &CI) {

  // Don't try to simplify calls without uses. It will not do anything useful,

  // but will result in the following folds being skipped.

  if (!CI.use_empty()) {

    SmallVector<Value *, 4> Args;

    Args.reserve(CI.arg_size());

    for (Value *Op : CI.args())

      Args.push_back(Op);

    if (Value *V = simplifyCall(&CI, CI.getCalledOperand(), Args,

                                SQ.getWithInstruction(&CI)))

      return replaceInstUsesWith(CI, V);

  }


  if (Value *FreedOp = getFreedOperand(&CI, &TLI))

    return visitFree(CI, FreedOp);


  // If the caller function (i.e. us, the function that contains this CallInst)

  // is nounwind, mark the call as nounwind, even if the callee isn't.

  if (CI.getFunction()->doesNotThrow() && !CI.doesNotThrow()) {

    CI.setDoesNotThrow();

    return &CI;

  }


  IntrinsicInst *II = dyn_cast<IntrinsicInst>(&CI);

  if (!II) return visitCallBase(CI);


  // For atomic unordered mem intrinsics if len is not a positive or

  // not a multiple of element size then behavior is undefined.

  if (auto *AMI = dyn_cast<AtomicMemIntrinsic>(II))

    if (ConstantInt *NumBytes = dyn_cast<ConstantInt>(AMI->getLength()))

      if (NumBytes->isNegative() ||

          (NumBytes->getZExtValue() % AMI->getElementSizeInBytes() != 0)) {

        CreateNonTerminatorUnreachable(AMI);

        assert(AMI->getType()->isVoidTy() &&

               "non void atomic unordered mem intrinsic");

        return eraseInstFromFunction(*AMI);

      }


  // Intrinsics cannot occur in an invoke or a callbr, so handle them here

  // instead of in visitCallBase.

  if (auto *MI = dyn_cast<AnyMemIntrinsic>(II)) {

    bool Changed = false;


    // memmove/cpy/set of zero bytes is a noop.

    if (Constant *NumBytes = dyn_cast<Constant>(MI->getLength())) {

      if (NumBytes->isNullValue())

        return eraseInstFromFunction(CI);

    }


    // No other transformations apply to volatile transfers.

    if (auto *M = dyn_cast<MemIntrinsic>(MI))

      if (M->isVolatile())

        return nullptr;


    // If we have a memmove and the source operation is a constant global,

    // then the source and dest pointers can't alias, so we can change this

    // into a call to memcpy.

    if (auto *MMI = dyn_cast<AnyMemMoveInst>(MI)) {

      if (GlobalVariable *GVSrc = dyn_cast<GlobalVariable>(MMI->getSource()))

        if (GVSrc->isConstant()) {

          Module *M = CI.getModule();

          Intrinsic::ID MemCpyID =

              isa<AtomicMemMoveInst>(MMI)

                  ? Intrinsic::memcpy_element_unordered_atomic

                  : Intrinsic::memcpy;

          Type *Tys[3] = { CI.getArgOperand(0)->getType(),

                           CI.getArgOperand(1)->getType(),

                           CI.getArgOperand(2)->getType() };

          CI.setCalledFunction(Intrinsic::getDeclaration(M, MemCpyID, Tys));

          Changed = true;

        }

    }


    if (AnyMemTransferInst *MTI = dyn_cast<AnyMemTransferInst>(MI)) {

      // memmove(x,x,size) -> noop.

      if (MTI->getSource() == MTI->getDest())

        return eraseInstFromFunction(CI);

    }


    // If we can determine a pointer alignment that is bigger than currently

    // set, update the alignment.

    if (auto *MTI = dyn_cast<AnyMemTransferInst>(MI)) {

      if (Instruction *I = SimplifyAnyMemTransfer(MTI))

        return I;

    } else if (auto *MSI = dyn_cast<AnyMemSetInst>(MI)) {

      if (Instruction *I = SimplifyAnyMemSet(MSI))

        return I;

    }


    if (Changed) return II;

  }


  // For fixed width vector result intrinsics, use the generic demanded vector

  // support.

  if (auto *IIFVTy = dyn_cast<FixedVectorType>(II->getType())) {

    auto VWidth = IIFVTy->getNumElements();

    APInt PoisonElts(VWidth, 0);

    APInt AllOnesEltMask(APInt::getAllOnes(VWidth));

    if (Value *V = SimplifyDemandedVectorElts(II, AllOnesEltMask, PoisonElts)) {

      if (V != II)

        return replaceInstUsesWith(*II, V);

      return II;

    }

  }


  if (II->isCommutative()) {

    if (auto Pair = matchSymmetricPair(II->getOperand(0), II->getOperand(1))) {

      replaceOperand(*II, 0, Pair->first);

      replaceOperand(*II, 1, Pair->second);

      return II;

    }


    if (CallInst *NewCall = canonicalizeConstantArg0ToArg1(CI))

      return NewCall;

  }


  // Unused constrained FP intrinsic calls may have declared side effect, which

  // prevents it from being removed. In some cases however the side effect is

  // actually absent. To detect this case, call SimplifyConstrainedFPCall. If it

  // returns a replacement, the call may be removed.

  if (CI.use_empty() && isa<ConstrainedFPIntrinsic>(CI)) {

    if (simplifyConstrainedFPCall(&CI, SQ.getWithInstruction(&CI)))

      return eraseInstFromFunction(CI);

  }


  Intrinsic::ID IID = II->getIntrinsicID();

  switch (IID) {

  case Intrinsic::objectsize: {

    SmallVector<Instruction *> InsertedInstructions;

    if (Value *V = lowerObjectSizeCall(II, DL, &TLI, AA, /*MustSucceed=*/false,

                                       &InsertedInstructions)) {

      for (Instruction *Inserted : InsertedInstructions)

        Worklist.add(Inserted);

      return replaceInstUsesWith(CI, V);

    }

    return nullptr;

  }

  case Intrinsic::abs: {

    Value *IIOperand = II->getArgOperand(0);

    bool IntMinIsPoison = cast<Constant>(II->getArgOperand(1))->isOneValue();


    // abs(-x) -> abs(x)

    // TODO: Copy nsw if it was present on the neg?

    Value *X;

    if (match(IIOperand, m_Neg(m_Value(X))))

      return replaceOperand(*II, 0, X);

    if (match(IIOperand, m_Select(m_Value(), m_Value(X), m_Neg(m_Deferred(X)))))

      return replaceOperand(*II, 0, X);

    if (match(IIOperand, m_Select(m_Value(), m_Neg(m_Value(X)), m_Deferred(X))))

      return replaceOperand(*II, 0, X);


    Value *Y;

    // abs(a * abs(b)) -> abs(a * b)

    if (match(IIOperand,

              m_OneUse(m_c_Mul(m_Value(X),

                               m_Intrinsic<Intrinsic::abs>(m_Value(Y)))))) {

      bool NSW =

          cast<Instruction>(IIOperand)->hasNoSignedWrap() && IntMinIsPoison;

      auto *XY = NSW ? Builder.CreateNSWMul(X, Y) : Builder.CreateMul(X, Y);

      return replaceOperand(*II, 0, XY);

    }


    if (std::optional<bool> Known =

            getKnownSignOrZero(IIOperand, II, DL, &AC, &DT)) {

      // abs(x) -> x if x >= 0 (include abs(x-y) --> x - y where x >= y)

      // abs(x) -> x if x > 0 (include abs(x-y) --> x - y where x > y)

      if (!*Known)

        return replaceInstUsesWith(*II, IIOperand);


      // abs(x) -> -x if x < 0

      // abs(x) -> -x if x <= 0 (include abs(x-y) --> y - x where x <= y)

      if (IntMinIsPoison)

        return BinaryOperator::CreateNSWNeg(IIOperand);

      return BinaryOperator::CreateNeg(IIOperand);

    }


    // abs (sext X) --> zext (abs X*)

    // Clear the IsIntMin (nsw) bit on the abs to allow narrowing.

    if (match(IIOperand, m_OneUse(m_SExt(m_Value(X))))) {

      Value *NarrowAbs =

          Builder.CreateBinaryIntrinsic(Intrinsic::abs, X, Builder.getFalse());

      return CastInst::Create(Instruction::ZExt, NarrowAbs, II->getType());

    }


    // Match a complicated way to check if a number is odd/even:

    // abs (srem X, 2) --> and X, 1

    const APInt *C;

    if (match(IIOperand, m_SRem(m_Value(X), m_APInt(C))) && *C == 2)

      return BinaryOperator::CreateAnd(X, ConstantInt::get(II->getType(), 1));


    break;

  }

  case Intrinsic::umin: {

    Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

    // umin(x, 1) == zext(x != 0)

    if (match(I1, m_One())) {

      assert(II->getType()->getScalarSizeInBits() != 1 &&

             "Expected simplify of umin with max constant");

      Value *Zero = Constant::getNullValue(I0->getType());

      Value *Cmp = Builder.CreateICmpNE(I0, Zero);

      return CastInst::Create(Instruction::ZExt, Cmp, II->getType());

    }

    [[fallthrough]];

  }

  case Intrinsic::umax: {

    Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

    Value *X, *Y;

    if (match(I0, m_ZExt(m_Value(X))) && match(I1, m_ZExt(m_Value(Y))) &&

        (I0->hasOneUse() || I1->hasOneUse()) && X->getType() == Y->getType()) {

      Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, Y);

      return CastInst::Create(Instruction::ZExt, NarrowMaxMin, II->getType());

    }

    Constant *C;

    if (match(I0, m_ZExt(m_Value(X))) && match(I1, m_Constant(C)) &&

        I0->hasOneUse()) {

      if (Constant *NarrowC = getLosslessUnsignedTrunc(C, X->getType())) {

        Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, NarrowC);

        return CastInst::Create(Instruction::ZExt, NarrowMaxMin, II->getType());

      }

    }

    // If both operands of unsigned min/max are sign-extended, it is still ok

    // to narrow the operation.

    [[fallthrough]];

  }

  case Intrinsic::smax:

  case Intrinsic::smin: {

    Value *I0 = II->getArgOperand(0), *I1 = II->getArgOperand(1);

    Value *X, *Y;

    if (match(I0, m_SExt(m_Value(X))) && match(I1, m_SExt(m_Value(Y))) &&

        (I0->hasOneUse() || I1->hasOneUse()) && X->getType() == Y->getType()) {

      Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, Y);

      return CastInst::Create(Instruction::SExt, NarrowMaxMin, II->getType());

    }


    Constant *C;

    if (match(I0, m_SExt(m_Value(X))) && match(I1, m_Constant(C)) &&

        I0->hasOneUse()) {

      if (Constant *NarrowC = getLosslessSignedTrunc(C, X->getType())) {

        Value *NarrowMaxMin = Builder.CreateBinaryIntrinsic(IID, X, NarrowC);

        return CastInst::Create(Instruction::SExt, NarrowMaxMin, II->getType());

      }

    }


    // umin(i1 X, i1 Y) -> and i1 X, Y

    // smax(i1 X, i1 Y) -> and i1 X, Y

    if ((IID == Intrinsic::umin || IID == Intrinsic::smax) &&

        II->getType()->isIntOrIntVectorTy(1)) {

      return BinaryOperator::CreateAnd(I0, I1);

    }


    // umax(i1 X, i1 Y) -> or i1 X, Y

    // smin(i1 X, i1 Y) -> or i1 X, Y

    if ((IID == Intrinsic::umax || IID == Intrinsic::smin) &&

        II->getType()->isIntOrIntVectorTy(1)) {

      return BinaryOperator::CreateOr(I0, I1);

    }


    if (IID == Intrinsic::smax || IID == Intrinsic::smin) {

      // smax (neg nsw X), (neg nsw Y) --> neg nsw (smin X, Y)

      // smin (neg nsw X), (neg nsw Y) --> neg nsw (smax X, Y)

      // TODO: Canonicalize neg after min/max if I1 is constant.

      if (match(I0, m_NSWNeg(m_Value(X))) && match(I1, m_NSWNeg(m_Value(Y))) &&

          (I0->hasOneUse() || I1->hasOneUse())) {

        Intrinsic::ID InvID = getInverseMinMaxIntrinsic(IID);

        Value *InvMaxMin = Builder.CreateBinaryIntrinsic(InvID, X, Y);

        return BinaryOperator::CreateNSWNeg(InvMaxMin);

      }

    }


    // (umax X, (xor X, Pow2))

    //      -> (or X, Pow2)

    // (umin X, (xor X, Pow2))

    //      -> (and X, ~Pow2)

    // (smax X, (xor X, Pos_Pow2))

    //      -> (or X, Pos_Pow2)

    // (smin X, (xor X, Pos_Pow2))

    //      -> (and X, ~Pos_Pow2)

    // (smax X, (xor X, Neg_Pow2))

    //      -> (and X, ~Neg_Pow2)

    // (smin X, (xor X, Neg_Pow2))

    //      -> (or X, Neg_Pow2)

    if ((match(I0, m_c_Xor(m_Specific(I1), m_Value(X))) ||

         match(I1, m_c_Xor(m_Specific(I0), m_Value(X)))) &&

        isKnownToBeAPowerOfTwo(X, /* OrZero */ true)) {

      bool UseOr = IID == Intrinsic::smax || IID == Intrinsic::umax;

      bool UseAndN = IID == Intrinsic::smin || IID == Intrinsic::umin;


      if (IID == Intrinsic::smax || IID == Intrinsic::smin) {

        auto KnownSign = getKnownSign(X, II, DL, &AC, &DT);

        if (KnownSign == std::nullopt) {

          UseOr = false;

          UseAndN = false;

        } else if (*KnownSign /* true is Signed. */) {

          UseOr ^= true;

          UseAndN ^= true;

          Type *Ty = I0->getType();

          // Negative power of 2 must be IntMin. It's possible to be able to

          // prove negative / power of 2 without actually having known bits, so

          // just get the value by hand.

          X = Constant::getIntegerValue(

              Ty, APInt::getSignedMinValue(Ty->getScalarSizeInBits()));

        }

      }

      if (UseOr)

        return BinaryOperator::CreateOr(I0, X);

      else if (UseAndN)

        return BinaryOperator::CreateAnd(I0, Builder.CreateNot(X));

    }


    // If we can eliminate ~A and Y is free to invert:

    // max ~A, Y --> ~(min A, ~Y)

    //

    // Examples:

    // max ~A, ~Y --> ~(min A, Y)

    // max ~A, C --> ~(min A, ~C)

    // max ~A, (max ~Y, ~Z) --> ~min( A, (min Y, Z))

    auto moveNotAfterMinMax = [&](Value *X, Value *Y) -> Instruction * {

      Value *A;

      if (match(X, m_OneUse(m_Not(m_Value(A)))) &&

          !isFreeToInvert(A, A->hasOneUse())) {

        if (Value *NotY = getFreelyInverted(Y, Y->hasOneUse(), &Builder)) {

          Intrinsic::ID InvID = getInverseMinMaxIntrinsic(IID);

          Value *InvMaxMin = Builder.CreateBinaryIntrinsic(InvID, A, NotY);

          return BinaryOperator::CreateNot(InvMaxMin);

        }

      }

      return nullptr;

    };


    if (Instruction *I = moveNotAfterMinMax(I0, I1))

      return I;

    if (Instruction *I = moveNotAfterMinMax(I1, I0))

      return I;


    if (Instruction *I = moveAddAfterMinMax(II, Builder))

      return I;


    // minmax (X & NegPow2C, Y & NegPow2C) --> minmax(X, Y) & NegPow2C

    const APInt *RHSC;

    if (match(I0, m_OneUse(m_And(m_Value(X), m_NegatedPower2(RHSC)))) &&

        match(I1, m_OneUse(m_And(m_Value(Y), m_SpecificInt(*RHSC)))))

      return BinaryOperator::CreateAnd(Builder.CreateBinaryIntrinsic(IID, X, Y),

                                       ConstantInt::get(II->getType(), *RHSC));


    // smax(X, -X) --> abs(X)

    // smin(X, -X) --> -abs(X)

    // umax(X, -X) --> -abs(X)

    // umin(X, -X) --> abs(X)

    if (isKnownNegation(I0, I1)) {

      // We can choose either operand as the input to abs(), but if we can

      // eliminate the only use of a value, that's better for subsequent

      // transforms/analysis.

      if (I0->hasOneUse() && !I1->hasOneUse())

        std::swap(I0, I1);


      // This is some variant of abs(). See if we can propagate 'nsw' to the abs

      // operation and potentially its negation.

      bool IntMinIsPoison = isKnownNegation(I0, I1, /* NeedNSW */ true);

      Value *Abs = Builder.CreateBinaryIntrinsic(

          Intrinsic::abs, I0,

          ConstantInt::getBool(II->getContext(), IntMinIsPoison));


      // We don't have a "nabs" intrinsic, so negate if needed based on the

      // max/min operation.

      if (IID == Intrinsic::smin || IID == Intrinsic::umax)

        Abs = Builder.CreateNeg(Abs, "nabs", IntMinIsPoison);

      return replaceInstUsesWith(CI, Abs);

    }


    if (Instruction *Sel = foldClampRangeOfTwo(II, Builder))

      return Sel;


    if (Instruction *SAdd = matchSAddSubSat(*II))

      return SAdd;


    if (Value *NewMinMax = reassociateMinMaxWithConstants(II, Builder, SQ))

      return replaceInstUsesWith(*II, NewMinMax);


    if (Instruction *R = reassociateMinMaxWithConstantInOperand(II, Builder))

      return R;


    if (Instruction *NewMinMax = factorizeMinMaxTree(II))

       return NewMinMax;


    // Try to fold minmax with constant RHS based on range information

    if (match(I1, m_APIntAllowPoison(RHSC))) {

      ICmpInst::Predicate Pred =

          ICmpInst::getNonStrictPredicate(MinMaxIntrinsic::getPredicate(IID));

      bool IsSigned = MinMaxIntrinsic::isSigned(IID);

      ConstantRange LHS_CR = computeConstantRangeIncludingKnownBits(

          I0, IsSigned, SQ.getWithInstruction(II));

      if (!LHS_CR.isFullSet()) {

        if (LHS_CR.icmp(Pred, *RHSC))

          return replaceInstUsesWith(*II, I0);

        if (LHS_CR.icmp(ICmpInst::getSwappedPredicate(Pred), *RHSC))

          return replaceInstUsesWith(*II,

                                     ConstantInt::get(II->getType(), *RHSC));

      }

    }


    break;

  }

  case Intrinsic::bitreverse: {

    Value *IIOperand = II->getArgOperand(0);

    // bitrev (zext i1 X to ?) --> X ? SignBitC : 0

    Value *X;

    if (match(IIOperand, m_ZExt(m_Value(X))) &&

        X->getType()->isIntOrIntVectorTy(1)) {

      Type *Ty = II->getType();

      APInt SignBit = APInt::getSignMask(Ty->getScalarSizeInBits());

      return SelectInst::Create(X, ConstantInt::get(Ty, SignBit),

                                ConstantInt::getNullValue(Ty));

    }


    if (Instruction *crossLogicOpFold =

        foldBitOrderCrossLogicOp<Intrinsic::bitreverse>(IIOperand, Builder))

      return crossLogicOpFold;


    break;

  }

  case Intrinsic::bswap: {

    Value *IIOperand = II->getArgOperand(0);


    // Try to canonicalize bswap-of-logical-shift-by-8-bit-multiple as

    // inverse-shift-of-bswap:

    // bswap (shl X, Y) --> lshr (bswap X), Y

    // bswap (lshr X, Y) --> shl (bswap X), Y

    Value *X, *Y;

    if (match(IIOperand, m_OneUse(m_LogicalShift(m_Value(X), m_Value(Y))))) {

      unsigned BitWidth = IIOperand->getType()->getScalarSizeInBits();

      if (MaskedValueIsZero(Y, APInt::getLowBitsSet(BitWidth, 3))) {

        Value *NewSwap = Builder.CreateUnaryIntrinsic(Intrinsic::bswap, X);

        BinaryOperator::BinaryOps InverseShift =

            cast<BinaryOperator>(IIOperand)->getOpcode() == Instruction::Shl

                ? Instruction::LShr

                : Instruction::Shl;

        return BinaryOperator::Create(InverseShift, NewSwap, Y);

      }

    }


    KnownBits Known = computeKnownBits(IIOperand, 0, II);

    uint64_t LZ = alignDown(Known.countMinLeadingZeros(), 8);

    uint64_t TZ = alignDown(Known.countMinTrailingZeros(), 8);

    unsigned BW = Known.getBitWidth();


    // bswap(x) -> shift(x) if x has exactly one "active byte"

    if (BW - LZ - TZ == 8) {

      assert(LZ != TZ && "active byte cannot be in the middle");

      if (LZ > TZ)  // -> shl(x) if the "active byte" is in the low part of x

        return BinaryOperator::CreateNUWShl(

            IIOperand, ConstantInt::get(IIOperand->getType(), LZ - TZ));

      // -> lshr(x) if the "active byte" is in the high part of x

      return BinaryOperator::CreateExactLShr(

            IIOperand, ConstantInt::get(IIOperand->getType(), TZ - LZ));

    }


    // bswap(trunc(bswap(x))) -> trunc(lshr(x, c))

    if (match(IIOperand, m_Trunc(m_BSwap(m_Value(X))))) {

      unsigned C = X->getType()->getScalarSizeInBits() - BW;

      Value *CV = ConstantInt::get(X->getType(), C);

      Value *V = Builder.CreateLShr(X, CV);

      return new TruncInst(V, IIOperand->getType());

    }


    if (Instruction *crossLogicOpFold =

            foldBitOrderCrossLogicOp<Intrinsic::bswap>(IIOperand, Builder)) {

      return crossLogicOpFold;

    }


    // Try to fold into bitreverse if bswap is the root of the expression tree.

    if (Instruction *BitOp = matchBSwapOrBitReverse(*II, /*MatchBSwaps*/ false,

                                                    /*MatchBitReversals*/ true))

      return BitOp;

    break;

  }

  case Intrinsic::masked_load:

    if (Value *SimplifiedMaskedOp = simplifyMaskedLoad(*II))

      return replaceInstUsesWith(CI, SimplifiedMaskedOp);

    break;

  case Intrinsic::masked_store:

    return simplifyMaskedStore(*II);

  case Intrinsic::masked_gather:

    return simplifyMaskedGather(*II);

  case Intrinsic::masked_scatter:

    return simplifyMaskedScatter(*II);

  case Intrinsic::launder_invariant_group:

  case Intrinsic::strip_invariant_group:

    if (auto *SkippedBarrier = simplifyInvariantGroupIntrinsic(*II, *this))

      return replaceInstUsesWith(*II, SkippedBarrier);

    break;

  case Intrinsic::powi:

    if (ConstantInt *Power = dyn_cast<ConstantInt>(II->getArgOperand(1))) {

      // 0 and 1 are handled in instsimplify

      // powi(x, -1) -> 1/x

      if (Power->isMinusOne())

        return BinaryOperator::CreateFDivFMF(ConstantFP::get(CI.getType(), 1.0),

                                             II->getArgOperand(0), II);

      // powi(x, 2) -> x*x

      if (Power->equalsInt(2))

        return BinaryOperator::CreateFMulFMF(II->getArgOperand(0),

                                             II->getArgOperand(0), II);


      if (!Power->getValue()[0]) {

        Value *X;

        // If power is even:

        // powi(-x, p) -> powi(x, p)

        // powi(fabs(x), p) -> powi(x, p)

        // powi(copysign(x, y), p) -> powi(x, p)

        if (match(II->getArgOperand(0), m_FNeg(m_Value(X))) ||

            match(II->getArgOperand(0), m_FAbs(m_Value(X))) ||

            match(II->getArgOperand(0),

                  m_Intrinsic<Intrinsic::copysign>(m_Value(X), m_Value())))

          return replaceOperand(*II, 0, X);

      }

    }

    break;


  case Intrinsic::cttz:

  case Intrinsic::ctlz:

    if (auto *I = foldCttzCtlz(*II, *this))

      return I;

    break;


  case Intrinsic::ctpop:

    if (auto *I = foldCtpop(*II, *this))

      return I;

    break;


  case Intrinsic::fshl:

  case Intrinsic::fshr: {

    Value *Op0 = II->getArgOperand(0), *Op1 = II->getArgOperand(1);

    Type *Ty = II->getType();

    unsigned BitWidth = Ty->getScalarSizeInBits();

    Constant *ShAmtC;

    if (match(II->getArgOperand(2), m_ImmConstant(ShAmtC))) {

      // Canonicalize a shift amount constant operand to modulo the bit-width.

      Constant *WidthC = ConstantInt::get(Ty, BitWidth);

      Constant *ModuloC =

          ConstantFoldBinaryOpOperands(Instruction::URem, ShAmtC, WidthC, DL);

      if (!ModuloC)

        return nullptr;

      if (ModuloC != ShAmtC)

        return replaceOperand(*II, 2, ModuloC);


      assert(match(ConstantFoldCompareInstOperands(ICmpInst::ICMP_UGT, WidthC,

                                                   ShAmtC, DL),

                   m_One()) &&

             "Shift amount expected to be modulo bitwidth");


      // Canonicalize funnel shift right by constant to funnel shift left. This

      // is not entirely arbitrary. For historical reasons, the backend may

      // recognize rotate left patterns but miss rotate right patterns.

      if (IID == Intrinsic::fshr) {

        // fshr X, Y, C --> fshl X, Y, (BitWidth - C) if C is not zero.

        if (!isKnownNonZero(ShAmtC, SQ.getWithInstruction(II)))

          return nullptr;


        Constant *LeftShiftC = ConstantExpr::getSub(WidthC, ShAmtC);

        Module *Mod = II->getModule();

        Function *Fshl = Intrinsic::getDeclaration(Mod, Intrinsic::fshl, Ty);

        return CallInst::Create(Fshl, { Op0, Op1, LeftShiftC });

      }

      assert(IID == Intrinsic::fshl &&

             "All funnel shifts by simple constants should go left");


      // fshl(X, 0, C) --> shl X, C

      // fshl(X, undef, C) --> shl X, C

      if (match(Op1, m_ZeroInt()) || match(Op1, m_Undef()))

        return BinaryOperator::CreateShl(Op0, ShAmtC);


      // fshl(0, X, C) --> lshr X, (BW-C)

      // fshl(undef, X, C) --> lshr X, (BW-C)

      if (match(Op0, m_ZeroInt()) || match(Op0, m_Undef()))

        return BinaryOperator::CreateLShr(Op1,

                                          ConstantExpr::getSub(WidthC, ShAmtC));


      // fshl i16 X, X, 8 --> bswap i16 X (reduce to more-specific form)

      if (Op0 == Op1 && BitWidth == 16 && match(ShAmtC, m_SpecificInt(8))) {

        Module *Mod = II->getModule();

        Function *Bswap = Intrinsic::getDeclaration(Mod, Intrinsic::bswap, Ty);

        return CallInst::Create(Bswap, { Op0 });

      }

      if (Instruction *BitOp =

              matchBSwapOrBitReverse(*II, /*MatchBSwaps*/ true,

                                     /*MatchBitReversals*/ true))

        return BitOp;

    }


    // Left or right might be masked.

    if (SimplifyDemandedInstructionBits(*II))

      return &CI;


    // The shift amount (operand 2) of a funnel shift is modulo the bitwidth,

    // so only the low bits of the shift amount are demanded if the bitwidth is

    // a power-of-2.

    if (!isPowerOf2_32(BitWidth))

      break;

    APInt Op2Demanded = APInt::getLowBitsSet(BitWidth, Log2_32_Ceil(BitWidth));

    KnownBits Op2Known(BitWidth);

    if (SimplifyDemandedBits(II, 2, Op2Demanded, Op2Known))

      return &CI;

    break;

  }

  case Intrinsic::ptrmask: {

    unsigned BitWidth = DL.getPointerTypeSizeInBits(II->getType());

    KnownBits Known(BitWidth);

    if (SimplifyDemandedInstructionBits(*II, Known))

      return II;


    Value *InnerPtr, *InnerMask;

    bool Changed = false;

    // Combine:

    // (ptrmask (ptrmask p, A), B)

    //    -> (ptrmask p, (and A, B))

    if (match(II->getArgOperand(0),

              m_OneUse(m_Intrinsic<Intrinsic::ptrmask>(m_Value(InnerPtr),

                                                       m_Value(InnerMask))))) {

      assert(II->getArgOperand(1)->getType() == InnerMask->getType() &&

             "Mask types must match");

      // TODO: If InnerMask == Op1, we could copy attributes from inner

      // callsite -> outer callsite.

      Value *NewMask = Builder.CreateAnd(II->getArgOperand(1), InnerMask);

      replaceOperand(CI, 0, InnerPtr);

      replaceOperand(CI, 1, NewMask);

      Changed = true;

    }


    // See if we can deduce non-null.

    if (!CI.hasRetAttr(Attribute::NonNull) &&

        (Known.isNonZero() ||

         isKnownNonZero(II, getSimplifyQuery().getWithInstruction(II)))) {

      CI.addRetAttr(Attribute::NonNull);

      Changed = true;

    }


    unsigned NewAlignmentLog =

        std::min(Value::MaxAlignmentExponent,

                 std::min(BitWidth - 1, Known.countMinTrailingZeros()));

    // Known bits will capture if we had alignment information associated with

    // the pointer argument.

    if (NewAlignmentLog > Log2(CI.getRetAlign().valueOrOne())) {

      CI.addRetAttr(Attribute::getWithAlignment(

          CI.getContext(), Align(uint64_t(1) << NewAlignmentLog)));

      Changed = true;

    }

    if (Changed)

      return &CI;

    break;

  }

  case Intrinsic::uadd_with_overflow:

  case Intrinsic::sadd_with_overflow: {

    if (Instruction *I = foldIntrinsicWithOverflowCommon(II))

      return I;


    // Given 2 constant operands whose sum does not overflow:

    // uaddo (X +nuw C0), C1 -> uaddo X, C0 + C1

    // saddo (X +nsw C0), C1 -> saddo X, C0 + C1

    Value *X;

    const APInt *C0, *C1;

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);

    bool IsSigned = IID == Intrinsic::sadd_with_overflow;

    bool HasNWAdd = IsSigned

                        ? match(Arg0, m_NSWAddLike(m_Value(X), m_APInt(C0)))

                        : match(Arg0, m_NUWAddLike(m_Value(X), m_APInt(C0)));

    if (HasNWAdd && match(Arg1, m_APInt(C1))) {

      bool Overflow;

      APInt NewC =

          IsSigned ? C1->sadd_ov(*C0, Overflow) : C1->uadd_ov(*C0, Overflow);

      if (!Overflow)

        return replaceInstUsesWith(

            *II, Builder.CreateBinaryIntrinsic(

                     IID, X, ConstantInt::get(Arg1->getType(), NewC)));

    }

    break;

  }


  case Intrinsic::umul_with_overflow:

  case Intrinsic::smul_with_overflow:

  case Intrinsic::usub_with_overflow:

    if (Instruction *I = foldIntrinsicWithOverflowCommon(II))

      return I;

    break;


  case Intrinsic::ssub_with_overflow: {

    if (Instruction *I = foldIntrinsicWithOverflowCommon(II))

      return I;


    Constant *C;

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);

    // Given a constant C that is not the minimum signed value

    // for an integer of a given bit width:

    //

    // ssubo X, C -> saddo X, -C

    if (match(Arg1, m_Constant(C)) && C->isNotMinSignedValue()) {

      Value *NegVal = ConstantExpr::getNeg(C);

      // Build a saddo call that is equivalent to the discovered

      // ssubo call.

      return replaceInstUsesWith(

          *II, Builder.CreateBinaryIntrinsic(Intrinsic::sadd_with_overflow,

                                             Arg0, NegVal));

    }


    break;

  }


  case Intrinsic::uadd_sat:

  case Intrinsic::sadd_sat:

  case Intrinsic::usub_sat:

  case Intrinsic::ssub_sat: {

    SaturatingInst *SI = cast<SaturatingInst>(II);

    Type *Ty = SI->getType();

    Value *Arg0 = SI->getLHS();

    Value *Arg1 = SI->getRHS();


    // Make use of known overflow information.

    OverflowResult OR = computeOverflow(SI->getBinaryOp(), SI->isSigned(),

                                        Arg0, Arg1, SI);

    switch (OR) {

      case OverflowResult::MayOverflow:

        break;

      case OverflowResult::NeverOverflows:

        if (SI->isSigned())

          return BinaryOperator::CreateNSW(SI->getBinaryOp(), Arg0, Arg1);

        else

          return BinaryOperator::CreateNUW(SI->getBinaryOp(), Arg0, Arg1);

      case OverflowResult::AlwaysOverflowsLow: {

        unsigned BitWidth = Ty->getScalarSizeInBits();

        APInt Min = APSInt::getMinValue(BitWidth, !SI->isSigned());

        return replaceInstUsesWith(*SI, ConstantInt::get(Ty, Min));

      }

      case OverflowResult::AlwaysOverflowsHigh: {

        unsigned BitWidth = Ty->getScalarSizeInBits();

        APInt Max = APSInt::getMaxValue(BitWidth, !SI->isSigned());

        return replaceInstUsesWith(*SI, ConstantInt::get(Ty, Max));

      }

    }


    // usub_sat((sub nuw C, A), C1) -> usub_sat(usub_sat(C, C1), A)

    // which after that:

    // usub_sat((sub nuw C, A), C1) -> usub_sat(C - C1, A) if C1 u< C

    // usub_sat((sub nuw C, A), C1) -> 0 otherwise

    Constant *C, *C1;

    Value *A;

    if (IID == Intrinsic::usub_sat &&

        match(Arg0, m_NUWSub(m_ImmConstant(C), m_Value(A))) &&

        match(Arg1, m_ImmConstant(C1))) {

      auto *NewC = Builder.CreateBinaryIntrinsic(Intrinsic::usub_sat, C, C1);

      auto *NewSub =

          Builder.CreateBinaryIntrinsic(Intrinsic::usub_sat, NewC, A);

      return replaceInstUsesWith(*SI, NewSub);

    }


    // ssub.sat(X, C) -> sadd.sat(X, -C) if C != MIN

    if (IID == Intrinsic::ssub_sat && match(Arg1, m_Constant(C)) &&

        C->isNotMinSignedValue()) {

      Value *NegVal = ConstantExpr::getNeg(C);

      return replaceInstUsesWith(

          *II, Builder.CreateBinaryIntrinsic(

              Intrinsic::sadd_sat, Arg0, NegVal));

    }


    // sat(sat(X + Val2) + Val) -> sat(X + (Val+Val2))

    // sat(sat(X - Val2) - Val) -> sat(X - (Val+Val2))

    // if Val and Val2 have the same sign

    if (auto *Other = dyn_cast<IntrinsicInst>(Arg0)) {

      Value *X;

      const APInt *Val, *Val2;

      APInt NewVal;

      bool IsUnsigned =

          IID == Intrinsic::uadd_sat || IID == Intrinsic::usub_sat;

      if (Other->getIntrinsicID() == IID &&

          match(Arg1, m_APInt(Val)) &&

          match(Other->getArgOperand(0), m_Value(X)) &&

          match(Other->getArgOperand(1), m_APInt(Val2))) {

        if (IsUnsigned)

          NewVal = Val->uadd_sat(*Val2);

        else if (Val->isNonNegative() == Val2->isNonNegative()) {

          bool Overflow;

          NewVal = Val->sadd_ov(*Val2, Overflow);

          if (Overflow) {

            // Both adds together may add more than SignedMaxValue

            // without saturating the final result.

            break;

          }

        } else {

          // Cannot fold saturated addition with different signs.

          break;

        }


        return replaceInstUsesWith(

            *II, Builder.CreateBinaryIntrinsic(

                     IID, X, ConstantInt::get(II->getType(), NewVal)));

      }

    }

    break;

  }


  case Intrinsic::minnum:

  case Intrinsic::maxnum:

  case Intrinsic::minimum:

  case Intrinsic::maximum: {

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);

    Value *X, *Y;

    if (match(Arg0, m_FNeg(m_Value(X))) && match(Arg1, m_FNeg(m_Value(Y))) &&

        (Arg0->hasOneUse() || Arg1->hasOneUse())) {

      // If both operands are negated, invert the call and negate the result:

      // min(-X, -Y) --> -(max(X, Y))

      // max(-X, -Y) --> -(min(X, Y))

      Intrinsic::ID NewIID;

      switch (IID) {

      case Intrinsic::maxnum:

        NewIID = Intrinsic::minnum;

        break;

      case Intrinsic::minnum:

        NewIID = Intrinsic::maxnum;

        break;

      case Intrinsic::maximum:

        NewIID = Intrinsic::minimum;

        break;

      case Intrinsic::minimum:

        NewIID = Intrinsic::maximum;

        break;

      default:

        llvm_unreachable("unexpected intrinsic ID");

      }

      Value *NewCall = Builder.CreateBinaryIntrinsic(NewIID, X, Y, II);

      Instruction *FNeg = UnaryOperator::CreateFNeg(NewCall);

      FNeg->copyIRFlags(II);

      return FNeg;

    }


    // m(m(X, C2), C1) -> m(X, C)

    const APFloat *C1, *C2;

    if (auto *M = dyn_cast<IntrinsicInst>(Arg0)) {

      if (M->getIntrinsicID() == IID && match(Arg1, m_APFloat(C1)) &&

          ((match(M->getArgOperand(0), m_Value(X)) &&

            match(M->getArgOperand(1), m_APFloat(C2))) ||

           (match(M->getArgOperand(1), m_Value(X)) &&

            match(M->getArgOperand(0), m_APFloat(C2))))) {

        APFloat Res(0.0);

        switch (IID) {

        case Intrinsic::maxnum:

          Res = maxnum(*C1, *C2);

          break;

        case Intrinsic::minnum:

          Res = minnum(*C1, *C2);

          break;

        case Intrinsic::maximum:

          Res = maximum(*C1, *C2);

          break;

        case Intrinsic::minimum:

          Res = minimum(*C1, *C2);

          break;

        default:

          llvm_unreachable("unexpected intrinsic ID");

        }

        Value *V = Builder.CreateBinaryIntrinsic(

            IID, X, ConstantFP::get(Arg0->getType(), Res), II);

        // TODO: Conservatively intersecting FMF. If Res == C2, the transform

        //       was a simplification (so Arg0 and its original flags could

        //       propagate?)

        if (auto *CI = dyn_cast<CallInst>(V))

          CI->andIRFlags(M);

        return replaceInstUsesWith(*II, V);

      }

    }


    // m((fpext X), (fpext Y)) -> fpext (m(X, Y))

    if (match(Arg0, m_OneUse(m_FPExt(m_Value(X)))) &&

        match(Arg1, m_OneUse(m_FPExt(m_Value(Y)))) &&

        X->getType() == Y->getType()) {

      Value *NewCall =

          Builder.CreateBinaryIntrinsic(IID, X, Y, II, II->getName());

      return new FPExtInst(NewCall, II->getType());

    }


    // max X, -X --> fabs X

    // min X, -X --> -(fabs X)

    // TODO: Remove one-use limitation? That is obviously better for max,

    // hence why we don't check for one-use for that. However,

    // it would be an extra instruction for min (fnabs), but

    // that is still likely better for analysis and codegen.

    auto IsMinMaxOrXNegX = [IID, &X](Value *Op0, Value *Op1) {

      if (match(Op0, m_FNeg(m_Value(X))) && match(Op1, m_Specific(X)))

        return Op0->hasOneUse() ||

               (IID != Intrinsic::minimum && IID != Intrinsic::minnum);

      return false;

    };


    if (IsMinMaxOrXNegX(Arg0, Arg1) || IsMinMaxOrXNegX(Arg1, Arg0)) {

      Value *R = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, X, II);

      if (IID == Intrinsic::minimum || IID == Intrinsic::minnum)

        R = Builder.CreateFNegFMF(R, II);

      return replaceInstUsesWith(*II, R);

    }


    break;

  }

  case Intrinsic::matrix_multiply: {

    // Optimize negation in matrix multiplication.


    // -A * -B -> A * B

    Value *A, *B;

    if (match(II->getArgOperand(0), m_FNeg(m_Value(A))) &&

        match(II->getArgOperand(1), m_FNeg(m_Value(B)))) {

      replaceOperand(*II, 0, A);

      replaceOperand(*II, 1, B);

      return II;

    }


    Value *Op0 = II->getOperand(0);

    Value *Op1 = II->getOperand(1);

    Value *OpNotNeg, *NegatedOp;

    unsigned NegatedOpArg, OtherOpArg;

    if (match(Op0, m_FNeg(m_Value(OpNotNeg)))) {

      NegatedOp = Op0;

      NegatedOpArg = 0;

      OtherOpArg = 1;

    } else if (match(Op1, m_FNeg(m_Value(OpNotNeg)))) {

      NegatedOp = Op1;

      NegatedOpArg = 1;

      OtherOpArg = 0;

    } else

      // Multiplication doesn't have a negated operand.

      break;


    // Only optimize if the negated operand has only one use.

    if (!NegatedOp->hasOneUse())

      break;


    Value *OtherOp = II->getOperand(OtherOpArg);

    VectorType *RetTy = cast<VectorType>(II->getType());

    VectorType *NegatedOpTy = cast<VectorType>(NegatedOp->getType());

    VectorType *OtherOpTy = cast<VectorType>(OtherOp->getType());

    ElementCount NegatedCount = NegatedOpTy->getElementCount();

    ElementCount OtherCount = OtherOpTy->getElementCount();

    ElementCount RetCount = RetTy->getElementCount();

    // (-A) * B -> A * (-B), if it is cheaper to negate B and vice versa.

    if (ElementCount::isKnownGT(NegatedCount, OtherCount) &&

        ElementCount::isKnownLT(OtherCount, RetCount)) {

      Value *InverseOtherOp = Builder.CreateFNeg(OtherOp);

      replaceOperand(*II, NegatedOpArg, OpNotNeg);

      replaceOperand(*II, OtherOpArg, InverseOtherOp);

      return II;

    }

    // (-A) * B -> -(A * B), if it is cheaper to negate the result

    if (ElementCount::isKnownGT(NegatedCount, RetCount)) {

      SmallVector<Value *, 5> NewArgs(II->args());

      NewArgs[NegatedOpArg] = OpNotNeg;

      Instruction *NewMul =

          Builder.CreateIntrinsic(II->getType(), IID, NewArgs, II);

      return replaceInstUsesWith(*II, Builder.CreateFNegFMF(NewMul, II));

    }

    break;

  }

  case Intrinsic::fmuladd: {

    // Canonicalize fast fmuladd to the separate fmul + fadd.

    if (II->isFast()) {

      BuilderTy::FastMathFlagGuard Guard(Builder);

      Builder.setFastMathFlags(II->getFastMathFlags());

      Value *Mul = Builder.CreateFMul(II->getArgOperand(0),

                                      II->getArgOperand(1));

      Value *Add = Builder.CreateFAdd(Mul, II->getArgOperand(2));

      Add->takeName(II);

      return replaceInstUsesWith(*II, Add);

    }


    // Try to simplify the underlying FMul.

    if (Value *V = simplifyFMulInst(II->getArgOperand(0), II->getArgOperand(1),

                                    II->getFastMathFlags(),

                                    SQ.getWithInstruction(II))) {

      auto *FAdd = BinaryOperator::CreateFAdd(V, II->getArgOperand(2));

      FAdd->copyFastMathFlags(II);

      return FAdd;

    }


    [[fallthrough]];

  }

  case Intrinsic::fma: {

    // fma fneg(x), fneg(y), z -> fma x, y, z

    Value *Src0 = II->getArgOperand(0);

    Value *Src1 = II->getArgOperand(1);

    Value *X, *Y;

    if (match(Src0, m_FNeg(m_Value(X))) && match(Src1, m_FNeg(m_Value(Y)))) {

      replaceOperand(*II, 0, X);

      replaceOperand(*II, 1, Y);

      return II;

    }


    // fma fabs(x), fabs(x), z -> fma x, x, z

    if (match(Src0, m_FAbs(m_Value(X))) &&

        match(Src1, m_FAbs(m_Specific(X)))) {

      replaceOperand(*II, 0, X);

      replaceOperand(*II, 1, X);

      return II;

    }


    // Try to simplify the underlying FMul. We can only apply simplifications

    // that do not require rounding.

    if (Value *V = simplifyFMAFMul(II->getArgOperand(0), II->getArgOperand(1),

                                   II->getFastMathFlags(),

                                   SQ.getWithInstruction(II))) {

      auto *FAdd = BinaryOperator::CreateFAdd(V, II->getArgOperand(2));

      FAdd->copyFastMathFlags(II);

      return FAdd;

    }


    // fma x, y, 0 -> fmul x, y

    // This is always valid for -0.0, but requires nsz for +0.0 as

    // -0.0 + 0.0 = 0.0, which would not be the same as the fmul on its own.

    if (match(II->getArgOperand(2), m_NegZeroFP()) ||

        (match(II->getArgOperand(2), m_PosZeroFP()) &&

         II->getFastMathFlags().noSignedZeros()))

      return BinaryOperator::CreateFMulFMF(Src0, Src1, II);


    break;

  }

  case Intrinsic::copysign: {

    Value *Mag = II->getArgOperand(0), *Sign = II->getArgOperand(1);

    if (std::optional<bool> KnownSignBit = computeKnownFPSignBit(

            Sign, /*Depth=*/0, getSimplifyQuery().getWithInstruction(II))) {

      if (*KnownSignBit) {

        // If we know that the sign argument is negative, reduce to FNABS:

        // copysign Mag, -Sign --> fneg (fabs Mag)

        Value *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, Mag, II);

        return replaceInstUsesWith(*II, Builder.CreateFNegFMF(Fabs, II));

      }


      // If we know that the sign argument is positive, reduce to FABS:

      // copysign Mag, +Sign --> fabs Mag

      Value *Fabs = Builder.CreateUnaryIntrinsic(Intrinsic::fabs, Mag, II);

      return replaceInstUsesWith(*II, Fabs);

    }


    // Propagate sign argument through nested calls:

    // copysign Mag, (copysign ?, X) --> copysign Mag, X

    Value *X;

    if (match(Sign, m_Intrinsic<Intrinsic::copysign>(m_Value(), m_Value(X))))

      return replaceOperand(*II, 1, X);


    // Clear sign-bit of constant magnitude:

    // copysign -MagC, X --> copysign MagC, X

    // TODO: Support constant folding for fabs

    const APFloat *MagC;

    if (match(Mag, m_APFloat(MagC)) && MagC->isNegative()) {

      APFloat PosMagC = *MagC;

      PosMagC.clearSign();

      return replaceOperand(*II, 0, ConstantFP::get(Mag->getType(), PosMagC));

    }


    // Peek through changes of magnitude's sign-bit. This call rewrites those:

    // copysign (fabs X), Sign --> copysign X, Sign

    // copysign (fneg X), Sign --> copysign X, Sign

    if (match(Mag, m_FAbs(m_Value(X))) || match(Mag, m_FNeg(m_Value(X))))

      return replaceOperand(*II, 0, X);


    break;

  }

  case Intrinsic::fabs: {

    Value *Cond, *TVal, *FVal;

    if (match(II->getArgOperand(0),

              m_Select(m_Value(Cond), m_Value(TVal), m_Value(FVal)))) {

      // fabs (select Cond, TrueC, FalseC) --> select Cond, AbsT, AbsF

      if (isa<Constant>(TVal) || isa<Constant>(FVal)) {

        CallInst *AbsT = Builder.CreateCall(II->getCalledFunction(), {TVal});

        CallInst *AbsF = Builder.CreateCall(II->getCalledFunction(), {FVal});

        SelectInst *SI = SelectInst::Create(Cond, AbsT, AbsF);

        FastMathFlags FMF1 = II->getFastMathFlags();

        FastMathFlags FMF2 =

            cast<SelectInst>(II->getArgOperand(0))->getFastMathFlags();

        FMF2.setNoSignedZeros(false);

        SI->setFastMathFlags(FMF1 | FMF2);

        return SI;

      }

      // fabs (select Cond, -FVal, FVal) --> fabs FVal

      if (match(TVal, m_FNeg(m_Specific(FVal))))

        return replaceOperand(*II, 0, FVal);

      // fabs (select Cond, TVal, -TVal) --> fabs TVal

      if (match(FVal, m_FNeg(m_Specific(TVal))))

        return replaceOperand(*II, 0, TVal);

    }


    Value *Magnitude, *Sign;

    if (match(II->getArgOperand(0),

              m_CopySign(m_Value(Magnitude), m_Value(Sign)))) {

      // fabs (copysign x, y) -> (fabs x)

      CallInst *AbsSign =

          Builder.CreateCall(II->getCalledFunction(), {Magnitude});

      AbsSign->copyFastMathFlags(II);

      return replaceInstUsesWith(*II, AbsSign);

    }


    [[fallthrough]];

  }

  case Intrinsic::ceil:

  case Intrinsic::floor:

  case Intrinsic::round:

  case Intrinsic::roundeven:

  case Intrinsic::nearbyint:

  case Intrinsic::rint:

  case Intrinsic::trunc: {

    Value *ExtSrc;

    if (match(II->getArgOperand(0), m_OneUse(m_FPExt(m_Value(ExtSrc))))) {

      // Narrow the call: intrinsic (fpext x) -> fpext (intrinsic x)

      Value *NarrowII = Builder.CreateUnaryIntrinsic(IID, ExtSrc, II);

      return new FPExtInst(NarrowII, II->getType());

    }

    break;

  }

  case Intrinsic::cos:

  case Intrinsic::amdgcn_cos: {

    Value *X, *Sign;

    Value *Src = II->getArgOperand(0);

    if (match(Src, m_FNeg(m_Value(X))) || match(Src, m_FAbs(m_Value(X))) ||

        match(Src, m_CopySign(m_Value(X), m_Value(Sign)))) {

      // cos(-x) --> cos(x)

      // cos(fabs(x)) --> cos(x)

      // cos(copysign(x, y)) --> cos(x)

      return replaceOperand(*II, 0, X);

    }

    break;

  }

  case Intrinsic::sin: {

    Value *X;

    if (match(II->getArgOperand(0), m_OneUse(m_FNeg(m_Value(X))))) {

      // sin(-x) --> -sin(x)

      Value *NewSin = Builder.CreateUnaryIntrinsic(Intrinsic::sin, X, II);

      Instruction *FNeg = UnaryOperator::CreateFNeg(NewSin);

      FNeg->copyFastMathFlags(II);

      return FNeg;

    }

    break;

  }

  case Intrinsic::ldexp: {

    // ldexp(ldexp(x, a), b) -> ldexp(x, a + b)

    //

    // The danger is if the first ldexp would overflow to infinity or underflow

    // to zero, but the combined exponent avoids it. We ignore this with

    // reassoc.

    //

    // It's also safe to fold if we know both exponents are >= 0 or <= 0 since

    // it would just double down on the overflow/underflow which would occur

    // anyway.

    //

    // TODO: Could do better if we had range tracking for the input value

    // exponent. Also could broaden sign check to cover == 0 case.

    Value *Src = II->getArgOperand(0);

    Value *Exp = II->getArgOperand(1);

    Value *InnerSrc;

    Value *InnerExp;

    if (match(Src, m_OneUse(m_Intrinsic<Intrinsic::ldexp>(

                       m_Value(InnerSrc), m_Value(InnerExp)))) &&

        Exp->getType() == InnerExp->getType()) {

      FastMathFlags FMF = II->getFastMathFlags();

      FastMathFlags InnerFlags = cast<FPMathOperator>(Src)->getFastMathFlags();


      if ((FMF.allowReassoc() && InnerFlags.allowReassoc()) ||

          signBitMustBeTheSame(Exp, InnerExp, II, DL, &AC, &DT)) {

        // TODO: Add nsw/nuw probably safe if integer type exceeds exponent

        // width.

        Value *NewExp = Builder.CreateAdd(InnerExp, Exp);

        II->setArgOperand(1, NewExp);

        II->setFastMathFlags(InnerFlags); // Or the inner flags.

        return replaceOperand(*II, 0, InnerSrc);

      }

    }


    break;

  }

  case Intrinsic::ptrauth_auth:

  case Intrinsic::ptrauth_resign: {

    // (sign|resign) + (auth|resign) can be folded by omitting the middle

    // sign+auth component if the key and discriminator match.

    bool NeedSign = II->getIntrinsicID() == Intrinsic::ptrauth_resign;

    Value *Key = II->getArgOperand(1);

    Value *Disc = II->getArgOperand(2);


    // AuthKey will be the key we need to end up authenticating against in

    // whatever we replace this sequence with.

    Value *AuthKey = nullptr, *AuthDisc = nullptr, *BasePtr;

    if (auto CI = dyn_cast<CallBase>(II->getArgOperand(0))) {

      BasePtr = CI->getArgOperand(0);

      if (CI->getIntrinsicID() == Intrinsic::ptrauth_sign) {

        if (CI->getArgOperand(1) != Key || CI->getArgOperand(2) != Disc)

          break;

      } else if (CI->getIntrinsicID() == Intrinsic::ptrauth_resign) {

        if (CI->getArgOperand(3) != Key || CI->getArgOperand(4) != Disc)

          break;

        AuthKey = CI->getArgOperand(1);

        AuthDisc = CI->getArgOperand(2);

      } else

        break;

    } else

      break;


    unsigned NewIntrin;

    if (AuthKey && NeedSign) {

      // resign(0,1) + resign(1,2) = resign(0, 2)

      NewIntrin = Intrinsic::ptrauth_resign;

    } else if (AuthKey) {

      // resign(0,1) + auth(1) = auth(0)

      NewIntrin = Intrinsic::ptrauth_auth;

    } else if (NeedSign) {

      // sign(0) + resign(0, 1) = sign(1)

      NewIntrin = Intrinsic::ptrauth_sign;

    } else {

      // sign(0) + auth(0) = nop

      replaceInstUsesWith(*II, BasePtr);

      eraseInstFromFunction(*II);

      return nullptr;

    }


    SmallVector<Value *, 4> CallArgs;

    CallArgs.push_back(BasePtr);

    if (AuthKey) {

      CallArgs.push_back(AuthKey);

      CallArgs.push_back(AuthDisc);

    }


    if (NeedSign) {

      CallArgs.push_back(II->getArgOperand(3));

      CallArgs.push_back(II->getArgOperand(4));

    }


    Function *NewFn = Intrinsic::getDeclaration(II->getModule(), NewIntrin);

    return CallInst::Create(NewFn, CallArgs);

  }

  case Intrinsic::arm_neon_vtbl1:

  case Intrinsic::aarch64_neon_tbl1:

    if (Value *V = simplifyNeonTbl1(*II, Builder))

      return replaceInstUsesWith(*II, V);

    break;


  case Intrinsic::arm_neon_vmulls:

  case Intrinsic::arm_neon_vmullu:

  case Intrinsic::aarch64_neon_smull:

  case Intrinsic::aarch64_neon_umull: {

    Value *Arg0 = II->getArgOperand(0);

    Value *Arg1 = II->getArgOperand(1);


    // Handle mul by zero first:

    if (isa<ConstantAggregateZero>(Arg0) || isa<ConstantAggregateZero>(Arg1)) {

      return replaceInstUsesWith(CI, ConstantAggregateZero::get(II->getType()));

    }


    // Check for constant LHS & RHS - in this case we just simplify.

    bool Zext = (IID == Intrinsic::arm_neon_vmullu ||

                 IID == Intrinsic::aarch64_neon_umull);

    VectorType *NewVT = cast<VectorType>(II->getType());

    if (Constant *CV0 = dyn_cast<Constant>(Arg0)) {

      if (Constant *CV1 = dyn_cast<Constant>(Arg1)) {

        Value *V0 = Builder.CreateIntCast(CV0, NewVT, /*isSigned=*/!Zext);

        Value *V1 = Builder.CreateIntCast(CV1, NewVT, /*isSigned=*/!Zext);

        return replaceInstUsesWith(CI, Builder.CreateMul(V0, V1));

      }


      // Couldn't simplify - canonicalize constant to the RHS.

      std::swap(Arg0, Arg1);

    }


    // Handle mul by one:

    if (Constant *CV1 = dyn_cast<Constant>(Arg1))

      if (ConstantInt *Splat =

              dyn_cast_or_null<ConstantInt>(CV1->getSplatValue()))

        if (Splat->isOne())

          return CastInst::CreateIntegerCast(Arg0, II->getType(),

                                             /*isSigned=*/!Zext);


    break;

  }

  case Intrinsic::arm_neon_aesd:

  case Intrinsic::arm_neon_aese:

  case Intrinsic::aarch64_crypto_aesd:

  case Intrinsic::aarch64_crypto_aese: {

    Value *DataArg = II->getArgOperand(0);

    Value *KeyArg  = II->getArgOperand(1);


    // Try to use the builtin XOR in AESE and AESD to eliminate a prior XOR

    Value *Data, *Key;

    if (match(KeyArg, m_ZeroInt()) &&

        match(DataArg, m_Xor(m_Value(Data), m_Value(Key)))) {

      replaceOperand(*II, 0, Data);

      replaceOperand(*II, 1, Key);

      return II;

    }

    break;

  }

  case Intrinsic::hexagon_V6_vandvrt:

  case Intrinsic::hexagon_V6_vandvrt_128B: {

    // Simplify Q -> V -> Q conversion.

    if (auto Op0 = dyn_cast<IntrinsicInst>(II->getArgOperand(0))) {

      Intrinsic::ID ID0 = Op0->getIntrinsicID();

      if (ID0 != Intrinsic::hexagon_V6_vandqrt &&

          ID0 != Intrinsic::hexagon_V6_vandqrt_128B)

        break;

      Value *Bytes = Op0->getArgOperand(1), *Mask = II->getArgOperand(1);

      uint64_t Bytes1 = computeKnownBits(Bytes, 0, Op0).One.getZExtValue();

      uint64_t Mask1 = computeKnownBits(Mask, 0, II).One.getZExtValue();

      // Check if every byte has common bits in Bytes and Mask.

      uint64_t C = Bytes1 & Mask1;

      if ((C & 0xFF) && (C & 0xFF00) && (C & 0xFF0000) && (C & 0xFF000000))

        return replaceInstUsesWith(*II, Op0->getArgOperand(0));

    }

    break;

  }

  case Intrinsic::stackrestore: {

    // Categories assigned by the Classify lambda below to each instruction
    // that is scanned around a stackrestore.

    enum class ClassifyResult {

      // Neither an alloca nor a call, or an intrinsic call (other than
      // stackrestore) for which mayHaveSideEffects() is false.

      None,

      // An AllocaInst.

      Alloca,

      // A call to the stackrestore intrinsic.

      StackRestore,

      // Any non-intrinsic call, or an intrinsic call for which
      // mayHaveSideEffects() is true.

      CallWithSideEffects,

    };

    // Sort an instruction into one of the ClassifyResult categories:
    //   - allocas                                   -> Alloca
    //   - calls to the stackrestore intrinsic       -> StackRestore
    //   - non-intrinsic calls, and intrinsic calls
    //     that may have side effects                -> CallWithSideEffects
    //   - everything else                           -> None
    auto Classify = [](const Instruction *I) {
      if (isa<AllocaInst>(I))
        return ClassifyResult::Alloca;

      // Anything that is not a call instruction is uninteresting here.
      const auto *Call = dyn_cast<CallInst>(I);
      if (!Call)
        return ClassifyResult::None;

      // Consider all non-intrinsic calls to be side effects.
      const auto *Intrin = dyn_cast<IntrinsicInst>(Call);
      if (!Intrin)
        return ClassifyResult::CallWithSideEffects;

      if (Intrin->getIntrinsicID() == Intrinsic::stackrestore)
        return ClassifyResult::StackRestore;

      return Intrin->mayHaveSideEffects() ? ClassifyResult::CallWithSideEffects
                                          : ClassifyResult::None;
    };


    // If the stacksave and the stackrestore are in the same BB, and there is

    // no intervening call, alloca, or stackrestore of a different stacksave,

    // remove the restore. This can happen when variable allocas are DCE'd.

    if (IntrinsicInst *SS = dyn_cast<IntrinsicInst>(II->getArgOperand(0))) {

      if (SS->getIntrinsicID() == Intrinsic::stacksave &&

          SS->getParent() == II->getParent()) {

        BasicBlock::iterator BI(SS);

        bool CannotRemove = false;

        for (++BI; &*BI != II; ++BI) {

          switch (Classify(&*BI)) {

          case ClassifyResult::None:

            // So far so good, look at next instructions.

            break;


          case ClassifyResult::StackRestore:

            // If we found an intervening stackrestore for a different

            // stacksave, we can't remove the stackrestore. Otherwise, continue.

            if (cast<IntrinsicInst>(*BI).getArgOperand(0) != SS)

              CannotRemove = true;

            break;


          case ClassifyResult::Alloca:

          case ClassifyResult::CallWithSideEffects:

            // If we found an alloca, a non-intrinsic call, or an intrinsic

            // call with side effects, we can't remove the stackrestore.

            CannotRemove = true;

            break;

          }

          if (CannotRemove)

            break;

        }


        if (!CannotRemove)

          return eraseInstFromFunction(CI);

      }

    }


    // Scan down this block to see if there is another stack restore in the

    // same block without an intervening call/alloca.

    BasicBlock::iterator BI(II);

    Instruction *TI = II->getParent()->getTerminator();

    bool CannotRemove = false;

    for (++BI; &*BI != TI; ++BI) {

      switch (Classify(&*BI)) {

      case ClassifyResult::None:

        // So far so good, look at next instructions.

        break;


      case ClassifyResult::StackRestore:

        // If there is a stackrestore below this one, remove this one.

        return eraseInstFromFunction(CI);


      case ClassifyResult::Alloca:

      case ClassifyResult::CallWithSideEffects:

        // If we found an alloca, a non-intrinsic call, or an intrinsic call

        // with side effects (such as llvm.stacksave and llvm.read_register),

        // we can't remove the stack restore.

        CannotRemove = true;

        break;

      }

      if (CannotRemove)

        break;

    }


    // If the stack restore is in a return, resume, or unwind block and if there

    // are no allocas or calls between the restore and the return, nuke the

    // restore.

    if (!CannotRemove && (isa<ReturnInst>(TI) || isa<ResumeInst>(TI)))

      return eraseInstFromFunction(CI);

    break;

  }

  case Intrinsic::lifetime_end:

    // Asan needs to poison memory to detect invalid access which is possible

    // even for empty lifetime range.

    if (II->getFunction()->hasFnAttribute(Attribute::SanitizeAddress) ||

        II->getFunction()->hasFnAttribute(Attribute::SanitizeMemory) ||

        II->getFunction()->hasFnAttribute(Attribute::SanitizeHWAddress))

      break;


    if (removeTriviallyEmptyRange(*II, *this, [](const IntrinsicInst &I) {

          return I.getIntrinsicID() == Intrinsic::lifetime_start;

        }))

      return nullptr;

    break;

  case Intrinsic::assume: {

    Value *IIOperand = II->getArgOperand(0);

    SmallVector<OperandBundleDef, 4> OpBundles;

    II->getOperandBundlesAsDefs(OpBundles);


    /// Drop the boolean condition from the assume currently being visited
    /// and remove that assume entirely if it then carries no information.
    ///
    /// If the visited assume has an empty operand bundle it is erased;
    /// otherwise its condition operand is replaced with `true` so that the
    /// bundle knowledge is kept. The result is meant to be returned directly
    /// by the caller.
    ///
    /// NOTE(review): the \p Assume argument is only checked by the assert;
    /// the body always operates on the captured II / CI, even when a
    /// different assume (e.g. the following instruction) is passed in.
    /// Presumably CI and II refer to the same call - confirm before relying
    /// on the parameter.
    auto RemoveConditionFromAssume = [&](Instruction *Assume) -> Instruction * {
      assert(isa<AssumeInst>(Assume));
      auto *VisitedAssume = cast<AssumeInst>(II);
      if (!isAssumeWithEmptyBundle(*VisitedAssume)) {
        // Bundles still carry knowledge: keep the call, neutralize the
        // condition.
        Use &CondUse = II->getOperandUse(0);
        replaceUse(CondUse, ConstantInt::getTrue(II->getContext()));
        return nullptr;
      }
      return eraseInstFromFunction(CI);
    };

    // Remove an assume if it is followed by an identical assume.

    // TODO: Do we need this? Unless there are conflicting assumptions, the

    // computeKnownBits(IIOperand) below here eliminates redundant assumes.

    Instruction *Next = II->getNextNonDebugInstruction();

    if (match(Next, m_Intrinsic<Intrinsic::assume>(m_Specific(IIOperand))))

      return RemoveConditionFromAssume(Next);


    // Canonicalize assume(a && b) -> assume(a); assume(b);

    // Note: New assumption intrinsics created here are registered by

    // the InstCombineIRInserter object.

    FunctionType *AssumeIntrinsicTy = II->getFunctionType();

    Value *AssumeIntrinsic = II->getCalledOperand();

    Value *A, *B;

    if (match(IIOperand, m_LogicalAnd(m_Value(A), m_Value(B)))) {

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic, A, OpBundles,

                         II->getName());

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic, B, II->getName());

      return eraseInstFromFunction(*II);

    }

    // assume(!(a || b)) -> assume(!a); assume(!b);

    if (match(IIOperand, m_Not(m_LogicalOr(m_Value(A), m_Value(B))))) {

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic,

                         Builder.CreateNot(A), OpBundles, II->getName());

      Builder.CreateCall(AssumeIntrinsicTy, AssumeIntrinsic,

                         Builder.CreateNot(B), II->getName());

      return eraseInstFromFunction(*II);

    }


    // assume( (load addr) != null ) -> add 'nonnull' metadata to load

    // (if assume is valid at the load)

    CmpInst::Predicate Pred;

    Instruction *LHS;

    if (match(IIOperand, m_ICmp(Pred, m_Instruction(LHS), m_Zero())) &&

        Pred == ICmpInst::ICMP_NE && LHS->getOpcode() == Instruction::Load &&

        LHS->getType()->isPointerTy() &&

        isValidAssumeForContext(II, LHS, &DT)) {

      MDNode *MD = MDNode::get(II->getContext(), std::nullopt);

      LHS->setMetadata(LLVMContext::MD_nonnull, MD);

      LHS->setMetadata(LLVMContext::MD_noundef, MD);

      return RemoveConditionFromAssume(II);


      // TODO: apply nonnull return attributes to calls and invokes

      // TODO: apply range metadata for range check patterns?

    }


    // Separate storage assumptions apply to the underlying allocations, not any

    // particular pointer within them. When evaluating the hints for AA purposes

    // we getUnderlyingObject them; by precomputing the answers here we can

    // avoid having to do so repeatedly there.

    for (unsigned Idx = 0; Idx < II->getNumOperandBundles(); Idx++) {

      OperandBundleUse OBU = II->getOperandBundleAt(Idx);

      if (OBU.getTagName() == "separate_storage") {

        assert(OBU.Inputs.size() == 2);

        // Rewrite a separate_storage bundle input to the underlying object
        // it is based on, if that differs from the value currently used.
        auto MaybeSimplifyHint = [&](const Use &U) {
          Value *Original = U.get();
          // Not having a limit is safe because InstCombine removes unreachable
          // code.
          Value *Base = getUnderlyingObject(Original, /*MaxLookup*/ 0);
          if (Base == Original)
            return;
          replaceUse(const_cast<Use &>(U), Base);
        };

        MaybeSimplifyHint(OBU.Inputs[0]);

        MaybeSimplifyHint(OBU.Inputs[1]);

      }

    }


    // Convert nonnull assume like:

    // %A = icmp ne i32* %PTR, null

    // call void @llvm.assume(i1 %A)

    // into

    // call void @llvm.assume(i1 true) [ "nonnull"(i32* %PTR) ]

    if (EnableKnowledgeRetention &&

        match(IIOperand, m_Cmp(Pred, m_Value(A), m_Zero())) &&

        Pred == CmpInst::ICMP_NE && A->getType()->isPointerTy()) {

      if (auto *Replacement = buildAssumeFromKnowledge(

              {RetainedKnowledge{Attribute::NonNull, 0, A}}, Next, &AC, &DT)) {


        Replacement->insertBefore(Next);

        AC.registerAssumption(Replacement);

        return RemoveConditionFromAssume(II);

      }

    }


    // Convert alignment assume like:

    // %B = ptrtoint i32* %A to i64

    // %C = and i64 %B, Constant

    // %D = icmp eq i64 %C, 0

    // call void @llvm.assume(i1 %D)

    // into

    // call void @llvm.assume(i1 true) [ "align"(i32* [[A]], i64  Constant + 1)]

    uint64_t AlignMask;

    if (EnableKnowledgeRetention &&

        match(IIOperand,

              m_Cmp(Pred, m_And(m_Value(A), m_ConstantInt(AlignMask)),

                    m_Zero())) &&

        Pred == CmpInst::ICMP_EQ) {

      if (isPowerOf2_64(AlignMask + 1)) {

        uint64_t Offset = 0;

        match(A, m_Add(m_Value(A), m_ConstantInt(Offset)));

        if (match(A, m_PtrToInt(m_Value(A)))) {

          /// Note: this doesn't preserve the offset information but merges

          /// offset and alignment.

          /// TODO: we can generate a GEP instead of merging the alignment with

          /// the offset.

          RetainedKnowledge RK{Attribute::Alignment,

                               (unsigned)MinAlign(Offset, AlignMask + 1), A};

          if (auto *Replacement =

                  buildAssumeFromKnowledge(RK, Next, &AC, &DT)) {


            Replacement->insertAfter(II);

            AC.registerAssumption(Replacement);

          }

          return RemoveConditionFromAssume(II);

        }

      }

    }


    /// Canonicalize Knowledge in operand bundles.

    if (EnableKnowledgeRetention && II->hasOperandBundles()) {

      for (unsigned Idx = 0; Idx < II->getNumOperandBundles(); Idx++) {

        auto &BOI = II->bundle_op_info_begin()[Idx];

        RetainedKnowledge RK =

          llvm::getKnowledgeFromBundle(cast<AssumeInst>(*II), BOI);

        if (BOI.End - BOI.Begin > 2)

          continue; // Prevent reducing knowledge in an align with offset since

                    // extracting a RetainedKnowledge from them loses offset

                    // information

        RetainedKnowledge CanonRK =

          llvm::simplifyRetainedKnowledge(cast<AssumeInst>(II), RK,

                                          &getAssumptionCache(),

                                          &getDominatorTree());

        if (CanonRK == RK)

          continue;

        if (!CanonRK) {

          if (BOI.End - BOI.Begin > 0) {

            Worklist.pushValue(II->op_begin()[BOI.Begin]);

            Value::dropDroppableUse(II->op_begin()[BOI.Begin]);

          }

          continue;

        }

        assert(RK.AttrKind == CanonRK.AttrKind);

        if (BOI.End - BOI.Begin > 0)

          II->op_begin()[BOI.Begin].set(CanonRK.WasOn);

        if (BOI.End - BOI.Begin > 1)

          II->op_begin()[BOI.Begin + 1].set(ConstantInt::get(

              Type::getInt64Ty(II->getContext()), CanonRK.ArgValue));

        if (RK.WasOn)

          Worklist.pushValue(RK.WasOn);

        return II;

      }

    }


    // If there is a dominating assume with the same condition as this one,

    // then this one is redundant, and should be removed.

    KnownBits Known(1);

    computeKnownBits(IIOperand, Known, 0, II);

    if (Known.isAllOnes() && isAssumeWithEmptyBundle(cast<AssumeInst>(*II)))

      return eraseInstFromFunction(*II);


    // assume(false) is unreachable.

    if (match(IIOperand, m_CombineOr(m_Zero(), m_Undef()))) {

      CreateNonTerminatorUnreachable(II);

      return eraseInstFromFunction(*II);

    }


    // Update the cache of affected values for this assumption (we might be

    // here because we just simplified the condition).

    AC.updateAffectedValues(cast<AssumeInst>(II));

    break;

  }

  case Intrinsic::experimental_guard: {

    // Is this guard followed by another guard?  We scan forward over a small

    // fixed window of instructions to handle common cases with conditions

    // computed between guards.

    Instruction *NextInst = II->getNextNonDebugInstruction();

    for (unsigned i = 0; i < GuardWideningWindow; i++) {

      // Note: Using context-free form to avoid compile time blow up

      if (!isSafeToSpeculativelyExecute(NextInst))

        break;

      NextInst = NextInst->getNextNonDebugInstruction();

    }

    Value *NextCond = nullptr;

    if (match(NextInst,

              m_Intrinsic<Intrinsic::experimental_guard>(m_Value(NextCond)))) {

      Value *CurrCond = II->getArgOperand(0);


      // Remove a guard that is immediately preceded by an identical guard.

      // Otherwise canonicalize guard(a); guard(b) -> guard(a & b).

      if (CurrCond != NextCond) {

        Instruction *MoveI = II->getNextNonDebugInstruction();

        while (MoveI != NextInst) {

          auto *Temp = MoveI;

          MoveI = MoveI->getNextNonDebugInstruction();

          Temp->moveBefore(II);

        }

        replaceOperand(*II, 0, Builder.CreateAnd(CurrCond, NextCond));

      }

      eraseInstFromFunction(*NextInst);

      return II;

    }

    break;

  }

  case Intrinsic::vector_insert: {

    Value *Vec = II->getArgOperand(0);

    Value *SubVec = II->getArgOperand(1);

    Value *Idx = II->getArgOperand(2);

    auto *DstTy = dyn_cast<FixedVectorType>(II->getType());

    auto *VecTy = dyn_cast<FixedVectorType>(Vec->getType());

    auto *SubVecTy = dyn_cast<FixedVectorType>(SubVec->getType());


    // Only canonicalize if the destination vector, Vec, and SubVec are all

    // fixed vectors.

    if (DstTy && VecTy && SubVecTy) {

      unsigned DstNumElts = DstTy->getNumElements();

      unsigned VecNumElts = VecTy->getNumElements();

      unsigned SubVecNumElts = SubVecTy->getNumElements();

      unsigned IdxN = cast<ConstantInt>(Idx)->getZExtValue();


      // An insert that entirely overwrites Vec with SubVec is a nop.

      if (VecNumElts == SubVecNumElts)

        return replaceInstUsesWith(CI, SubVec);


      // Widen SubVec into a vector of the same width as Vec, since

      // shufflevector requires the two input vectors to be the same width.

      // Elements beyond the bounds of SubVec within the widened vector are

      // undefined.

      SmallVector<int, 8> WidenMask;

      unsigned i;

      for (i = 0; i != SubVecNumElts; ++i)

        WidenMask.push_back(i);

      for (; i != VecNumElts; ++i)

        WidenMask.push_back(PoisonMaskElem);


      Value *WidenShuffle = Builder.CreateShuffleVector(SubVec, WidenMask);


      SmallVector<int, 8> Mask;

      for (unsigned i = 0; i != IdxN; ++i)

        Mask.push_back(i);

      for (unsigned i = DstNumElts; i != DstNumElts + SubVecNumElts; ++i)

        Mask.push_back(i);

      for (unsigned i = IdxN + SubVecNumElts; i != DstNumElts; ++i)

        Mask.push_back(i);


      Value *Shuffle = Builder.CreateShuffleVector(Vec, WidenShuffle, Mask);

      return replaceInstUsesWith(CI, Shuffle);

    }

    break;

  }

  case Intrinsic::vector_extract: {

    Value *Vec = II->getArgOperand(0);

    Value *Idx = II->getArgOperand(1);


    Type *ReturnType = II->getType();

    // (extract_vector (insert_vector InsertTuple, InsertValue, InsertIdx),

    // ExtractIdx)

    unsigned ExtractIdx = cast<ConstantInt>(Idx)->getZExtValue();

    Value *InsertTuple, *InsertIdx, *InsertValue;

    if (match(Vec, m_Intrinsic<Intrinsic::vector_insert>(m_Value(InsertTuple),

                                                         m_Value(InsertValue),

                                                         m_Value(InsertIdx))) &&

        InsertValue->getType() == ReturnType) {

      unsigned Index = cast<ConstantInt>(InsertIdx)->getZExtValue();

      // Case where we get the same index right after setting it.

      // extract.vector(insert.vector(InsertTuple, InsertValue, Idx), Idx) -->

      // InsertValue

      if (ExtractIdx == Index)

        return replaceInstUsesWith(CI, InsertValue);

      // If we are getting a different index than what was set in the
      // insert.vector intrinsic, we can just set the input tuple to the one up
      // in the chain:
      // extract.vector(insert.vector(InsertTuple, InsertValue, InsertIndex),
      //                ExtractIndex)
      // --> extract.vector(InsertTuple, ExtractIndex)

      else

        return replaceOperand(CI, 0, InsertTuple);

    }


    auto *DstTy = dyn_cast<VectorType>(ReturnType);

    auto *VecTy = dyn_cast<VectorType>(Vec->getType());


    if (DstTy && VecTy) {

      auto DstEltCnt = DstTy->getElementCount();

      auto VecEltCnt = VecTy->getElementCount();

      unsigned IdxN = cast<ConstantInt>(Idx)->getZExtValue();


      // Extracting the entirety of Vec is a nop.

      if (DstEltCnt == VecTy->getElementCount()) {

        replaceInstUsesWith(CI, Vec);

        return eraseInstFromFunction(CI);

      }


      // Only canonicalize to shufflevector if the destination vector and

      // Vec are fixed vectors.

      if (VecEltCnt.isScalable() || DstEltCnt.isScalable())

        break;


      SmallVector<int, 8> Mask;

      for (unsigned i = 0; i != DstEltCnt.getKnownMinValue(); ++i)

        Mask.push_back(IdxN + i);


      Value *Shuffle = Builder.CreateShuffleVector(Vec, Mask);

      return replaceInstUsesWith(CI, Shuffle);

    }

    break;

  }

  case Intrinsic::vector_reverse: {

    Value *BO0, *BO1, *X, *Y;

    Value *Vec = II->getArgOperand(0);

    if (match(Vec, m_OneUse(m_BinOp(m_Value(BO0), m_Value(BO1))))) {

      auto *OldBinOp = cast<BinaryOperator>(Vec);

      if (match(BO0, m_VecReverse(m_Value(X)))) {

        // rev(binop rev(X), rev(Y)) --> binop X, Y

        if (match(BO1, m_VecReverse(m_Value(Y))))

          return replaceInstUsesWith(CI, BinaryOperator::CreateWithCopiedFlags(

                                             OldBinOp->getOpcode(), X, Y,

                                             OldBinOp, OldBinOp->getName(),

                                             II->getIterator()));

        // rev(binop rev(X), BO1Splat) --> binop X, BO1Splat

        if (isSplatValue(BO1))

          return replaceInstUsesWith(CI, BinaryOperator::CreateWithCopiedFlags(

                                             OldBinOp->getOpcode(), X, BO1,

                                             OldBinOp, OldBinOp->getName(),

                                             II->getIterator()));

      }

      // rev(binop BO0Splat, rev(Y)) --> binop BO0Splat, Y

      if (match(BO1, m_VecReverse(m_Value(Y))) && isSplatValue(BO0))

        return replaceInstUsesWith(CI,

                                   BinaryOperator::CreateWithCopiedFlags(

                                       OldBinOp->getOpcode(), BO0, Y, OldBinOp,

                                       OldBinOp->getName(), II->getIterator()));

    }

    // rev(unop rev(X)) --> unop X

    if (match(Vec, m_OneUse(m_UnOp(m_VecReverse(m_Value(X)))))) {

      auto *OldUnOp = cast<UnaryOperator>(Vec);

      auto *NewUnOp = UnaryOperator::CreateWithCopiedFlags(

          OldUnOp->getOpcode(), X, OldUnOp, OldUnOp->getName(),

          II->getIterator());

      return replaceInstUsesWith(CI, NewUnOp);

    }

    break;

  }

  case Intrinsic::vector_reduce_or:

  case Intrinsic::vector_reduce_and: {

    // Canonicalize logical or/and reductions:

    // Or reduction for i1 is represented as:

    // %val = bitcast <ReduxWidth x i1> to iReduxWidth

    // %res = cmp ne iReduxWidth %val, 0

    // And reduction for i1 is represented as:

    // %val = bitcast <ReduxWidth x i1> to iReduxWidth

    // %res = cmp eq iReduxWidth %val, 11111

    Value *Arg = II->getArgOperand(0);

    Value *Vect;

    if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

      if (auto *FTy = dyn_cast<FixedVectorType>(Vect->getType()))

        if (FTy->getElementType() == Builder.getInt1Ty()) {

          Value *Res = Builder.CreateBitCast(

              Vect, Builder.getIntNTy(FTy->getNumElements()));

          if (IID == Intrinsic::vector_reduce_and) {

            Res = Builder.CreateICmpEQ(

                Res, ConstantInt::getAllOnesValue(Res->getType()));

          } else {

            assert(IID == Intrinsic::vector_reduce_or &&

                   "Expected or reduction.");

            Res = Builder.CreateIsNotNull(Res);

          }

          if (Arg != Vect)

            Res = Builder.CreateCast(cast<CastInst>(Arg)->getOpcode(), Res,

                                     II->getType());

          return replaceInstUsesWith(CI, Res);

        }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_add: {

    if (IID == Intrinsic::vector_reduce_add) {

      // Convert vector_reduce_add(ZExt(<n x i1>)) to

      // ZExtOrTrunc(ctpop(bitcast <n x i1> to in)).

      // Convert vector_reduce_add(SExt(<n x i1>)) to

      // -ZExtOrTrunc(ctpop(bitcast <n x i1> to in)).

      // Convert vector_reduce_add(<n x i1>) to

      // Trunc(ctpop(bitcast <n x i1> to in)).

      Value *Arg = II->getArgOperand(0);

      Value *Vect;

      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *FTy = dyn_cast<FixedVectorType>(Vect->getType()))

          if (FTy->getElementType() == Builder.getInt1Ty()) {

            Value *V = Builder.CreateBitCast(

                Vect, Builder.getIntNTy(FTy->getNumElements()));

            Value *Res = Builder.CreateUnaryIntrinsic(Intrinsic::ctpop, V);

            if (Res->getType() != II->getType())

              Res = Builder.CreateZExtOrTrunc(Res, II->getType());

            if (Arg != Vect &&

                cast<Instruction>(Arg)->getOpcode() == Instruction::SExt)

              Res = Builder.CreateNeg(Res);

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_xor: {

    if (IID == Intrinsic::vector_reduce_xor) {

      // Exclusive disjunction reduction over the vector with

      // (potentially-extended) i1 element type is actually a

      // (potentially-extended) arithmetic `add` reduction over the original

      // non-extended value:

      //   vector_reduce_xor(?ext(<n x i1>))

      //     -->

      //   ?ext(vector_reduce_add(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;

      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *FTy = dyn_cast<FixedVectorType>(Vect->getType()))

          if (FTy->getElementType() == Builder.getInt1Ty()) {

            Value *Res = Builder.CreateAddReduce(Vect);

            if (Arg != Vect)

              Res = Builder.CreateCast(cast<CastInst>(Arg)->getOpcode(), Res,

                                       II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_mul: {

    if (IID == Intrinsic::vector_reduce_mul) {

      // Multiplicative reduction over the vector with (potentially-extended)

      // i1 element type is actually a (potentially zero-extended)

      // logical `and` reduction over the original non-extended value:

      //   vector_reduce_mul(?ext(<n x i1>))

      //     -->

      //   zext(vector_reduce_and(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;

      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *FTy = dyn_cast<FixedVectorType>(Vect->getType()))

          if (FTy->getElementType() == Builder.getInt1Ty()) {

            Value *Res = Builder.CreateAndReduce(Vect);

            if (Res->getType() != II->getType())

              Res = Builder.CreateZExt(Res, II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_umin:

  case Intrinsic::vector_reduce_umax: {

    if (IID == Intrinsic::vector_reduce_umin ||

        IID == Intrinsic::vector_reduce_umax) {

      // UMin/UMax reduction over the vector with (potentially-extended)

      // i1 element type is actually a (potentially-extended)

      // logical `and`/`or` reduction over the original non-extended value:

      //   vector_reduce_u{min,max}(?ext(<n x i1>))

      //     -->

      //   ?ext(vector_reduce_{and,or}(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;

      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *FTy = dyn_cast<FixedVectorType>(Vect->getType()))

          if (FTy->getElementType() == Builder.getInt1Ty()) {

            Value *Res = IID == Intrinsic::vector_reduce_umin

                             ? Builder.CreateAndReduce(Vect)

                             : Builder.CreateOrReduce(Vect);

            if (Arg != Vect)

              Res = Builder.CreateCast(cast<CastInst>(Arg)->getOpcode(), Res,

                                       II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_smin:

  case Intrinsic::vector_reduce_smax: {

    if (IID == Intrinsic::vector_reduce_smin ||

        IID == Intrinsic::vector_reduce_smax) {

      // SMin/SMax reduction over the vector with (potentially-extended)

      // i1 element type is actually a (potentially-extended)

      // logical `and`/`or` reduction over the original non-extended value:

      //   vector_reduce_s{min,max}(<n x i1>)

      //     -->

      //   vector_reduce_{or,and}(<n x i1>)

      // and

      //   vector_reduce_s{min,max}(sext(<n x i1>))

      //     -->

      //   sext(vector_reduce_{or,and}(<n x i1>))

      // and

      //   vector_reduce_s{min,max}(zext(<n x i1>))

      //     -->

      //   zext(vector_reduce_{and,or}(<n x i1>))

      Value *Arg = II->getArgOperand(0);

      Value *Vect;

      if (match(Arg, m_ZExtOrSExtOrSelf(m_Value(Vect)))) {

        if (auto *FTy = dyn_cast<FixedVectorType>(Vect->getType()))

          if (FTy->getElementType() == Builder.getInt1Ty()) {

            Instruction::CastOps ExtOpc = Instruction::CastOps::CastOpsEnd;

            if (Arg != Vect)

              ExtOpc = cast<CastInst>(Arg)->getOpcode();

            Value *Res = ((IID == Intrinsic::vector_reduce_smin) ==

                          (ExtOpc == Instruction::CastOps::ZExt))

                             ? Builder.CreateAndReduce(Vect)

                             : Builder.CreateOrReduce(Vect);

            if (Arg != Vect)

              Res = Builder.CreateCast(ExtOpc, Res, II->getType());

            return replaceInstUsesWith(CI, Res);

          }

      }

    }

    [[fallthrough]];

  }

  case Intrinsic::vector_reduce_fmax:

  case Intrinsic::vector_reduce_fmin:

  case Intrinsic::vector_reduce_fadd:

  case Intrinsic::vector_reduce_fmul: {

    bool CanBeReassociated = (IID != Intrinsic::vector_reduce_fadd &&

                              IID != Intrinsic::vector_reduce_fmul) ||

                             II->hasAllowReassoc();

    const unsigned ArgIdx = (IID == Intrinsic::vector_reduce_fadd ||

                             IID == Intrinsic::vector_reduce_fmul)

                                ? 1

                                : 0;

    Value *Arg = II->getArgOperand(ArgIdx);

    Value *V;

    ArrayRef<int> Mask;

    if (!isa<FixedVectorType>(Arg->getType()) || !CanBeReassociated ||

        !match(Arg, m_Shuffle(m_Value(V), m_Undef(), m_Mask(Mask))) ||

        !cast<ShuffleVectorInst>(Arg)->isSingleSource())

      break;

    int Sz = Mask.size();

    SmallBitVector UsedIndices(Sz);

    for (int Idx : Mask) {

      if (Idx == PoisonMaskElem || UsedIndices.test(Idx))

        break;

      UsedIndices.set(Idx);

    }

    // Can remove shuffle iff just shuffled elements, no repeats, undefs, or

    // other changes.

    if (UsedIndices.all()) {

      replaceUse(II->getOperandUse(ArgIdx), V);

      return nullptr;

    }

    break;

  }

  case Intrinsic::is_fpclass: {

    if (Instruction *I = foldIntrinsicIsFPClass(*II))

      return I;

    break;

  }

  case Intrinsic::threadlocal_address: {

    Align MinAlign = getKnownAlignment(II->getArgOperand(0), DL, II, &AC, &DT);

    MaybeAlign Align = II->getRetAlign();

    if (MinAlign > Align.valueOrOne()) {

      II->addRetAttr(Attribute::getWithAlignment(II->getContext(), MinAlign));

      return II;

    }

    break;

  }

  default: {

    // Handle target specific intrinsics

    std::optional<Instruction *> V = targetInstCombineIntrinsic(*II);

    if (V)

      return *V;

    break;

  }

  }


  // Try to fold intrinsic into select operands. This is legal if:

  //  * The intrinsic is speculatable.

  //  * The select condition is not a vector, or the intrinsic does not

  //    perform cross-lane operations.

  switch (IID) {

  case Intrinsic::ctlz:

  case Intrinsic::cttz:

  case Intrinsic::ctpop:

  case Intrinsic::umin:

  case Intrinsic::umax:

  case Intrinsic::smin:

  case Intrinsic::smax:

  case Intrinsic::usub_sat:

  case Intrinsic::uadd_sat:

  case Intrinsic::ssub_sat:

  case Intrinsic::sadd_sat:

    for (Value *Op : II->args())

      if (auto *Sel = dyn_cast<SelectInst>(Op))

        if (Instruction *R = FoldOpIntoSelect(*II, Sel))

          return R;

    [[fallthrough]];

  default:

    break;

  }


  if (Instruction *Shuf = foldShuffledIntrinsicOperands(II, Builder))

    return Shuf;


  // Some intrinsics (like experimental_gc_statepoint) can be used in invoke

  // context, so it is handled in visitCallBase and we should trigger it.

  return visitCallBase(*II);

}


// Fence instruction simplification.
//
// FI is erased when a neighbouring fence (debug instructions are skipped)
// already provides at least the same guarantees:
//  * the next instruction is a fence identical to FI, or
//  * the next or previous instruction is a fence in the same scope, that
//    scope being the system-wide or the single-thread one, with an ordering
//    at least as strong as FI's.
// Returns the result of eraseInstFromFunction when FI was removed, otherwise
// nullptr.
Instruction *InstCombinerImpl::visitFenceInst(FenceInst &FI) {
  // Is Other an identical-or-stronger fence than FI? Only answered positively
  // when both fences share a scope and that scope is global or single-thread.
  auto makesThisFenceRedundant = [&FI](FenceInst *Other) {
    const auto Scope = Other->getSyncScopeID();
    const bool ScopesAgree = Scope == FI.getSyncScopeID();
    const bool KnownScope =
        Scope == SyncScope::System || Scope == SyncScope::SingleThread;
    return ScopesAgree && KnownScope &&
           isAtLeastOrStrongerThan(Other->getOrdering(), FI.getOrdering());
  };

  if (auto *Next = dyn_cast<FenceInst>(FI.getNextNonDebugInstruction())) {
    // The identity test is solely here to handle arbitrary target-dependent
    // syncscopes, which the scope-aware comparison refuses to reason about.
    // TODO: Can remove if does not matter in practice.
    if (FI.isIdenticalTo(Next) || makesThisFenceRedundant(Next))
      return eraseInstFromFunction(FI);
  }

  auto *Prev = dyn_cast_or_null<FenceInst>(FI.getPrevNonDebugInstruction());
  if (Prev && makesThisFenceRedundant(Prev))
    return eraseInstFromFunction(FI);

  return nullptr;
}


// InvokeInst simplification: an invoke gets no dedicated folds here; it is
// handed to the call-site logic shared by all CallBase kinds.
Instruction *InstCombinerImpl::visitInvokeInst(InvokeInst &II) {
  CallBase &Call = II;
  return visitCallBase(Call);
}


// CallBrInst simplification: a callbr gets no dedicated folds here; it is
// handed to the call-site logic shared by all CallBase kinds.
Instruction *InstCombinerImpl::visitCallBrInst(CallBrInst &CBI) {
  CallBase &Call = CBI;
  return visitCallBase(Call);
}


/// Try to simplify \p CI with LibCallSimplifier.
///
/// \returns nullptr when the call was left alone. When the simplifier
/// produced a replacement value, returns \p CI itself if it has no uses, or
/// otherwise whatever replaceInstUsesWith returns after redirecting the uses
/// of \p CI to the replacement.
Instruction *InstCombinerImpl::tryOptimizeCall(CallInst *CI) {
  // Without a statically known callee there is nothing to simplify.
  if (CI->getCalledFunction() == nullptr)
    return nullptr;

  // Skip optimizing notail and musttail calls so
  // LibCallSimplifier::optimizeCall doesn't have to preserve those invariants.
  // LibCallSimplifier::optimizeCall should try to preserve tail calls though.
  if (CI->isNoTailCall() || CI->isMustTailCall())
    return nullptr;

  // Callbacks that route the simplifier's replace/erase requests through this
  // combiner.
  // NOTE(review): kept as named locals in case LibCallSimplifier only stores
  // references to them — confirm before inlining them into the call.
  auto ReplaceUses = [this](Instruction *Old, Value *New) {
    replaceInstUsesWith(*Old, New);
  };
  auto EraseInst = [this](Instruction *Dead) { eraseInstFromFunction(*Dead); };

  LibCallSimplifier Simplifier(DL, &TLI, &AC, ORE, BFI, PSI, ReplaceUses,
                               EraseInst);
  Value *Replacement = Simplifier.optimizeCall(CI, Builder);
  if (!Replacement)
    return nullptr;

  ++NumSimplified;
  if (CI->use_empty())
    return CI;
  return replaceInstUsesWith(*CI, Replacement);
}


/// Look for the unique llvm.init.trampoline call that initialises
/// \p TrampMem, for the case where \p TrampMem is an alloca or a pointer cast
/// whose stripped operand is an alloca used only by that cast.
///
/// Every user of \p TrampMem must be an intrinsic call, and only
/// init.trampoline (exactly once) and adjust.trampoline (any number of times)
/// are tolerated. \returns the init.trampoline call, or nullptr if any of
/// these conditions fails or \p TrampMem is not its first operand.
static IntrinsicInst *findInitTrampolineFromAlloca(Value *TrampMem) {
  Value *Base = TrampMem->stripPointerCasts();
  if (!isa<AllocaInst>(Base))
    return nullptr;

  // When casts were stripped, TrampMem has to be the sole user of the alloca.
  // This is good enough in practice and simpler than handling arbitrary cast
  // chains.
  if (Base != TrampMem &&
      !(Base->hasOneUse() && Base->user_back() == TrampMem))
    return nullptr;

  IntrinsicInst *Init = nullptr;
  for (User *U : TrampMem->users()) {
    auto *Intr = dyn_cast<IntrinsicInst>(U);
    if (!Intr)
      return nullptr;

    switch (Intr->getIntrinsicID()) {
    case Intrinsic::adjust_trampoline:
      // Allow any number of calls to adjust.trampoline.
      break;
    case Intrinsic::init_trampoline:
      // More than one init_trampoline writes to this value.  Give up.
      if (Init)
        return nullptr;
      Init = Intr;
      break;
    default:
      // Any other intrinsic user defeats the analysis.
      return nullptr;
    }
  }

  // Either no init.trampoline was found, or the memory is not being used in
  // the expected way (as the trampoline storage operand).
  if (!Init || Init->getOperand(0) != TrampMem)
    return nullptr;

  return Init;
}


/// Walk backwards from \p AdjustTramp through its own basic block looking for
/// an llvm.init.trampoline call whose first operand is \p TrampMem.
///
/// The walk stops with nullptr at the first earlier instruction that may
/// write to memory and is not the wanted init.trampoline, or once the start
/// of the block has been examined without a match.
static IntrinsicInst *findInitTrampolineFromBB(IntrinsicInst *AdjustTramp,
                                               Value *TrampMem) {
  const BasicBlock::iterator BlockStart = AdjustTramp->getParent()->begin();
  BasicBlock::iterator Pos = AdjustTramp->getIterator();

  while (Pos != BlockStart) {
    --Pos;
    Instruction &Earlier = *Pos;

    // The match is tested before the memory-write check, so the
    // init.trampoline call itself is never what stops the walk.
    if (auto *Intr = dyn_cast<IntrinsicInst>(&Earlier)) {
      const bool IsWantedInit =
          Intr->getIntrinsicID() == Intrinsic::init_trampoline &&
          Intr->getOperand(0) == TrampMem;
      if (IsWantedInit)
        return Intr;
    }

    if (Earlier.mayWriteToMemory())
      return nullptr;
  }

  return nullptr;
}


// Given a callee that is (possibly behind pointer casts) a call to
// llvm.adjust.trampoline, find and return the corresponding call to
// llvm.init.trampoline if the call to the trampoline can be optimized to a
// direct call to a function.  Otherwise return NULL.
//
// The alloca-based search is tried first; the same-basic-block backwards scan
// is only the fallback.
static IntrinsicInst *findInitTrampoline(Value *Callee) {
  auto *AdjustTramp = dyn_cast<IntrinsicInst>(Callee->stripPointerCasts());
  if (!AdjustTramp)
    return nullptr;
  if (AdjustTramp->getIntrinsicID() != Intrinsic::adjust_trampoline)
    return nullptr;

  Value *TrampMem = AdjustTramp->getOperand(0);

  IntrinsicInst *Init = findInitTrampolineFromAlloca(TrampMem);
  if (!Init)
    Init = findInitTrampolineFromBB(AdjustTramp, TrampMem);
  return Init;
}


/// Attach return attributes to \p Call that follow from the size and
/// alignment reported for it by getAllocSize / getAllocAlignment.
///
/// Note: We only handle cases which can't be driven from generic attributes
/// here.  So, for example, nonnull and noalias (which are common properties
/// of some allocation functions) are expected to be handled via annotation
/// of the respective allocator declaration with generic attributes.
///
/// \returns true if the call did not previously carry the dereferenceable
/// (or dereferenceable_or_null) attribute kind that was added, or if its
/// return alignment was raised; false otherwise, including for calls that do
/// not return a pointer.
bool InstCombinerImpl::annotateAnyAllocSite(CallBase &Call,
                                            const TargetLibraryInfo *TLI) {
  if (!Call.getType()->isPointerTy())
    return false;

  bool Changed = false;
  LLVMContext &Ctx = Call.getContext();

  if (std::optional<APInt> Size = getAllocSize(&Call, TLI);
      Size && *Size != 0) {
    // TODO: We really should just emit deref_or_null here and then
    // let the generic inference code combine that with nonnull.
    const uint64_t Bytes = Size->getLimitedValue();
    const bool RetIsNonNull = Call.hasRetAttr(Attribute::NonNull);
    const Attribute::AttrKind Kind = RetIsNonNull
                                         ? Attribute::Dereferenceable
                                         : Attribute::DereferenceableOrNull;
    // Record the "changed" state before the attribute is (re)applied.
    Changed = !Call.hasRetAttr(Kind);
    Call.addRetAttr(
        RetIsNonNull
            ? Attribute::getWithDereferenceableBytes(Ctx, Bytes)
            : Attribute::getWithDereferenceableOrNullBytes(Ctx, Bytes));
  }

  // Add alignment attribute if alignment is a power of two constant below
  // the maximum supported alignment.
  auto *AlignC = dyn_cast_or_null<ConstantInt>(getAllocAlignment(&Call, TLI));
  if (!AlignC || !AlignC->getValue().ult(llvm::Value::MaximumAlignment))
    return Changed;

  const uint64_t Requested = AlignC->getZExtValue();
  if (!llvm::isPowerOf2_64(Requested))
    return Changed;

  // Only ever strengthen the alignment already present on the return value.
  const Align NewAlign(Requested);
  if (NewAlign > Call.getRetAlign().valueOrOne()) {
    Call.addRetAttr(Attribute::getWithAlignment(Ctx, NewAlign));
    Changed = true;
  }
  return Changed;
}


/// Improvements for call, callbr and invoke instructions.
///
/// Runs the call-site transforms shared by every CallBase kind, in this
/// order: allocation-site and nonnull-argument annotation, callee cast
/// removal, convergent-attribute and calling-convention checks, null/undef
/// callee handling, trampoline folding, nounwind marking of inline asm,
/// library call simplification, forwarding of a 'returned' argument, kcfi
/// bundle removal, removable-allocation handling and gc.statepoint cleanup.
///
/// Most transforms return as soon as they fire. If control reaches the end,
/// \p Call is returned when one of the in-place attribute updates happened
/// and nullptr otherwise.
Instruction *InstCombinerImpl::visitCallBase(CallBase &Call) {

  // Attach size/alignment-derived return attributes (see annotateAnyAllocSite).
  bool Changed = annotateAnyAllocSite(Call, &TLI);


  // Mark any parameters that are known to be non-null with the nonnull

  // attribute.  This is helpful for inlining calls to functions with null

  // checks on their arguments.

  SmallVector<unsigned, 4> ArgNos;

  unsigned ArgNo = 0;


  // Collect the indices of pointer arguments that are known non-zero at this
  // call but do not carry the nonnull attribute yet.
  for (Value *V : Call.args()) {

    if (V->getType()->isPointerTy() &&

        !Call.paramHasAttr(ArgNo, Attribute::NonNull) &&

        isKnownNonZero(V, getSimplifyQuery().getWithInstruction(&Call)))

      ArgNos.push_back(ArgNo);

    ArgNo++;

  }


  assert(ArgNo == Call.arg_size() && "Call arguments not processed correctly.");


  if (!ArgNos.empty()) {

    AttributeList AS = Call.getAttributes();

    LLVMContext &Ctx = Call.getContext();

    AS = AS.addParamAttribute(Ctx, ArgNos,

                              Attribute::get(Ctx, Attribute::NonNull));

    Call.setAttributes(AS);

    Changed = true;

  }


  // If the callee is a pointer to a function, attempt to move any casts to the

  // arguments of the call/callbr/invoke.

  Value *Callee = Call.getCalledOperand();

  Function *CalleeF = dyn_cast<Function>(Callee);

  if ((!CalleeF || CalleeF->getFunctionType() != Call.getFunctionType()) &&

      transformConstExprCastCall(Call))

    // NOTE(review): nullptr presumably means the helper already rewrote the
    // call itself — confirm against transformConstExprCastCall.
    return nullptr;


  if (CalleeF) {

    // Remove the convergent attr on calls when the callee is not convergent.

    if (Call.isConvergent() && !CalleeF->isConvergent() &&

        !CalleeF->isIntrinsic()) {

      LLVM_DEBUG(dbgs() << "Removing convergent attr from instr " << Call

                        << "\n");

      Call.setNotConvergent();

      return &Call;

    }


    // If the call and callee calling conventions don't match, and neither one

    // of the calling conventions is compatible with C calling convention

    // this call must be unreachable, as the call is undefined.

    if ((CalleeF->getCallingConv() != Call.getCallingConv() &&

         !(CalleeF->getCallingConv() == llvm::CallingConv::C &&

           TargetLibraryInfoImpl::isCallingConvCCompatible(&Call)) &&

         !(Call.getCallingConv() == llvm::CallingConv::C &&

           TargetLibraryInfoImpl::isCallingConvCCompatible(CalleeF))) &&

        // Only do this for calls to a function with a body.  A prototype may

        // not actually end up matching the implementation's calling conv for a

        // variety of reasons (e.g. it may be written in assembly).

        !CalleeF->isDeclaration()) {

      Instruction *OldCall = &Call;

      CreateNonTerminatorUnreachable(OldCall);

      // If OldCall does not return void then replaceInstUsesWith poison.

      // This allows ValueHandlers and custom metadata to adjust itself.

      if (!OldCall->getType()->isVoidTy())

        replaceInstUsesWith(*OldCall, PoisonValue::get(OldCall->getType()));

      if (isa<CallInst>(OldCall))

        return eraseInstFromFunction(*OldCall);


      // We cannot remove an invoke or a callbr, because it would change the

      // CFG, just change the callee to a null pointer.

      cast<CallBase>(OldCall)->setCalledFunction(

          CalleeF->getFunctionType(),

          Constant::getNullValue(CalleeF->getType()));

      return nullptr;

    }

  }


  // Calling a null function pointer is undefined if a null address isn't

  // dereferenceable.

  if ((isa<ConstantPointerNull>(Callee) &&

       !NullPointerIsDefined(Call.getFunction())) ||

      isa<UndefValue>(Callee)) {

    // If Call does not return void then replaceInstUsesWith poison.

    // This allows ValueHandlers and custom metadata to adjust itself.

    if (!Call.getType()->isVoidTy())

      replaceInstUsesWith(Call, PoisonValue::get(Call.getType()));


    if (Call.isTerminator()) {

      // Can't remove an invoke or callbr because we cannot change the CFG.

      return nullptr;

    }


    // This instruction is not reachable, just remove it.

    CreateNonTerminatorUnreachable(&Call);

    return eraseInstFromFunction(Call);

  }


  // A callee reached through adjust.trampoline with a matching
  // init.trampoline is handed to the dedicated trampoline transform.
  if (IntrinsicInst *II = findInitTrampoline(Callee))

    return transformCallThroughTrampoline(Call, *II);


  if (isa<InlineAsm>(Callee) && !Call.doesNotThrow()) {

    InlineAsm *IA = cast<InlineAsm>(Callee);

    if (!IA->canThrow()) {

      // Normal inline asm calls cannot throw - mark them

      // 'nounwind'.

      Call.setDoesNotThrow();

      Changed = true;

    }

  }


  // Try to optimize the call if possible, we require DataLayout for most of

  // this.  None of these calls are seen as possibly dead so go ahead and

  // delete the instruction now.

  if (CallInst *CI = dyn_cast<CallInst>(&Call)) {

    Instruction *I = tryOptimizeCall(CI);

    // If we changed something return the result, etc. Otherwise let

    // the fallthrough check.

    if (I) return eraseInstFromFunction(*I);

  }


  // Forward a 'returned' argument to the users of the call when its type can
  // be losslessly bitcast to the call's type (never for musttail calls).
  if (!Call.use_empty() && !Call.isMustTailCall())

    if (Value *ReturnedArg = Call.getReturnedArgOperand()) {

      Type *CallTy = Call.getType();

      Type *RetArgTy = ReturnedArg->getType();

      if (RetArgTy->canLosslesslyBitCastTo(CallTy))

        return replaceInstUsesWith(

            Call, Builder.CreateBitOrPointerCast(ReturnedArg, CallTy));

    }


  // Drop unnecessary kcfi operand bundles from calls that were converted

  // into direct calls.

  auto Bundle = Call.getOperandBundle(LLVMContext::OB_kcfi);

  if (Bundle && !Call.isIndirectCall()) {

    // Debug-only diagnostic: report when the type id in the bundle differs
    // from the one in the callee's kcfi_type metadata.
    DEBUG_WITH_TYPE(DEBUG_TYPE "-kcfi", {

      if (CalleeF) {

        ConstantInt *FunctionType = nullptr;

        ConstantInt *ExpectedType = cast<ConstantInt>(Bundle->Inputs[0]);


        if (MDNode *MD = CalleeF->getMetadata(LLVMContext::MD_kcfi_type))

          FunctionType = mdconst::extract<ConstantInt>(MD->getOperand(0));


        if (FunctionType &&

            FunctionType->getZExtValue() != ExpectedType->getZExtValue())

          dbgs() << Call.getModule()->getName()

                 << ": warning: kcfi: " << Call.getCaller()->getName()

                 << ": call to " << CalleeF->getName()

                 << " using a mismatching function pointer type\n";

      }

    });


    return CallBase::removeOperandBundle(&Call, LLVMContext::OB_kcfi);

  }


  if (isRemovableAlloc(&Call, &TLI))

    return visitAllocSite(Call);


  // Handle intrinsics which can be used in both call and invoke context.

  switch (Call.getIntrinsicID()) {

  case Intrinsic::experimental_gc_statepoint: {

    GCStatepointInst &GCSP = *cast<GCStatepointInst>(&Call);

    // Base and derived pointers still referenced by a surviving gc.relocate.
    SmallPtrSet<Value *, 32> LiveGcValues;

    for (const GCRelocateInst *Reloc : GCSP.getGCRelocates()) {

      GCRelocateInst &GCR = *const_cast<GCRelocateInst *>(Reloc);


      // Remove the relocation if unused.

      if (GCR.use_empty()) {

        eraseInstFromFunction(GCR);

        continue;

      }


      Value *DerivedPtr = GCR.getDerivedPtr();

      Value *BasePtr = GCR.getBasePtr();


      // Undef is undef, even after relocation.

      if (isa<UndefValue>(DerivedPtr) || isa<UndefValue>(BasePtr)) {

        replaceInstUsesWith(GCR, UndefValue::get(GCR.getType()));

        eraseInstFromFunction(GCR);

        continue;

      }


      if (auto *PT = dyn_cast<PointerType>(GCR.getType())) {

        // The relocation of null will be null for most any collector.

        // TODO: provide a hook for this in GCStrategy.  There might be some

        // weird collector this property does not hold for.

        if (isa<ConstantPointerNull>(DerivedPtr)) {

          // Use null-pointer of gc_relocate's type to replace it.

          replaceInstUsesWith(GCR, ConstantPointerNull::get(PT));

          eraseInstFromFunction(GCR);

          continue;

        }


        // isKnownNonNull -> nonnull attribute

        if (!GCR.hasRetAttr(Attribute::NonNull) &&

            isKnownNonZero(DerivedPtr,

                           getSimplifyQuery().getWithInstruction(&Call))) {

          GCR.addRetAttr(Attribute::NonNull);

          // We discovered new fact, re-check users.

          Worklist.pushUsersToWorkList(GCR);

        }

      }


      // If we have two copies of the same pointer in the statepoint argument

      // list, canonicalize to one.  This may let us common gc.relocates.

      if (GCR.getBasePtr() == GCR.getDerivedPtr() &&

          GCR.getBasePtrIndex() != GCR.getDerivedPtrIndex()) {

        auto *OpIntTy = GCR.getOperand(2)->getType();

        GCR.setOperand(2, ConstantInt::get(OpIntTy, GCR.getBasePtrIndex()));

      }


      // TODO: bitcast(relocate(p)) -> relocate(bitcast(p))

      // Canonicalize on the type from the uses to the defs


      // TODO: relocate((gep p, C, C2, ...)) -> gep(relocate(p), C, C2, ...)

      LiveGcValues.insert(BasePtr);

      LiveGcValues.insert(DerivedPtr);

    }

    std::optional<OperandBundleUse> Bundle =

        GCSP.getOperandBundle(LLVMContext::OB_gc_live);

    unsigned NumOfGCLives = LiveGcValues.size();

    // Nothing to shrink when there is no gc-live bundle or every input of it
    // is still needed.
    if (!Bundle || NumOfGCLives == Bundle->Inputs.size())

      break;

    // We can reduce the size of gc live bundle.

    DenseMap<Value *, unsigned> Val2Idx;

    std::vector<Value *> NewLiveGc;

    // Map each distinct bundle input to its slot in the compacted list;
    // inputs no remaining relocate refers to get the sentinel NumOfGCLives.
    for (Value *V : Bundle->Inputs) {

      if (Val2Idx.count(V))

        continue;

      if (LiveGcValues.count(V)) {

        Val2Idx[V] = NewLiveGc.size();

        NewLiveGc.push_back(V);

      } else

        Val2Idx[V] = NumOfGCLives;

    }

    // Update all gc.relocates

    for (const GCRelocateInst *Reloc : GCSP.getGCRelocates()) {

      GCRelocateInst &GCR = *const_cast<GCRelocateInst *>(Reloc);

      Value *BasePtr = GCR.getBasePtr();

      assert(Val2Idx.count(BasePtr) && Val2Idx[BasePtr] != NumOfGCLives &&

             "Missed live gc for base pointer");

      // Operand 1 receives the new base-pointer index, operand 2 the new
      // derived-pointer index.
      auto *OpIntTy1 = GCR.getOperand(1)->getType();

      GCR.setOperand(1, ConstantInt::get(OpIntTy1, Val2Idx[BasePtr]));

      Value *DerivedPtr = GCR.getDerivedPtr();

      assert(Val2Idx.count(DerivedPtr) && Val2Idx[DerivedPtr] != NumOfGCLives &&

             "Missed live gc for derived pointer");

      auto *OpIntTy2 = GCR.getOperand(2)->getType();

      GCR.setOperand(2, ConstantInt::get(OpIntTy2, Val2Idx[DerivedPtr]));

    }

    // Create new statepoint instruction.

    OperandBundleDef NewBundle("gc-live", NewLiveGc);

    return CallBase::Create(&Call, NewBundle);

  }

  default: { break; }

  }


  // Only in-place updates (if any) happened; report them to the caller.
  return Changed ? &Call : nullptr;

}


/// If the callee is a constexpr cast of a function, attempt to move the cast to
/// the arguments of the call/invoke.
/// CallBrInst is not supported.
///
/// The real callee is found by stripping pointer casts from the called
/// operand. The function first runs a series of legality checks (return type,
/// argument types, attributes, varargs-ness); every `return false` happens
/// before any instruction is created or modified. Once the checks pass, a new
/// direct call/invoke to the callee is built with casted arguments, the result
/// is cast back to the old return type if needed, and the original instruction
/// is erased.
///
/// \param Call the call or invoke to rewrite; asserted not to be a CallBrInst.
/// \returns true if \p Call was replaced by a new call/invoke and erased,
/// false if the transform was not applicable.
bool InstCombinerImpl::transformConstExprCastCall(CallBase &Call) {
  auto *Callee =
      dyn_cast<Function>(Call.getCalledOperand()->stripPointerCasts());
  if (!Callee)
    return false;

  assert(!isa<CallBrInst>(Call) &&
         "CallBr's don't have a single point after a def to insert at");

  // If this is a call to a thunk function, don't remove the cast. Thunks are
  // used to transparently forward all incoming parameters and outgoing return
  // values, so it's important to leave the cast in place.
  if (Callee->hasFnAttribute("thunk"))
    return false;

  // If this is a call to a naked function, the assembly might be
  // using an argument, or otherwise rely on the frame layout,
  // the function prototype will mismatch.
  if (Callee->hasFnAttribute(Attribute::Naked))
    return false;

  // If this is a musttail call, the callee's prototype must match the caller's
  // prototype with the exception of pointee types. The code below doesn't
  // implement that, so we can't do this transform.
  // TODO: Do the transform if it only requires adding pointer casts.
  if (Call.isMustTailCall())
    return false;

  Instruction *Caller = &Call;
  const AttributeList &CallerPAL = Call.getAttributes();

  // Okay, this is a cast from a function to a different type.  Unless doing so
  // would cause a type conversion of one of our arguments, change this call to
  // be a direct call with arguments casted to the appropriate types.
  FunctionType *FT = Callee->getFunctionType();
  Type *OldRetTy = Caller->getType();
  Type *NewRetTy = FT->getReturnType();

  // Check to see if we are changing the return type...
  if (OldRetTy != NewRetTy) {

    if (NewRetTy->isStructTy())
      return false; // TODO: Handle multiple return values.

    if (!CastInst::isBitOrNoopPointerCastable(NewRetTy, OldRetTy, DL)) {
      if (Callee->isDeclaration())
        return false;   // Cannot transform this return value.

      if (!Caller->use_empty() &&
          // A callee that returns void is handled specially: the remaining
          // uses of the old call are replaced with poison further below.
          !NewRetTy->isVoidTy())
        return false;   // Cannot transform this return value.
    }

    // Return attributes only matter when the result is used; unused results
    // simply get their incompatible attributes stripped later on.
    if (!CallerPAL.isEmpty() && !Caller->use_empty()) {
      AttrBuilder RAttrs(FT->getContext(), CallerPAL.getRetAttrs());
      if (RAttrs.overlaps(AttributeFuncs::typeIncompatible(NewRetTy)))
        return false;   // Attribute not compatible with transformed value.
    }

    // If the callbase is an invoke instruction, and the return value is
    // used by a PHI node in a successor, we cannot change the return type of
    // the call because there is no place to put the cast instruction (without
    // breaking the critical edge).  Bail out in this case.
    if (!Caller->use_empty()) {
      BasicBlock *PhisNotSupportedBlock = nullptr;
      if (auto *II = dyn_cast<InvokeInst>(Caller))
        PhisNotSupportedBlock = II->getNormalDest();
      if (PhisNotSupportedBlock)
        for (User *U : Caller->users())
          if (PHINode *PN = dyn_cast<PHINode>(U))
            if (PN->getParent() == PhisNotSupportedBlock)
              return false;
    }
  }

  // NumCommonArgs is the number of leading arguments that exist both at the
  // call site and in the callee's fixed parameter list.
  unsigned NumActualArgs = Call.arg_size();
  unsigned NumCommonArgs = std::min(FT->getNumParams(), NumActualArgs);

  // Prevent us turning:
  // declare void @takes_i32_inalloca(i32* inalloca)
  //  call void bitcast (void (i32*)* @takes_i32_inalloca to void (i32)*)(i32 0)
  //
  // into:
  //  call void @takes_i32_inalloca(i32* null)
  //
  //  The same bail-out applies to preallocated parameters. Mismatched byval
  //  arguments are rejected per argument in the loop below.
  if (Callee->getAttributes().hasAttrSomewhere(Attribute::InAlloca) ||
      Callee->getAttributes().hasAttrSomewhere(Attribute::Preallocated))
    return false;

  // Legality check for every argument that maps onto a fixed parameter.
  auto AI = Call.arg_begin();
  for (unsigned i = 0, e = NumCommonArgs; i != e; ++i, ++AI) {
    Type *ParamTy = FT->getParamType(i);
    Type *ActTy = (*AI)->getType();

    if (!CastInst::isBitOrNoopPointerCastable(ActTy, ParamTy, DL))
      return false;   // Cannot transform this parameter value.

    // Check if there are any incompatible attributes we cannot drop safely.
    if (AttrBuilder(FT->getContext(), CallerPAL.getParamAttrs(i))
            .overlaps(AttributeFuncs::typeIncompatible(
                ParamTy, AttributeFuncs::ASK_UNSAFE_TO_DROP)))
      return false;   // Attribute not compatible with transformed value.

    if (Call.isInAllocaArgument(i) ||
        CallerPAL.hasParamAttr(i, Attribute::Preallocated))
      return false; // Cannot transform to and from inalloca/preallocated.

    if (CallerPAL.hasParamAttr(i, Attribute::SwiftError))
      return false;

    // byval must be present on both the call site and the callee parameter,
    // or on neither.
    if (CallerPAL.hasParamAttr(i, Attribute::ByVal) !=
        Callee->getAttributes().hasParamAttr(i, Attribute::ByVal))
      return false; // Cannot transform to or from byval.
  }

  if (Callee->isDeclaration()) {
    // Do not delete arguments unless we have a function body.
    if (FT->getNumParams() < NumActualArgs && !FT->isVarArg())
      return false;

    // If the callee is just a declaration, don't change the varargsness of the
    // call.  We don't want to introduce a varargs call where one doesn't
    // already exist.
    if (FT->isVarArg() != Call.getFunctionType()->isVarArg())
      return false;

    // If both the callee and the cast type are varargs, we still have to make
    // sure the number of fixed parameters are the same or we have the same
    // ABI issues as if we introduce a varargs call.
    if (FT->isVarArg() && Call.getFunctionType()->isVarArg() &&
        FT->getNumParams() != Call.getFunctionType()->getNumParams())
      return false;
  }

  if (FT->getNumParams() < NumActualArgs && FT->isVarArg() &&
      !CallerPAL.isEmpty()) {
    // In this case we have more arguments than the new function type, but we
    // won't be dropping them.  Check that these extra arguments have attributes
    // that are compatible with being a vararg call argument.
    // Specifically: an sret argument must not end up in the variadic part.
    unsigned SRetIdx;
    if (CallerPAL.hasAttrSomewhere(Attribute::StructRet, &SRetIdx) &&
        SRetIdx - AttributeList::FirstArgIndex >= FT->getNumParams())
      return false;
  }

  // Okay, we decided that this is a safe thing to do: go ahead and start
  // inserting cast instructions as necessary.
  // NOTE: no `return false` may appear past this point, since the IR is
  // modified from here on.
  SmallVector<Value *, 8> Args;
  SmallVector<AttributeSet, 8> ArgAttrs;
  Args.reserve(NumActualArgs);
  ArgAttrs.reserve(NumActualArgs);

  // Get any return attributes.
  AttrBuilder RAttrs(FT->getContext(), CallerPAL.getRetAttrs());

  // If the return value is not being used, the type may not be compatible
  // with the existing attributes.  Wipe out any problematic attributes.
  RAttrs.remove(AttributeFuncs::typeIncompatible(NewRetTy));

  LLVMContext &Ctx = Call.getContext();
  AI = Call.arg_begin();
  for (unsigned i = 0; i != NumCommonArgs; ++i, ++AI) {
    Type *ParamTy = FT->getParamType(i);

    // Cast the actual argument to the parameter type if they differ.
    Value *NewArg = *AI;
    if ((*AI)->getType() != ParamTy)
      NewArg = Builder.CreateBitOrPointerCast(*AI, ParamTy);
    Args.push_back(NewArg);

    // Add any parameter attributes except the ones incompatible with the new
    // type. Note that we made sure all incompatible ones are safe to drop.
    AttributeMask IncompatibleAttrs = AttributeFuncs::typeIncompatible(
        ParamTy, AttributeFuncs::ASK_SAFE_TO_DROP);
    ArgAttrs.push_back(
        CallerPAL.getParamAttrs(i).removeAttributes(Ctx, IncompatibleAttrs));
  }

  // If the function takes more arguments than the call was taking, add them
  // now. The missing arguments are filled with null values of the parameter
  // type and carry no attributes.
  for (unsigned i = NumCommonArgs; i != FT->getNumParams(); ++i) {
    Args.push_back(Constant::getNullValue(FT->getParamType(i)));
    ArgAttrs.push_back(AttributeSet());
  }

  // The call passes more arguments than the callee has fixed parameters. For
  // a non-vararg callee the extra arguments are dropped (nothing is appended
  // to Args); for a vararg callee they are forwarded in promoted form.
  if (FT->getNumParams() < NumActualArgs) {
    // TODO: if (!FT->isVarArg()) this call may be unreachable. PR14722
    if (FT->isVarArg()) {
      // Add all of the arguments in their promoted form to the arg list.
      // AI already points at the first extra argument, because the loop above
      // advanced it past the NumCommonArgs fixed ones.
      for (unsigned i = FT->getNumParams(); i != NumActualArgs; ++i, ++AI) {
        Type *PTy = getPromotedType((*AI)->getType());
        Value *NewArg = *AI;
        if (PTy != (*AI)->getType()) {
          // Must promote to pass through va_arg area!
          Instruction::CastOps opcode =
            CastInst::getCastOpcode(*AI, false, PTy, false);
          NewArg = Builder.CreateCast(opcode, *AI, PTy);
        }
        Args.push_back(NewArg);

        // Add any parameter attributes.
        ArgAttrs.push_back(CallerPAL.getParamAttrs(i));
      }
    }
  }

  AttributeSet FnAttrs = CallerPAL.getFnAttrs();

  if (NewRetTy->isVoidTy())
    Caller->setName("");   // Void type should not have a name.

  assert((ArgAttrs.size() == FT->getNumParams() || FT->isVarArg()) &&
         "missing argument attributes");
  AttributeList NewCallerPAL = AttributeList::get(
      Ctx, FnAttrs, AttributeSet::get(Ctx, RAttrs), ArgAttrs);

  // Carry over the operand bundles of the original call site.
  SmallVector<OperandBundleDef, 1> OpBundles;
  Call.getOperandBundlesAsDefs(OpBundles);

  // Build the replacement: an invoke stays an invoke, anything else becomes a
  // plain call that keeps the original tail-call kind.
  CallBase *NewCall;
  if (InvokeInst *II = dyn_cast<InvokeInst>(Caller)) {
    NewCall = Builder.CreateInvoke(Callee, II->getNormalDest(),
                                   II->getUnwindDest(), Args, OpBundles);
  } else {
    NewCall = Builder.CreateCall(Callee, Args, OpBundles);
    cast<CallInst>(NewCall)->setTailCallKind(
        cast<CallInst>(Caller)->getTailCallKind());
  }
  NewCall->takeName(Caller);
  NewCall->setCallingConv(Call.getCallingConv());
  NewCall->setAttributes(NewCallerPAL);

  // Preserve prof metadata if any.
  NewCall->copyMetadata(*Caller, {LLVMContext::MD_prof});

  // Insert a cast of the return type as necessary.
  // NV is the value that replaces the old call's result; NC is the last
  // instruction created for it (the new call itself or the cast).
  Instruction *NC = NewCall;
  Value *NV = NC;
  if (OldRetTy != NV->getType() && !Caller->use_empty()) {
    if (!NV->getType()->isVoidTy()) {
      NV = NC = CastInst::CreateBitOrPointerCast(NC, OldRetTy);
      NC->setDebugLoc(Caller->getDebugLoc());

      // The cast has to be placed after the new call's definition point.
      auto OptInsertPt = NewCall->getInsertionPointAfterDef();
      assert(OptInsertPt && "No place to insert cast");
      InsertNewInstBefore(NC, *OptInsertPt);
      Worklist.pushUsersToWorkList(*Caller);
    } else {
      // The callee returns void but the old result is used: those uses get
      // poison.
      NV = PoisonValue::get(Caller->getType());
    }
  }

  if (!Caller->use_empty())
    replaceInstUsesWith(*Caller, NV);
  else if (Caller->hasValueHandle()) {
    if (OldRetTy == NV->getType())
      ValueHandleBase::ValueIsRAUWd(Caller, NV);
    else
      // We cannot call ValueIsRAUWd with a different type, and the
      // actual tracked value will disappear.
      ValueHandleBase::ValueIsDeleted(Caller);
  }

  eraseInstFromFunction(*Caller);
  return true;
}


/// Turn a call to a function created by init_trampoline / adjust_trampoline
/// intrinsic pair into a direct call to the underlying function.
///
/// \param Call  the call/invoke/callbr that goes through the trampoline.
/// \param Tramp the trampoline intrinsic; its argument operand 1 (with pointer
///              casts stripped) is the nested function and its argument
///              operand 2 is the chain value passed as the 'nest' argument.
///
/// \returns nullptr if \p Call already carries a 'nest' attribute. If the
/// nested function has no 'nest' parameter, \p Call is retargeted in place and
/// returned. Otherwise a new call/invoke/callbr with the chain argument
/// spliced in is returned; it is created without an insertion point, so
/// presumably the caller is responsible for placing it.
Instruction *
InstCombinerImpl::transformCallThroughTrampoline(CallBase &Call,
                                                 IntrinsicInst &Tramp) {
  FunctionType *FTy = Call.getFunctionType();
  AttributeList Attrs = Call.getAttributes();

  // If the call already has the 'nest' attribute somewhere then give up -
  // otherwise 'nest' would occur twice after splicing in the chain.
  if (Attrs.hasAttrSomewhere(Attribute::Nest))
    return nullptr;

  Function *NestF = cast<Function>(Tramp.getArgOperand(1)->stripPointerCasts());
  FunctionType *NestFTy = NestF->getFunctionType();

  // Look for a parameter of the nested function marked with the 'nest'
  // attribute. On success NestArgNo is its index, NestTy its type and
  // NestAttr its full attribute set.
  unsigned NestArgNo = 0;
  Type *NestTy = nullptr;
  AttributeSet NestAttr;
  AttributeList NestAttrs = NestF->getAttributes();
  if (!NestAttrs.isEmpty()) {
    for (FunctionType::param_iterator I = NestFTy->param_begin(),
                                      E = NestFTy->param_end();
         I != E; ++NestArgNo, ++I) {
      AttributeSet AS = NestAttrs.getParamAttrs(NestArgNo);
      if (AS.hasAttribute(Attribute::Nest)) {
        // Record the parameter type and any other attributes.
        NestTy = *I;
        NestAttr = AS;
        break;
      }
    }
  }

  if (!NestTy) {
    // Replace the trampoline call with a direct call.  Since there is no
    // 'nest' parameter, there is no need to adjust the argument list.  Let the
    // generic code sort out any function type mismatches.
    Call.setCalledFunction(FTy, NestF);
    return &Call;
  }

  // Both lists receive one extra entry for the chain argument.
  std::vector<Value *> NewArgs;
  std::vector<AttributeSet> NewArgAttrs;
  NewArgs.reserve(Call.arg_size() + 1);
  NewArgAttrs.reserve(Call.arg_size() + 1);

  // Insert the nest argument into the call argument list, which may
  // mean appending it.  Likewise for attributes.
  {
    unsigned ArgNo = 0;
    auto I = Call.arg_begin(), E = Call.arg_end();
    do {
      if (ArgNo == NestArgNo) {
        // Add the chain argument and attributes.
        Value *NestVal = Tramp.getArgOperand(2);
        if (NestVal->getType() != NestTy)
          NestVal = Builder.CreateBitCast(NestVal, NestTy, "nest");
        NewArgs.push_back(NestVal);
        NewArgAttrs.push_back(NestAttr);
      }

      // The end-of-range test sits after the insertion check so that a chain
      // argument positioned right after the last original one is appended.
      if (I == E)
        break;

      // Add the original argument and attributes.
      NewArgs.push_back(*I);
      NewArgAttrs.push_back(Attrs.getParamAttrs(ArgNo));

      ++ArgNo;
      ++I;
    } while (true);
  }

  // The trampoline may have been bitcast to a bogus type (FTy).
  // Handle this by synthesizing a new function type, equal to FTy
  // with the chain parameter inserted.
  std::vector<Type *> NewTypes;
  NewTypes.reserve(FTy->getNumParams() + 1);

  // Insert the chain's type into the list of parameter types, which may
  // mean appending it.
  {
    unsigned ArgNo = 0;
    FunctionType::param_iterator I = FTy->param_begin(),
                                 E = FTy->param_end();
    do {
      if (ArgNo == NestArgNo)
        // Add the chain's type.
        NewTypes.push_back(NestTy);

      if (I == E)
        break;

      // Add the original type.
      NewTypes.push_back(*I);

      ++ArgNo;
      ++I;
    } while (true);
  }

  // Replace the trampoline call with a direct call.  Let the generic
  // code sort out any function type mismatches.
  FunctionType *NewFTy =
      FunctionType::get(FTy->getReturnType(), NewTypes, FTy->isVarArg());
  AttributeList NewPAL =
      AttributeList::get(FTy->getContext(), Attrs.getFnAttrs(),
                         Attrs.getRetAttrs(), NewArgAttrs);

  SmallVector<OperandBundleDef, 1> OpBundles;
  Call.getOperandBundlesAsDefs(OpBundles);

  // Create the same kind of call site as the original one.
  CallBase *NewCaller;
  if (auto *II = dyn_cast<InvokeInst>(&Call)) {
    NewCaller = InvokeInst::Create(NewFTy, NestF, II->getNormalDest(),
                                   II->getUnwindDest(), NewArgs, OpBundles);
  } else if (auto *CBI = dyn_cast<CallBrInst>(&Call)) {
    NewCaller =
        CallBrInst::Create(NewFTy, NestF, CBI->getDefaultDest(),
                           CBI->getIndirectDests(), NewArgs, OpBundles);
  } else {
    CallInst *NewCI = CallInst::Create(NewFTy, NestF, NewArgs, OpBundles);
    // Only plain calls have a tail-call kind to carry over.
    NewCI->setTailCallKind(cast<CallInst>(Call).getTailCallKind());
    NewCaller = NewCI;
  }

  // Properties shared by every call-site kind.
  NewCaller->setCallingConv(Call.getCallingConv());
  NewCaller->setAttributes(NewPAL);
  NewCaller->setDebugLoc(Call.getDebugLoc());

  return NewCaller;
}

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition: AArch64SLSHardening.cpp:74

Intr
unsigned Intr
Definition: AMDGPUBaseInfo.cpp:2888

APFloat.h
This file declares a class to represent arbitrary precision floating point values and provide a varie...

APInt.h
This file implements a class to represent arbitrary precision integral constant values and operations...

APSInt.h
This file implements the APSInt class, which is a simple class that represents an arbitrary sized int...

IT
static cl::opt< ITMode > IT(cl::desc("IT block support"), cl::Hidden, cl::init(DefaultIT), cl::values(clEnumValN(DefaultIT, "arm-default-it", "Generate any type of IT block"), clEnumValN(RestrictedIT, "arm-restrict-it", "Disallow complex IT blocks")))

AliasAnalysis.h

ArrayRef.h

AssumeBundleBuilder.h

AssumeBundleQueries.h

AssumptionCache.h

AtomicOrdering.h
Atomic ordering constants.

AttributeMask.h

Attributes.h
This file contains the simple types necessary to represent the attributes associated with functions a...

BasicBlock.h

From
BlockVerifier::State From
Definition: BlockVerifier.cpp:57

B
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")

A
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")

D
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")

Casting.h

CommandLine.h

Compiler.h

Constant.h

Constants.h
This file contains the declarations for the subclasses of Constant, which represent the different fla...

foldBitOrderCrossLogicOp
static SDValue foldBitOrderCrossLogicOp(SDNode *N, SelectionDAG &DAG)
Definition: DAGCombiner.cpp:10251

DataLayout.h

RetTy
return RetTy
Definition: DeadArgumentElimination.cpp:362

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:354

Debug.h

LLVM_DEBUG
#define LLVM_DEBUG(X)
Definition: Debug.h:101

DEBUG_WITH_TYPE
#define DEBUG_WITH_TYPE(TYPE, X)
DEBUG_WITH_TYPE macro - This macro should be used by passes to emit debug information.
Definition: Debug.h:64

DerivedTypes.h

Size
uint64_t Size
Definition: ELFObjHandler.cpp:81

X
static GCMetadataPrinterRegistry::Add< ErlangGCPrinter > X("erlang", "erlang-compatible garbage collector")

Function.h

DEBUG_TYPE
#define DEBUG_TYPE
Definition: GenericCycleImpl.h:30

GlobalVariable.h

MI
IRTranslator LLVM IR MI
Definition: IRTranslator.cpp:113

Instruction.h

InlineAsm.h

getPromotedType
static Type * getPromotedType(Type *Ty)
Return the specified type promoted as it would be to pass through a va_arg area.
Definition: InstCombineCalls.cpp:94

createOverflowTuple
static Instruction * createOverflowTuple(IntrinsicInst *II, Value *Result, Constant *Overflow)
Creates a result tuple for an overflow intrinsic II with a given Result and a constant Overflow value...
Definition: InstCombineCalls.cpp:814

findInitTrampolineFromAlloca
static IntrinsicInst * findInitTrampolineFromAlloca(Value *TrampMem)
Definition: InstCombineCalls.cpp:3537

removeTriviallyEmptyRange
static bool removeTriviallyEmptyRange(IntrinsicInst &EndI, InstCombinerImpl &IC, std::function< bool(const IntrinsicInst &)> IsStart)
Definition: InstCombineCalls.cpp:766

inputDenormalIsDAZ
static bool inputDenormalIsDAZ(const Function &F, const Type *Ty)
Definition: InstCombineCalls.cpp:838

reassociateMinMaxWithConstantInOperand
static Instruction * reassociateMinMaxWithConstantInOperand(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
If this min/max has a matching min/max operand with a constant, try to push the constant operand into...
Definition: InstCombineCalls.cpp:1265

signBitMustBeTheSame
static bool signBitMustBeTheSame(Value *Op0, Value *Op1, Instruction *CxtI, const DataLayout &DL, AssumptionCache *AC, DominatorTree *DT)
Return true if two values Op0 and Op1 are known to have the same sign.
Definition: InstCombineCalls.cpp:1076

moveAddAfterMinMax
static Instruction * moveAddAfterMinMax(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
Try to canonicalize min/max(X + C0, C1) as min/max(X, C1 - C0) + C0.
Definition: InstCombineCalls.cpp:1090

simplifyInvariantGroupIntrinsic
static Instruction * simplifyInvariantGroupIntrinsic(IntrinsicInst &II, InstCombinerImpl &IC)
This function transforms launder.invariant.group and strip.invariant.group like: launder(launder(x)) ...
Definition: InstCombineCalls.cpp:451

haveSameOperands
static bool haveSameOperands(const IntrinsicInst &I, const IntrinsicInst &E, unsigned NumOperands)
Definition: InstCombineCalls.cpp:746

GuardWideningWindow
static cl::opt< unsigned > GuardWideningWindow("instcombine-guard-widening-window", cl::init(3), cl::desc("How wide an instruction window to bypass looking for " "another guard"))

hasUndefSource
static bool hasUndefSource(AnyMemTransferInst *MI)
Recognize a memcpy/memmove from a trivially otherwise unused alloca.
Definition: InstCombineCalls.cpp:105

foldShuffledIntrinsicOperands
static Instruction * foldShuffledIntrinsicOperands(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
If all arguments of the intrinsic are unary shuffles with the same mask, try to shuffle after the int...
Definition: InstCombineCalls.cpp:1352

factorizeMinMaxTree
static Instruction * factorizeMinMaxTree(IntrinsicInst *II)
Reduce a sequence of min/max intrinsics with a common operand.
Definition: InstCombineCalls.cpp:1293

simplifyNeonTbl1
static Value * simplifyNeonTbl1(const IntrinsicInst &II, InstCombiner::BuilderTy &Builder)
Convert a table lookup to shufflevector if the mask is constant.
Definition: InstCombineCalls.cpp:710

foldClampRangeOfTwo
static Instruction * foldClampRangeOfTwo(IntrinsicInst *II, InstCombiner::BuilderTy &Builder)
If we have a clamp pattern like max (min X, 42), 41 – where the output can only be one of two possibl...
Definition: InstCombineCalls.cpp:1191

findInitTrampolineFromBB
static IntrinsicInst * findInitTrampolineFromBB(IntrinsicInst *AdjustTramp, Value *TrampMem)
Definition: InstCombineCalls.cpp:3576

getKnownSignOrZero
static std::optional< bool > getKnownSignOrZero(Value *Op, Instruction *CxtI, const DataLayout &DL, AssumptionCache *AC, DominatorTree *DT)
Definition: InstCombineCalls.cpp:1061

foldCtpop
static Instruction * foldCtpop(IntrinsicInst &II, InstCombinerImpl &IC)
Definition: InstCombineCalls.cpp:629

foldCttzCtlz
static Instruction * foldCttzCtlz(IntrinsicInst &II, InstCombinerImpl &IC)
Definition: InstCombineCalls.cpp:481

findInitTrampoline
static IntrinsicInst * findInitTrampoline(Value *Callee)
Definition: InstCombineCalls.cpp:3597

fpclassTestIsFCmp0
static FCmpInst::Predicate fpclassTestIsFCmp0(FPClassTest Mask, const Function &F, Type *Ty)
Definition: InstCombineCalls.cpp:846

reassociateMinMaxWithConstants
static Value * reassociateMinMaxWithConstants(IntrinsicInst *II, IRBuilderBase &Builder, const SimplifyQuery &SQ)
If this min/max has a constant operand and an operand that is a matching min/max with a constant oper...
Definition: InstCombineCalls.cpp:1231

getKnownSign
static std::optional< bool > getKnownSign(Value *Op, Instruction *CxtI, const DataLayout &DL, AssumptionCache *AC, DominatorTree *DT)
Definition: InstCombineCalls.cpp:1044

canonicalizeConstantArg0ToArg1
static CallInst * canonicalizeConstantArg0ToArg1(CallInst &Call)
Definition: InstCombineCalls.cpp:801

InstCombineInternal.h
This file provides internal interfaces used to implement the InstCombine.

InstCombiner.h
This file provides the interface for the instcombine pass implementation.

InstrTypes.h

InstructionSimplify.h

InstructionWorklist.h

Instructions.h

IntrinsicInst.h

Intrinsics.h

KnownBits.h

LLVMContext.h

Loads.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

MathExtras.h

MemoryBuiltins.h

Metadata.h
This file contains the declarations for metadata subclasses.

Y
static GCMetadataPrinterRegistry::Add< OcamlGCMetadataPrinter > Y("ocaml", "ocaml 3.10-compatible collector")

PatternMatch.h

Cond
const SmallVectorImpl< MachineOperand > & Cond
Definition: RISCVRedundantCopyElimination.cpp:75

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

STLFunctionalExtras.h

SimplifyLibCalls.h

SmallBitVector.h
This file implements the SmallBitVector class.

SmallVector.h
This file defines the SmallVector class.

Statepoint.h

Statistic.h
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...

STATISTIC
#define STATISTIC(VARNAME, DESC)
Definition: Statistic.h:167

Struct
@ Struct
Definition: TargetLibraryInfo.cpp:77

Local.h

Type.h

User.h

getOpcode
static std::optional< unsigned > getOpcode(ArrayRef< VPValue * > Values)
Returns the opcode of Values or ~0 if they do not all agree.
Definition: VPlanSLP.cpp:191

ValueHandle.h

inputDenormalIsIEEE
static bool inputDenormalIsIEEE(const Function &F, const Type *Ty)
Return true if it's possible to assume IEEE treatment of input denormals in F for Val.
Definition: ValueTracking.cpp:4001

ValueTracking.h

Value.h

VectorUtils.h

RHS
Value * RHS
Definition: X86PartialReduction.cpp:76

LHS
Value * LHS
Definition: X86PartialReduction.cpp:75

FunctionType
Definition: ItaniumDemangle.h:799

VectorType
Definition: ItaniumDemangle.h:1149

llvm::AAResults::getModRefInfoMask
ModRefInfo getModRefInfoMask(const MemoryLocation &Loc, bool IgnoreLocals=false)
Returns a bitmask that should be unconditionally applied to the ModRef info of a memory location.
Definition: AliasAnalysis.cpp:149

llvm::APFloat
Definition: APFloat.h:780

llvm::APFloat::isNegative
bool isNegative() const
Definition: APFloat.h:1295

llvm::APFloat::clearSign
void clearSign()
Definition: APFloat.h:1159

llvm::APInt
Class for arbitrary precision integers.
Definition: APInt.h:76

llvm::APInt::getAllOnes
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
Definition: APInt.h:212

llvm::APInt::getSignMask
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
Definition: APInt.h:207

llvm::APInt::usub_ov
APInt usub_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1918

llvm::APInt::isZero
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
Definition: APInt.h:358

llvm::APInt::getBitWidth
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition: APInt.h:1439

llvm::APInt::ult
bool ult(const APInt &RHS) const
Unsigned less than comparison.
Definition: APInt.h:1089

llvm::APInt::sadd_ov
APInt sadd_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1898

llvm::APInt::uadd_ov
APInt uadd_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1905

llvm::APInt::getSignedMinValue
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
Definition: APInt.h:197

llvm::APInt::uadd_sat
APInt uadd_sat(const APInt &RHS) const
Definition: APInt.cpp:2006

llvm::APInt::isNonNegative
bool isNonNegative() const
Determine if this APInt Value is non-negative (>= 0)
Definition: APInt.h:312

llvm::APInt::getLowBitsSet
static APInt getLowBitsSet(unsigned numBits, unsigned loBitsSet)
Constructs an APInt value that has the bottom loBitsSet bits set.
Definition: APInt.h:284

llvm::APInt::ssub_ov
APInt ssub_ov(const APInt &RHS, bool &Overflow) const
Definition: APInt.cpp:1911

llvm::APSInt::getMinValue
static APSInt getMinValue(uint32_t numBits, bool Unsigned)
Return the APSInt representing the minimum integer value with the given bit width and signedness.
Definition: APSInt.h:311

llvm::APSInt::getMaxValue
static APSInt getMaxValue(uint32_t numBits, bool Unsigned)
Return the APSInt representing the maximum integer value with the given bit width and signedness.
Definition: APSInt.h:303

llvm::AnyMemSetInst
This class represents any memset intrinsic.
Definition: IntrinsicInst.h:1312

llvm::AnyMemTransferInst
Definition: IntrinsicInst.h:1332

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::AssumptionCache
A cache of @llvm.assume calls within a function.
Definition: AssumptionCache.h:42

llvm::AssumptionCache::registerAssumption
void registerAssumption(AssumeInst *CI)
Add an @llvm.assume intrinsic to this function's cache.
Definition: AssumptionCache.cpp:187

llvm::AssumptionCache::updateAffectedValues
void updateAffectedValues(AssumeInst *CI)
Update the cache of values being affected by this assumption (i.e.
Definition: AssumptionCache.cpp:99

llvm::AttrBuilder
Definition: Attributes.h:1016

llvm::AttrBuilder::overlaps
bool overlaps(const AttributeMask &AM) const
Return true if the builder has any attribute that's in the specified builder.
Definition: Attributes.cpp:1975

llvm::AttributeList
Definition: Attributes.h:451

llvm::AttributeList::getFnAttrs
AttributeSet getFnAttrs() const
The function attributes are returned.
Definition: Attributes.cpp:1560

llvm::AttributeList::get
static AttributeList get(LLVMContext &C, ArrayRef< std::pair< unsigned, Attribute > > Attrs)
Create an AttributeList with the specified parameters in it.
Definition: Attributes.cpp:1223

llvm::AttributeList::isEmpty
bool isEmpty() const
Return true if there are no attributes.
Definition: Attributes.h:977

llvm::AttributeList::getRetAttrs
AttributeSet getRetAttrs() const
The attributes for the ret value are returned.
Definition: Attributes.cpp:1556

llvm::AttributeList::hasFnAttr
bool hasFnAttr(Attribute::AttrKind Kind) const
Return true if the attribute exists for the function.
Definition: Attributes.cpp:1577

llvm::AttributeList::hasAttrSomewhere
bool hasAttrSomewhere(Attribute::AttrKind Kind, unsigned *Index=nullptr) const
Return true if the specified attribute is set for at least one parameter or for the return value.
Definition: Attributes.cpp:1585

llvm::AttributeList::hasParamAttr
bool hasParamAttr(unsigned ArgNo, Attribute::AttrKind Kind) const
Return true if the attribute exists for the given argument.
Definition: Attributes.h:788

llvm::AttributeList::getParamAttrs
AttributeSet getParamAttrs(unsigned ArgNo) const
The attributes for the argument or parameter at the given index are returned.
Definition: Attributes.cpp:1552

llvm::AttributeList::addParamAttribute
AttributeList addParamAttribute(LLVMContext &C, unsigned ArgNo, Attribute::AttrKind Kind) const
Add an argument attribute to the list.
Definition: Attributes.h:589

llvm::AttributeList::FirstArgIndex
@ FirstArgIndex
Definition: Attributes.h:456

llvm::AttributeMask
Definition: AttributeMask.h:29

llvm::AttributeSet
Definition: Attributes.h:313

llvm::AttributeSet::hasAttribute
bool hasAttribute(Attribute::AttrKind Kind) const
Return true if the attribute exists in this set.
Definition: Attributes.cpp:841

llvm::AttributeSet::removeAttributes
AttributeSet removeAttributes(LLVMContext &C, const AttributeMask &AttrsToRemove) const
Remove the specified attributes from this set.
Definition: Attributes.cpp:826

llvm::AttributeSet::get
static AttributeSet get(LLVMContext &C, const AttrBuilder &B)
Definition: Attributes.cpp:774

llvm::Attribute::get
static Attribute get(LLVMContext &Context, AttrKind Kind, uint64_t Val=0)
Return a uniquified Attribute object.
Definition: Attributes.cpp:93

llvm::Attribute::getWithDereferenceableBytes
static Attribute getWithDereferenceableBytes(LLVMContext &Context, uint64_t Bytes)
Definition: Attributes.cpp:204

llvm::Attribute::getWithDereferenceableOrNullBytes
static Attribute getWithDereferenceableOrNullBytes(LLVMContext &Context, uint64_t Bytes)
Definition: Attributes.cpp:210

llvm::Attribute::getWithAlignment
static Attribute getWithAlignment(LLVMContext &Context, Align Alignment)
Return a uniquified Attribute object that has the specific alignment set.
Definition: Attributes.cpp:194

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:60

llvm::BasicBlock::begin
iterator begin()
Instruction iterator methods.
Definition: BasicBlock.h:430

llvm::BasicBlock::reverse_iterator
InstListType::reverse_iterator reverse_iterator
Definition: BasicBlock.h:167

llvm::BasicBlock::rend
reverse_iterator rend()
Definition: BasicBlock.h:448

llvm::BasicBlock::iterator
InstListType::iterator iterator
Instruction iterators...
Definition: BasicBlock.h:165

llvm::BasicBlock::getTerminator
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction if the block is well formed or null if the block is not well forme...
Definition: BasicBlock.h:221

llvm::BinaryOpIntrinsic::getRHS
Value * getRHS() const
Definition: IntrinsicInst.h:862

llvm::BinaryOpIntrinsic::isSigned
bool isSigned() const
Whether the intrinsic is signed or unsigned.
Definition: IntrinsicInst.cpp:846

llvm::BinaryOpIntrinsic::getBinaryOp
Instruction::BinaryOps getBinaryOp() const
Returns the binary operation underlying the intrinsic.
Definition: IntrinsicInst.cpp:826

llvm::BinaryOpIntrinsic::getLHS
Value * getLHS() const
Definition: IntrinsicInst.h:861

llvm::BinaryOperator
Definition: InstrTypes.h:222

llvm::BinaryOperator::Create
static BinaryOperator * Create(BinaryOps Op, Value *S1, Value *S2, const Twine &Name, BasicBlock::iterator InsertBefore)
Construct a binary instruction, given the opcode and the two operands.
Definition: Instructions.cpp:3318

llvm::BinaryOperator::CreateNSWNeg
static BinaryOperator * CreateNSWNeg(Value *Op, const Twine &Name, BasicBlock::iterator InsertBefore)

llvm::BinaryOperator::CreateNSW
static BinaryOperator * CreateNSW(BinaryOps Opc, Value *V1, Value *V2, const Twine &Name="")
Definition: InstrTypes.h:367

llvm::BinaryOperator::CreateNeg
static BinaryOperator * CreateNeg(Value *Op, const Twine &Name, BasicBlock::iterator InsertBefore)
Helper functions to construct and inspect unary operations (NEG and NOT) via binary operators SUB and...
Definition: Instructions.cpp:3342

llvm::BinaryOperator::CreateNUW
static BinaryOperator * CreateNUW(BinaryOps Opc, Value *V1, Value *V2, const Twine &Name="")
Definition: InstrTypes.h:392

llvm::BinaryOperator::CreateFMulFMF
static BinaryOperator * CreateFMulFMF(Value *V1, Value *V2, FastMathFlags FMF, const Twine &Name="")
Definition: InstrTypes.h:332

llvm::BinaryOperator::CreateNot
static BinaryOperator * CreateNot(Value *Op, const Twine &Name, BasicBlock::iterator InsertBefore)
Definition: Instructions.cpp:3369

llvm::BinaryOperator::CreateFDivFMF
static BinaryOperator * CreateFDivFMF(Value *V1, Value *V2, FastMathFlags FMF, const Twine &Name="")
Definition: InstrTypes.h:336

llvm::BinaryOperator::CreateWithCopiedFlags
static BinaryOperator * CreateWithCopiedFlags(BinaryOps Opc, Value *V1, Value *V2, Value *CopyO, const Twine &Name, BasicBlock::iterator InsertBefore)
Definition: InstrTypes.h:299

llvm::CallBase
Base class for all callable instructions (InvokeInst and CallInst). Holds everything related to callin...
Definition: InstrTypes.h:1494

llvm::CallBase::setCallingConv
void setCallingConv(CallingConv::ID CC)
Definition: InstrTypes.h:1804

llvm::CallBase::bundle_op_info_begin
bundle_op_iterator bundle_op_info_begin()
Return the start of the list of BundleOpInfo instances associated with this OperandBundleUser.
Definition: InstrTypes.h:2572

llvm::CallBase::setDoesNotThrow
void setDoesNotThrow()
Definition: InstrTypes.h:2284

llvm::CallBase::addRangeRetAttr
void addRangeRetAttr(const ConstantRange &CR)
Adds the range attribute to the list of attributes.
Definition: InstrTypes.h:1945

llvm::CallBase::getRetAlign
MaybeAlign getRetAlign() const
Extract the alignment of the return value.
Definition: InstrTypes.h:2106

llvm::CallBase::getOperandBundlesAsDefs
void getOperandBundlesAsDefs(SmallVectorImpl< OperandBundleDef > &Defs) const
Return the list of operand bundles attached to this instruction as a vector of OperandBundleDefs.
Definition: Instructions.cpp:504

llvm::CallBase::getOperandBundleAt
OperandBundleUse getOperandBundleAt(unsigned Index) const
Return the operand bundle at a specific index.
Definition: InstrTypes.h:2380

llvm::CallBase::getOperandBundle
std::optional< OperandBundleUse > getOperandBundle(StringRef Name) const
Return an operand bundle by name, if present.
Definition: InstrTypes.h:2411

llvm::CallBase::getCalledFunction
Function * getCalledFunction() const
Returns the function called, or null if this is an indirect function invocation or the function signa...
Definition: InstrTypes.h:1742

llvm::CallBase::hasRetAttr
bool hasRetAttr(Attribute::AttrKind Kind) const
Determine whether the return value has the given attribute.
Definition: InstrTypes.h:1950

llvm::CallBase::getNumOperandBundles
unsigned getNumOperandBundles() const
Return the number of operand bundles associated with this User.
Definition: InstrTypes.h:2324

llvm::CallBase::getCallingConv
CallingConv::ID getCallingConv() const
Definition: InstrTypes.h:1800

llvm::CallBase::Create
static CallBase * Create(CallBase *CB, ArrayRef< OperandBundleDef > Bundles, BasicBlock::iterator InsertPt)
Create a clone of CB with a different set of operand bundles and insert it before InsertPt.
Definition: Instructions.cpp:307

llvm::CallBase::removeOperandBundle
static CallBase * removeOperandBundle(CallBase *CB, uint32_t ID, Instruction *InsertPt=nullptr)
Create a clone of CB with operand bundle ID removed.
Definition: Instructions.cpp:624

llvm::CallBase::getCalledOperand
Value * getCalledOperand() const
Definition: InstrTypes.h:1735

llvm::CallBase::setAttributes
void setAttributes(AttributeList A)
Set the parameter attributes for this call.
Definition: InstrTypes.h:1823

llvm::CallBase::doesNotThrow
bool doesNotThrow() const
Determine if the call cannot unwind.
Definition: InstrTypes.h:2283

llvm::CallBase::addRetAttr
void addRetAttr(Attribute::AttrKind Kind)
Adds the attribute to the return value.
Definition: InstrTypes.h:1861

llvm::CallBase::getArgOperand
Value * getArgOperand(unsigned i) const
Definition: InstrTypes.h:1687

llvm::CallBase::setArgOperand
void setArgOperand(unsigned i, Value *v)
Definition: InstrTypes.h:1692

llvm::CallBase::getFunctionType
FunctionType * getFunctionType() const
Definition: InstrTypes.h:1600

llvm::CallBase::getIntrinsicID
Intrinsic::ID getIntrinsicID() const
Returns the intrinsic ID of the intrinsic called or Intrinsic::not_intrinsic if the called function i...
Definition: Instructions.cpp:377

llvm::CallBase::args
iterator_range< User::op_iterator > args()
Iteration adapter for range-for loops.
Definition: InstrTypes.h:1678

llvm::CallBase::arg_size
unsigned arg_size() const
Definition: InstrTypes.h:1685

llvm::CallBase::hasOperandBundles
bool hasOperandBundles() const
Return true if this User has any operand bundles.
Definition: InstrTypes.h:2329

llvm::CallBase::setCalledFunction
void setCalledFunction(Function *Fn)
Sets the function called, including updating the function type.
Definition: InstrTypes.h:1781

llvm::CallBrInst
CallBr instruction, tracking function calls that may not return control but instead transfer it to a ...
Definition: Instructions.h:4431

llvm::CallBrInst::Create
static CallBrInst * Create(FunctionType *Ty, Value *Func, BasicBlock *DefaultDest, ArrayRef< BasicBlock * > IndirectDests, ArrayRef< Value * > Args, const Twine &NameStr, BasicBlock::iterator InsertBefore)
Definition: Instructions.h:4478

llvm::CallInst
This class represents a function call, abstracting a target machine's calling convention.
Definition: Instructions.h:1565

llvm::CallInst::isNoTailCall
bool isNoTailCall() const
Definition: Instructions.h:1787

llvm::CallInst::Create
static CallInst * Create(FunctionType *Ty, Value *F, const Twine &NameStr, BasicBlock::iterator InsertBefore)
Definition: Instructions.h:1620

llvm::CallInst::setTailCallKind
void setTailCallKind(TailCallKind TCK)
Definition: Instructions.h:1789

llvm::CallInst::isMustTailCall
bool isMustTailCall() const
Definition: Instructions.h:1785

llvm::CastInst::getCastOpcode
static Instruction::CastOps getCastOpcode(const Value *Val, bool SrcIsSigned, Type *Ty, bool DstIsSigned)
Returns the opcode necessary to cast Val into Ty using usual casting rules.
Definition: Instructions.cpp:4085

llvm::CastInst::Create
static CastInst * Create(Instruction::CastOps, Value *S, Type *Ty, const Twine &Name, BasicBlock::iterator InsertBefore)
Provides a way to construct any of the CastInst subclasses using an opcode instead of the subclass's ...
Definition: Instructions.cpp:3695

llvm::CastInst::isBitOrNoopPointerCastable
static bool isBitOrNoopPointerCastable(Type *SrcTy, Type *DestTy, const DataLayout &DL)
Check whether a bitcast, inttoptr, or ptrtoint cast between these types is valid and a no-op.
Definition: Instructions.cpp:4063

llvm::CastInst::CreateBitOrPointerCast
static CastInst * CreateBitOrPointerCast(Value *S, Type *Ty, const Twine &Name, BasicBlock::iterator InsertBefore)
Create a BitCast, a PtrToInt, or an IntToPtr cast instruction.
Definition: Instructions.cpp:3920

llvm::CastInst::CreateIntegerCast
static CastInst * CreateIntegerCast(Value *S, Type *Ty, bool isSigned, const Twine &Name, BasicBlock::iterator InsertBefore)
Create a ZExt, BitCast, or Trunc for int -> int casts.
Definition: Instructions.cpp:3942

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition: InstrTypes.h:993

llvm::CmpInst::FCMP_OEQ
@ FCMP_OEQ
0 0 0 1 True if ordered and equal
Definition: InstrTypes.h:996

llvm::CmpInst::BAD_ICMP_PREDICATE
@ BAD_ICMP_PREDICATE
Definition: InstrTypes.h:1026

llvm::CmpInst::ICMP_SLT
@ ICMP_SLT
signed less than
Definition: InstrTypes.h:1022

llvm::CmpInst::ICMP_SLE
@ ICMP_SLE
signed less or equal
Definition: InstrTypes.h:1023

llvm::CmpInst::FCMP_OLT
@ FCMP_OLT
0 1 0 0 True if ordered and less than
Definition: InstrTypes.h:999

llvm::CmpInst::FCMP_OGT
@ FCMP_OGT
0 0 1 0 True if ordered and greater than
Definition: InstrTypes.h:997

llvm::CmpInst::FCMP_OGE
@ FCMP_OGE
0 0 1 1 True if ordered and greater than or equal
Definition: InstrTypes.h:998

llvm::CmpInst::ICMP_UGT
@ ICMP_UGT
unsigned greater than
Definition: InstrTypes.h:1016

llvm::CmpInst::ICMP_SGT
@ ICMP_SGT
signed greater than
Definition: InstrTypes.h:1020

llvm::CmpInst::FCMP_ONE
@ FCMP_ONE
0 1 1 0 True if ordered and operands are unequal
Definition: InstrTypes.h:1001

llvm::CmpInst::FCMP_UEQ
@ FCMP_UEQ
1 0 0 1 True if unordered or equal
Definition: InstrTypes.h:1004

llvm::CmpInst::ICMP_ULT
@ ICMP_ULT
unsigned less than
Definition: InstrTypes.h:1018

llvm::CmpInst::FCMP_OLE
@ FCMP_OLE
0 1 0 1 True if ordered and less than or equal
Definition: InstrTypes.h:1000

llvm::CmpInst::ICMP_EQ
@ ICMP_EQ
equal
Definition: InstrTypes.h:1014

llvm::CmpInst::ICMP_NE
@ ICMP_NE
not equal
Definition: InstrTypes.h:1015

llvm::CmpInst::FCMP_UNE
@ FCMP_UNE
1 1 1 0 True if unordered or not equal
Definition: InstrTypes.h:1009

llvm::CmpInst::BAD_FCMP_PREDICATE
@ BAD_FCMP_PREDICATE
Definition: InstrTypes.h:1013

llvm::CmpInst::getSwappedPredicate
Predicate getSwappedPredicate() const
For example, EQ->EQ, SLE->SGE, ULT->UGT, OEQ->OEQ, ULE->UGE, OLT->OGT, etc.
Definition: InstrTypes.h:1167

llvm::CmpInst::getNonStrictPredicate
Predicate getNonStrictPredicate() const
For example, SGT -> SGE, SLT -> SLE, ULT -> ULE, UGT -> UGE.
Definition: InstrTypes.h:1211

llvm::CmpInst::getUnorderedPredicate
Predicate getUnorderedPredicate() const
Definition: InstrTypes.h:1151

llvm::ConstantAggregateZero::get
static ConstantAggregateZero * get(Type *Ty)
Definition: Constants.cpp:1663

llvm::ConstantExpr::getSub
static Constant * getSub(Constant *C1, Constant *C2, bool HasNUW=false, bool HasNSW=false)
Definition: Constants.cpp:2542

llvm::ConstantExpr::getNeg
static Constant * getNeg(Constant *C, bool HasNSW=false)
Definition: Constants.cpp:2523

llvm::ConstantFP::getInfinity
static Constant * getInfinity(Type *Ty, bool Negative=false)
Definition: Constants.cpp:1083

llvm::ConstantFP::getZero
static Constant * getZero(Type *Ty, bool Negative=false)
Definition: Constants.cpp:1037

llvm::ConstantInt
This is the shared class of boolean and integer constants.
Definition: Constants.h:80

llvm::ConstantInt::getLimitedValue
uint64_t getLimitedValue(uint64_t Limit=~0ULL) const
getLimitedValue - If the value is smaller than the specified limit, return it, otherwise return the l...
Definition: Constants.h:255

llvm::ConstantInt::getTrue
static ConstantInt * getTrue(LLVMContext &Context)
Definition: Constants.cpp:849

llvm::ConstantInt::getZExtValue
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
Definition: Constants.h:154

llvm::ConstantInt::getValue
const APInt & getValue() const
Return the constant as an APInt value reference.
Definition: Constants.h:145

llvm::ConstantInt::getBool
static ConstantInt * getBool(LLVMContext &Context, bool V)
Definition: Constants.cpp:863

llvm::ConstantPointerNull::get
static ConstantPointerNull * get(PointerType *T)
Static factory methods - Return objects of the specified value.
Definition: Constants.cpp:1775

llvm::ConstantRange
This class represents a range of values.
Definition: ConstantRange.h:47

llvm::ConstantRange::isFullSet
bool isFullSet() const
Return true if this set contains all of the elements possible for this data-type.
Definition: ConstantRange.cpp:367

llvm::ConstantRange::icmp
bool icmp(CmpInst::Predicate Pred, const ConstantRange &Other) const
Does the predicate Pred hold between ranges this and Other? NOTE: false does not mean that inverse pr...
Definition: ConstantRange.cpp:242

llvm::ConstantStruct::get
static Constant * get(StructType *T, ArrayRef< Constant * > V)
Definition: Constants.cpp:1356

llvm::Constant
This is an important base class in LLVM.
Definition: Constant.h:41

llvm::Constant::getIntegerValue
static Constant * getIntegerValue(Type *Ty, const APInt &V)
Return the value for an integer or pointer constant, or a vector thereof, with the given scalar value...
Definition: Constants.cpp:400

llvm::Constant::getAllOnesValue
static Constant * getAllOnesValue(Type *Ty)
Definition: Constants.cpp:417

llvm::Constant::getNullValue
static Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
Definition: Constants.cpp:370

llvm::DWARFExpression::Operation
This class represents an Operation in the Expression.
Definition: DWARFExpression.h:32

llvm::DataLayout
A parsed version of the target data layout string in and methods for querying it.
Definition: DataLayout.h:110

llvm::DataLayout::getPointerTypeSizeInBits
unsigned getPointerTypeSizeInBits(Type *) const
Layout pointer size, in bits, based on the type.
Definition: DataLayout.cpp:763

llvm::DenseMapBase::size
unsigned size() const
Definition: DenseMap.h:99

llvm::DenseMapBase::count
size_type count(const_arg_type_t< KeyT > Val) const
Return 1 if the specified key is in the map, 0 otherwise.
Definition: DenseMap.h:151

llvm::DenseMap
Definition: DenseMap.h:742

llvm::DominatorTree
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition: Dominators.h:162

llvm::ElementCount
Definition: TypeSize.h:297

llvm::FPExtInst
This class represents an extension of floating point types.
Definition: Instructions.h:5575

llvm::FastMathFlags
Convenience struct for specifying and reasoning about fast-math flags.
Definition: FMF.h:20

llvm::FastMathFlags::noSignedZeros
bool noSignedZeros() const
Definition: FMF.h:68

llvm::FastMathFlags::setNoSignedZeros
void setNoSignedZeros(bool B=true)
Definition: FMF.h:85

llvm::FastMathFlags::allowReassoc
bool allowReassoc() const
Flag queries.
Definition: FMF.h:65

llvm::FenceInst
An instruction for ordering other memory operations.
Definition: Instructions.h:460

llvm::FenceInst::getSyncScopeID
SyncScope::ID getSyncScopeID() const
Returns the synchronization scope ID of this fence instruction.
Definition: Instructions.h:498

llvm::FenceInst::getOrdering
AtomicOrdering getOrdering() const
Returns the ordering constraint of this fence instruction.
Definition: Instructions.h:487

llvm::FunctionType
Class to represent function types.
Definition: DerivedTypes.h:103

llvm::FunctionType::param_iterator
Type::subtype_iterator param_iterator
Definition: DerivedTypes.h:126

llvm::FunctionType::get
static FunctionType * get(Type *Result, ArrayRef< Type * > Params, bool isVarArg)
This static method is the primary way of constructing a FunctionType.

llvm::Function
Definition: Function.h:63

llvm::Function::isConvergent
bool isConvergent() const
Determine if the call is convergent.
Definition: Function.h:592

llvm::Function::getFunctionType
FunctionType * getFunctionType() const
Returns the FunctionType for me.
Definition: Function.h:202

llvm::Function::getCallingConv
CallingConv::ID getCallingConv() const
getCallingConv()/setCallingConv(CC) - These methods get and set the calling convention of this functio...
Definition: Function.h:264

llvm::Function::getAttributes
AttributeList getAttributes() const
Return the attribute list for this Function.
Definition: Function.h:340

llvm::Function::doesNotThrow
bool doesNotThrow() const
Determine if the function cannot unwind.
Definition: Function.h:576

llvm::Function::isIntrinsic
bool isIntrinsic() const
isIntrinsic - Returns true if the function's name starts with "llvm.".
Definition: Function.h:237

llvm::Function::hasFnAttribute
bool hasFnAttribute(Attribute::AttrKind Kind) const
Return true if the function has the attribute.
Definition: Function.cpp:677

llvm::GCRelocateInst
Represents calls to the gc.relocate intrinsic.
Definition: IntrinsicInst.h:1728

llvm::GCRelocateInst::getBasePtr
Value * getBasePtr() const
Definition: IntrinsicInst.cpp:891

llvm::GCRelocateInst::getBasePtrIndex
unsigned getBasePtrIndex() const
The index into the associated statepoint's argument list which contains the base pointer of the pointe...
Definition: IntrinsicInst.h:1741

llvm::GCRelocateInst::getDerivedPtr
Value * getDerivedPtr() const
Definition: IntrinsicInst.cpp:902

llvm::GCRelocateInst::getDerivedPtrIndex
unsigned getDerivedPtrIndex() const
The index into the associated statepoint's argument list which contains the pointer whose relocation t...
Definition: IntrinsicInst.h:1747

llvm::GCStatepointInst
Represents a gc.statepoint intrinsic call.
Definition: Statepoint.h:61

llvm::GCStatepointInst::getGCRelocates
std::vector< const GCRelocateInst * > getGCRelocates() const
Get list of all gc relocates linked to this statepoint. May contain several relocations for the same b...
Definition: Statepoint.h:206

llvm::GlobalObject::getMetadata
MDNode * getMetadata(unsigned KindID) const
Get the current metadata attachments for the given kind, if any.
Definition: Value.h:565

llvm::GlobalValue::isDeclaration
bool isDeclaration() const
Return true if the primary definition of this global value is outside of the current translation unit...
Definition: Globals.cpp:281

llvm::GlobalValue::getType
PointerType * getType() const
Global values are always pointers.
Definition: GlobalValue.h:294

llvm::GlobalVariable
Definition: GlobalVariable.h:39

llvm::IRBuilderBase::FastMathFlagGuard
Definition: IRBuilder.h:397

llvm::IRBuilderBase
Common base class shared among various IRBuilders.
Definition: IRBuilder.h:94

llvm::IRBuilderBase::CreateFCmpONE
Value * CreateFCmpONE(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2306

llvm::IRBuilderBase::CreateUnaryIntrinsic
CallInst * CreateUnaryIntrinsic(Intrinsic::ID ID, Value *V, Instruction *FMFSource=nullptr, const Twine &Name="")
Create a call to intrinsic ID with 1 operand which is mangled on its type.
Definition: IRBuilder.cpp:913

llvm::IRBuilderBase::CreateLaunderInvariantGroup
Value * CreateLaunderInvariantGroup(Value *Ptr)
Create a launder.invariant.group intrinsic call.
Definition: IRBuilder.cpp:1118

llvm::IRBuilderBase::CreateBinaryIntrinsic
Value * CreateBinaryIntrinsic(Intrinsic::ID ID, Value *LHS, Value *RHS, Instruction *FMFSource=nullptr, const Twine &Name="")
Create a call to intrinsic ID with 2 operands which is mangled on the first type.
Definition: IRBuilder.cpp:921

llvm::IRBuilderBase::CreateFCmp
Value * CreateFCmp(CmpInst::Predicate P, Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2361

llvm::IRBuilderBase::getInt1Ty
IntegerType * getInt1Ty()
Fetch the type representing a single bit.
Definition: IRBuilder.h:511

llvm::IRBuilderBase::CreateExtractElement
Value * CreateExtractElement(Value *Vec, Value *Idx, const Twine &Name="")
Definition: IRBuilder.h:2460

llvm::IRBuilderBase::getIntNTy
IntegerType * getIntNTy(unsigned N)
Fetch the type representing an N-bit integer.
Definition: IRBuilder.h:539

llvm::IRBuilderBase::CreateAlignedLoad
LoadInst * CreateAlignedLoad(Type *Ty, Value *Ptr, MaybeAlign Align, const char *Name)
Definition: IRBuilder.h:1807

llvm::IRBuilderBase::CreateFCmpORD
Value * CreateFCmpORD(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2311

llvm::IRBuilderBase::CreateZExtOrTrunc
Value * CreateZExtOrTrunc(Value *V, Type *DestTy, const Twine &Name="")
Create a ZExt or Trunc from the integer value V to DestTy.
Definition: IRBuilder.h:2039

llvm::IRBuilderBase::CreateFAdd
Value * CreateFAdd(Value *L, Value *R, const Twine &Name="", MDNode *FPMD=nullptr)
Definition: IRBuilder.h:1533

llvm::IRBuilderBase::CreateAndReduce
CallInst * CreateAndReduce(Value *Src)
Create a vector int AND reduction intrinsic of the source vector.
Definition: IRBuilder.cpp:441

llvm::IRBuilderBase::CreateVectorSplat
Value * CreateVectorSplat(unsigned NumElts, Value *V, const Twine &Name="")
Return a vector value that contains V broadcasted to NumElts elements.
Definition: IRBuilder.cpp:1193

llvm::IRBuilderBase::getTrue
ConstantInt * getTrue()
Get the constant value for i1 true.
Definition: IRBuilder.h:466

llvm::IRBuilderBase::CreateIntrinsic
CallInst * CreateIntrinsic(Intrinsic::ID ID, ArrayRef< Type * > Types, ArrayRef< Value * > Args, Instruction *FMFSource=nullptr, const Twine &Name="")
Create a call to intrinsic ID with Args, mangled using Types.
Definition: IRBuilder.cpp:932

llvm::IRBuilderBase::CreateFNegFMF
Value * CreateFNegFMF(Value *V, Instruction *FMFSource, const Twine &Name="")
Copy fast-math-flags from an instruction rather than using the builder's default FMF.
Definition: IRBuilder.h:1740

llvm::IRBuilderBase::CreateSelect
Value * CreateSelect(Value *C, Value *True, Value *False, const Twine &Name="", Instruction *MDFrom=nullptr)
Definition: IRBuilder.cpp:1091

llvm::IRBuilderBase::CreateInvoke
InvokeInst * CreateInvoke(FunctionType *Ty, Value *Callee, BasicBlock *NormalDest, BasicBlock *UnwindDest, ArrayRef< Value * > Args, ArrayRef< OperandBundleDef > OpBundles, const Twine &Name="")
Create an invoke instruction.
Definition: IRBuilder.h:1158

llvm::IRBuilderBase::CreateFCmpUNE
Value * CreateFCmpUNE(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2346

llvm::IRBuilderBase::CreateAddReduce
CallInst * CreateAddReduce(Value *Src)
Create a vector int add reduction intrinsic of the source vector.
Definition: IRBuilder.cpp:433

llvm::IRBuilderBase::CreateLShr
Value * CreateLShr(Value *LHS, Value *RHS, const Twine &Name="", bool isExact=false)
Definition: IRBuilder.h:1437

llvm::IRBuilderBase::getInt32Ty
IntegerType * getInt32Ty()
Fetch the type representing a 32-bit integer.
Definition: IRBuilder.h:526

llvm::IRBuilderBase::setFastMathFlags
void setFastMathFlags(FastMathFlags NewFMF)
Set the fast-math flags to be used with generated fp-math operators.
Definition: IRBuilder.h:311

llvm::IRBuilderBase::CreateNSWMul
Value * CreateNSWMul(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1370

llvm::IRBuilderBase::CreateICmpNE
Value * CreateICmpNE(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2245

llvm::IRBuilderBase::CreateNeg
Value * CreateNeg(Value *V, const Twine &Name="", bool HasNSW=false)
Definition: IRBuilder.h:1721

llvm::IRBuilderBase::CreateOrReduce
CallInst * CreateOrReduce(Value *Src)
Create a vector int OR reduction intrinsic of the source vector.
Definition: IRBuilder.cpp:445

llvm::IRBuilderBase::getInt32
ConstantInt * getInt32(uint32_t C)
Get a constant 32-bit value.
Definition: IRBuilder.h:486

llvm::IRBuilderBase::CreateBitOrPointerCast
Value * CreateBitOrPointerCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2205

llvm::IRBuilderBase::CreateNot
Value * CreateNot(Value *V, const Twine &Name="")
Definition: IRBuilder.h:1749

llvm::IRBuilderBase::CreateICmpEQ
Value * CreateICmpEQ(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2241

llvm::IRBuilderBase::CreateFCmpUEQ
Value * CreateFCmpUEQ(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2321

llvm::IRBuilderBase::CreateSub
Value * CreateSub(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1344

llvm::IRBuilderBase::CreateBitCast
Value * CreateBitCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2127

llvm::IRBuilderBase::CreateLoad
LoadInst * CreateLoad(Type *Ty, Value *Ptr, const char *Name)
Provided to resolve 'CreateLoad(Ty, Ptr, "...")' correctly, instead of converting the string to 'bool...
Definition: IRBuilder.h:1790

llvm::IRBuilderBase::CreateZExt
Value * CreateZExt(Value *V, Type *DestTy, const Twine &Name="", bool IsNonNeg=false)
Definition: IRBuilder.h:2021

llvm::IRBuilderBase::CreateShuffleVector
Value * CreateShuffleVector(Value *V1, Value *V2, Value *Mask, const Twine &Name="")
Definition: IRBuilder.h:2494

llvm::IRBuilderBase::CreateFCmpOEQ
Value * CreateFCmpOEQ(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2281

llvm::IRBuilderBase::CreateAnd
Value * CreateAnd(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1475

llvm::IRBuilderBase::CreateStore
StoreInst * CreateStore(Value *Val, Value *Ptr, bool isVolatile=false)
Definition: IRBuilder.h:1803

llvm::IRBuilderBase::CreateAdd
Value * CreateAdd(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1327

llvm::IRBuilderBase::getFalse
ConstantInt * getFalse()
Get the constant value for i1 false.
Definition: IRBuilder.h:471

llvm::IRBuilderBase::CreateIsNotNull
Value * CreateIsNotNull(Value *Arg, const Twine &Name="")
Return a boolean value testing if Arg != 0.
Definition: IRBuilder.h:2549

llvm::IRBuilderBase::CreateTrunc
Value * CreateTrunc(Value *V, Type *DestTy, const Twine &Name="", bool IsNUW=false, bool IsNSW=false)
Definition: IRBuilder.h:2007

llvm::IRBuilderBase::CreateElementCount
Value * CreateElementCount(Type *DstType, ElementCount EC)
Create an expression which evaluates to the number of elements in EC at runtime.
Definition: IRBuilder.cpp:99

llvm::IRBuilderBase::CreateCast
Value * CreateCast(Instruction::CastOps Op, Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2161

llvm::IRBuilderBase::CreateIntCast
Value * CreateIntCast(Value *V, Type *DestTy, bool isSigned, const Twine &Name="")
Definition: IRBuilder.h:2196

llvm::IRBuilderBase::CreateFCmpUNO
Value * CreateFCmpUNO(Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2316

llvm::IRBuilderBase::CreateCall
CallInst * CreateCall(FunctionType *FTy, Value *Callee, ArrayRef< Value * > Args=std::nullopt, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2412

llvm::IRBuilderBase::CreateICmp
Value * CreateICmp(CmpInst::Predicate P, Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2351

llvm::IRBuilderBase::CreateFMul
Value * CreateFMul(Value *L, Value *R, const Twine &Name="", MDNode *FPMD=nullptr)
Definition: IRBuilder.h:1587

llvm::IRBuilderBase::CreateFNeg
Value * CreateFNeg(Value *V, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:1730

llvm::IRBuilderBase::CreateAddrSpaceCast
Value * CreateAddrSpaceCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2132

llvm::IRBuilderBase::CreateMul
Value * CreateMul(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1361

llvm::IRBuilderBase::CreateStripInvariantGroup
Value * CreateStripInvariantGroup(Value *Ptr)
Create a strip.invariant.group intrinsic call.
Definition: IRBuilder.cpp:1134

llvm::IRBuilder< TargetFolder, IRBuilderCallbackInserter >

llvm::InlineAsm
Definition: InlineAsm.h:34

llvm::InsertValueInst::Create
static InsertValueInst * Create(Value *Agg, Value *Val, ArrayRef< unsigned > Idxs, const Twine &NameStr, BasicBlock::iterator InsertBefore)
Definition: Instructions.h:2854

llvm::InstCombinerImpl
Definition: InstCombineInternal.h:64

llvm::InstCombinerImpl::FoldOpIntoSelect
Instruction * FoldOpIntoSelect(Instruction &Op, SelectInst *SI, bool FoldWithMultiUse=false)
Given an instruction with a select as one operand and a constant as the other operand,...
Definition: InstructionCombining.cpp:1683

llvm::InstCombinerImpl::computeKnownFPClass
KnownFPClass computeKnownFPClass(Value *Val, FastMathFlags FMF, FPClassTest Interested=fcAllFlags, const Instruction *CtxI=nullptr, unsigned Depth=0) const
Definition: InstCombineInternal.h:202

llvm::InstCombinerImpl::SimplifyDemandedBits
bool SimplifyDemandedBits(Instruction *I, unsigned Op, const APInt &DemandedMask, KnownBits &Known, unsigned Depth=0) override
This form of SimplifyDemandedBits simplifies the specified instruction operand if possible,...
Definition: InstCombineSimplifyDemanded.cpp:89

llvm::InstCombinerImpl::SimplifyDemandedVectorElts
Value * SimplifyDemandedVectorElts(Value *V, APInt DemandedElts, APInt &PoisonElts, unsigned Depth=0, bool AllowMultipleUsers=false) override
The specified value produces a vector with any number of elements.
Definition: InstCombineSimplifyDemanded.cpp:1415

llvm::InstCombinerImpl::SimplifyAnyMemSet
Instruction * SimplifyAnyMemSet(AnyMemSetInst *MI)
Definition: InstCombineCalls.cpp:217

llvm::InstCombinerImpl::getLosslessUnsignedTrunc
Constant * getLosslessUnsignedTrunc(Constant *C, Type *TruncTy)
Definition: InstCombineInternal.h:233

llvm::InstCombinerImpl::visitFree
Instruction * visitFree(CallInst &FI, Value *FreedOp)
Definition: InstructionCombining.cpp:3409

llvm::InstCombinerImpl::visitCallBrInst
Instruction * visitCallBrInst(CallBrInst &CBI)
Definition: InstCombineCalls.cpp:3508

llvm::InstCombinerImpl::eraseInstFromFunction
Instruction * eraseInstFromFunction(Instruction &I) override
Combiner aware instruction erasure.
Definition: InstCombineInternal.h:473

llvm::InstCombinerImpl::visitFenceInst
Instruction * visitFenceInst(FenceInst &FI)
Definition: InstCombineCalls.cpp:3475

llvm::InstCombinerImpl::visitInvokeInst
Instruction * visitInvokeInst(InvokeInst &II)
Definition: InstCombineCalls.cpp:3503

llvm::InstCombinerImpl::getLosslessSignedTrunc
Constant * getLosslessSignedTrunc(Constant *C, Type *TruncTy)
Definition: InstCombineInternal.h:237

llvm::InstCombinerImpl::SimplifyDemandedInstructionBits
bool SimplifyDemandedInstructionBits(Instruction &Inst)
Tries to simplify operands to an integer instruction based on its demanded bits.
Definition: InstCombineSimplifyDemanded.cpp:81

llvm::InstCombinerImpl::CreateNonTerminatorUnreachable
void CreateNonTerminatorUnreachable(Instruction *InsertAt)
Create and insert the idiom we use to indicate a block is unreachable without having to rewrite the C...
Definition: InstCombineInternal.h:460

llvm::InstCombinerImpl::visitVAEndInst
Instruction * visitVAEndInst(VAEndInst &I)
Definition: InstCombineCalls.cpp:793

llvm::InstCombinerImpl::matchBSwapOrBitReverse
Instruction * matchBSwapOrBitReverse(Instruction &I, bool MatchBSwaps, bool MatchBitReversals)
Given an initial instruction, check to see if it is the root of a bswap/bitreverse idiom.
Definition: InstCombineAndOrXor.cpp:2786

llvm::InstCombinerImpl::visitAllocSite
Instruction * visitAllocSite(Instruction &FI)
Definition: InstructionCombining.cpp:3193

llvm::InstCombinerImpl::SimplifyAnyMemTransfer
Instruction * SimplifyAnyMemTransfer(AnyMemTransferInst *MI)
Definition: InstCombineCalls.cpp:115

llvm::InstCombinerImpl::computeOverflow
OverflowResult computeOverflow(Instruction::BinaryOps BinaryOp, bool IsSigned, Value *LHS, Value *RHS, Instruction *CxtI) const
Definition: InstCombineCompares.cpp:5930

llvm::InstCombinerImpl::visitCallInst
Instruction * visitCallInst(CallInst &CI)
CallInst simplification.
Definition: InstCombineCalls.cpp:1441

llvm::InstCombiner::SQ
SimplifyQuery SQ
Definition: InstCombiner.h:76

llvm::InstCombiner::isFreeToInvert
bool isFreeToInvert(Value *V, bool WillInvertAllUses, bool &DoesConsume)
Return true if the specified value is free to invert (apply ~ to).
Definition: InstCombiner.h:232

llvm::InstCombiner::getDominatorTree
DominatorTree & getDominatorTree() const
Definition: InstCombiner.h:340

llvm::InstCombiner::BFI
BlockFrequencyInfo * BFI
Definition: InstCombiner.h:78

llvm::InstCombiner::TLI
TargetLibraryInfo & TLI
Definition: InstCombiner.h:73

llvm::InstCombiner::isKnownToBeAPowerOfTwo
bool isKnownToBeAPowerOfTwo(const Value *V, bool OrZero=false, unsigned Depth=0, const Instruction *CxtI=nullptr)
Definition: InstCombiner.h:441

llvm::InstCombiner::InsertNewInstBefore
Instruction * InsertNewInstBefore(Instruction *New, BasicBlock::iterator Old)
Inserts an instruction New before instruction Old.
Definition: InstCombiner.h:366

llvm::InstCombiner::AA
AAResults * AA
Definition: InstCombiner.h:69

llvm::InstCombiner::replaceInstUsesWith
Instruction * replaceInstUsesWith(Instruction &I, Value *V)
A combiner-aware RAUW-like routine.
Definition: InstCombiner.h:386

llvm::InstCombiner::LI
LoopInfo * LI
Definition: InstCombiner.h:85

llvm::InstCombiner::replaceUse
void replaceUse(Use &U, Value *NewValue)
Replace use and add the previously used value to the worklist.
Definition: InstCombiner.h:418

llvm::InstCombiner::Worklist
InstructionWorklist & Worklist
A worklist of the instructions that need to be simplified.
Definition: InstCombiner.h:64

llvm::InstCombiner::DL
const DataLayout & DL
Definition: InstCombiner.h:75

llvm::InstCombiner::targetInstCombineIntrinsic
std::optional< Instruction * > targetInstCombineIntrinsic(IntrinsicInst &II)
Definition: InstructionCombining.cpp:156

llvm::InstCombiner::AC
AssumptionCache & AC
Definition: InstCombiner.h:72

llvm::InstCombiner::replaceOperand
Instruction * replaceOperand(Instruction &I, unsigned OpNum, Value *V)
Replace operand of instruction and add old operand to the worklist.
Definition: InstCombiner.h:410

llvm::InstCombiner::DT
DominatorTree & DT
Definition: InstCombiner.h:74

llvm::InstCombiner::PSI
ProfileSummaryInfo * PSI
Definition: InstCombiner.h:80

llvm::InstCombiner::computeKnownBits
void computeKnownBits(const Value *V, KnownBits &Known, unsigned Depth, const Instruction *CxtI) const
Definition: InstCombiner.h:431

llvm::InstCombiner::Builder
BuilderTy & Builder
Definition: InstCombiner.h:60

llvm::InstCombiner::getAssumptionCache
AssumptionCache & getAssumptionCache() const
Definition: InstCombiner.h:338

llvm::InstCombiner::MaskedValueIsZero
bool MaskedValueIsZero(const Value *V, const APInt &Mask, unsigned Depth=0, const Instruction *CxtI=nullptr) const
Definition: InstCombiner.h:447

llvm::InstCombiner::ORE
OptimizationRemarkEmitter & ORE
Definition: InstCombiner.h:77

llvm::InstCombiner::getFreelyInverted
Value * getFreelyInverted(Value *V, bool WillInvertAllUses, BuilderTy *Builder, bool &DoesConsume)
Definition: InstCombiner.h:213

llvm::InstCombiner::getSimplifyQuery
const SimplifyQuery & getSimplifyQuery() const
Definition: InstCombiner.h:342

llvm::InstCombiner::ComputeMaxSignificantBits
unsigned ComputeMaxSignificantBits(const Value *Op, unsigned Depth=0, const Instruction *CxtI=nullptr) const
Definition: InstCombiner.h:457

llvm::InstructionWorklist::pushValue
void pushValue(Value *V)
Definition: InstructionWorklist.h:68

llvm::InstructionWorklist::pushUsersToWorkList
void pushUsersToWorkList(Instruction &I)
When an instruction is simplified, add all users of the instruction to the work lists because they mi...
Definition: InstructionWorklist.h:106

llvm::InstructionWorklist::add
void add(Instruction *I)
Add instruction to the worklist.
Definition: InstructionWorklist.h:44

llvm::Instruction
Definition: Instruction.h:49

llvm::Instruction::copyFastMathFlags
void copyFastMathFlags(FastMathFlags FMF)
Convenience function for transferring all fast-math flag values to this instruction,...
Definition: Instruction.cpp:577

llvm::Instruction::mayWriteToMemory
bool mayWriteToMemory() const LLVM_READONLY
Return true if this instruction may modify memory.
Definition: Instruction.cpp:959

llvm::Instruction::copyIRFlags
void copyIRFlags(const Value *V, bool IncludeWrapFlags=true)
Convenience method to copy supported exact, fast-math, and (optionally) wrapping flags from V to this...
Definition: Instruction.cpp:631

llvm::Instruction::getModule
const Module * getModule() const
Return the module owning the function this instruction belongs to or nullptr if the function does not...
Definition: Instruction.cpp:83

llvm::Instruction::setAAMetadata
void setAAMetadata(const AAMDNodes &N)
Sets the AA metadata on this instruction from the AAMDNodes structure.
Definition: Metadata.cpp:1720

llvm::Instruction::andIRFlags
void andIRFlags(const Value *V)
Logical 'and' of any supported wrapping, exact, and fast-math flags of V and this instruction.
Definition: Instruction.cpp:670

llvm::Instruction::getPrevNonDebugInstruction
const Instruction * getPrevNonDebugInstruction(bool SkipPseudoOp=false) const
Return a pointer to the previous non-debug instruction in the same basic block as 'this',...
Definition: Instruction.cpp:1182

llvm::Instruction::setFastMathFlags
void setFastMathFlags(FastMathFlags FMF)
Convenience function for setting multiple fast-math flags on this instruction, which must be an opera...
Definition: Instruction.cpp:572

llvm::Instruction::getParent
const BasicBlock * getParent() const
Definition: Instruction.h:152

llvm::Instruction::isFast
bool isFast() const LLVM_READONLY
Determine whether all fast-math-flags are set.
Definition: Instruction.cpp:582

llvm::Instruction::user_back
Instruction * user_back()
Specialize the methods defined in Value, as we know that an instruction can only be used by other ins...
Definition: Instruction.h:149

llvm::Instruction::getFunction
const Function * getFunction() const
Return the function this instruction belongs to.
Definition: Instruction.cpp:87

llvm::Instruction::getMetadata
MDNode * getMetadata(unsigned KindID) const
Get the metadata of given kind attached to this Instruction.
Definition: Instruction.h:359

llvm::Instruction::mayHaveSideEffects
bool mayHaveSideEffects() const LLVM_READONLY
Return true if the instruction may have side effects.
Definition: Instruction.cpp:1133

llvm::Instruction::getNextNonDebugInstruction
const Instruction * getNextNonDebugInstruction(bool SkipPseudoOp=false) const
Return a pointer to the next non-debug instruction in the same basic block as 'this',...
Definition: Instruction.cpp:1174

llvm::Instruction::setMetadata
void setMetadata(unsigned KindID, MDNode *Node)
Set the metadata of the specified kind to the specified node.
Definition: Metadata.cpp:1635

llvm::Instruction::getFastMathFlags
FastMathFlags getFastMathFlags() const LLVM_READONLY
Convenience function for getting all the fast-math flags, which must be an operator which supports th...
Definition: Instruction.cpp:622

llvm::Instruction::getOpcode
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
Definition: Instruction.h:252

llvm::Instruction::BinaryOps
BinaryOps
Definition: Instruction.h:947

llvm::Instruction::getInsertionPointAfterDef
std::optional< InstListType::iterator > getInsertionPointAfterDef()
Get the first insertion point at which the result of this instruction is defined.
Definition: Instruction.cpp:340

llvm::Instruction::isIdenticalTo
bool isIdenticalTo(const Instruction *I) const LLVM_READONLY
Return true if the specified instruction is exactly identical to the current one.
Definition: Instruction.cpp:865

llvm::Instruction::setDebugLoc
void setDebugLoc(DebugLoc Loc)
Set the debug location information for this instruction.
Definition: Instruction.h:451

llvm::Instruction::copyMetadata
void copyMetadata(const Instruction &SrcInst, ArrayRef< unsigned > WL=ArrayRef< unsigned >())
Copy metadata from SrcInst to this instruction.
Definition: Instruction.cpp:1279

llvm::Instruction::hasAllowReassoc
bool hasAllowReassoc() const LLVM_READONLY
Determine whether the allow-reassociation flag is set.
Definition: Instruction.cpp:587

llvm::Instruction::moveBefore
void moveBefore(Instruction *MovePos)
Unlink this instruction from its current basic block and insert it into the basic block that MovePos ...
Definition: Instruction.cpp:180

llvm::Instruction::CastOps
CastOps
Definition: Instruction.h:961

llvm::IntegerType
Class to represent integer types.
Definition: DerivedTypes.h:40

llvm::IntegerType::get
static IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition: Type.cpp:278

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition: IntrinsicInst.h:47

llvm::IntrinsicInst::getIntrinsicID
Intrinsic::ID getIntrinsicID() const
Return the intrinsic ID of this intrinsic.
Definition: IntrinsicInst.h:54

llvm::IntrinsicInst::isCommutative
bool isCommutative() const
Return true if swapping the first two arguments to the intrinsic produces the same result.
Definition: IntrinsicInst.h:72

llvm::InvokeInst
Invoke instruction.
Definition: Instructions.h:4160

llvm::InvokeInst::Create
static InvokeInst * Create(FunctionType *Ty, Value *Func, BasicBlock *IfNormal, BasicBlock *IfException, ArrayRef< Value * > Args, const Twine &NameStr, BasicBlock::iterator InsertBefore)
Definition: Instructions.h:4210

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:67

llvm::LLVMContext::OB_kcfi
@ OB_kcfi
Definition: LLVMContext.h:97

llvm::LLVMContext::OB_gc_live
@ OB_gc_live
Definition: LLVMContext.h:94

llvm::LibCallSimplifier
LibCallSimplifier - This class implements a collection of optimizations that replace well formed call...
Definition: SimplifyLibCalls.h:101

llvm::LoadInst
An instruction for reading from memory.
Definition: Instructions.h:184

llvm::MDNode
Metadata node.
Definition: Metadata.h:1067

llvm::MDNode::get
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
Definition: Metadata.h:1541

llvm::MinMaxIntrinsic::getPredicate
ICmpInst::Predicate getPredicate() const
Returns the comparison predicate underlying the intrinsic.
Definition: IntrinsicInst.h:783

llvm::MinMaxIntrinsic::isSigned
bool isSigned() const
Whether the intrinsic is signed or unsigned.
Definition: IntrinsicInst.h:793

llvm::Module
A Module instance is used to store all the information related to an LLVM module.
Definition: Module.h:65

llvm::Module::getDataLayout
const DataLayout & getDataLayout() const
Get the data layout for the module's target platform.
Definition: Module.h:293

llvm::OperandBundleDefT
A container for an operand bundle being viewed as a set of values rather than a set of uses.
Definition: InstrTypes.h:1447

llvm::PHINode
Definition: Instructions.h:2973

llvm::PoisonValue::get
static PoisonValue * get(Type *T)
Static factory methods - Return a 'poison' object of the specified type.
Definition: Constants.cpp:1827

llvm::SaturatingInst
Represents a saturating add/sub intrinsic.
Definition: IntrinsicInst.h:896

llvm::SelectInst
This class represents the LLVM 'select' instruction.
Definition: Instructions.h:1860

llvm::SelectInst::Create
static SelectInst * Create(Value *C, Value *S1, Value *S2, const Twine &NameStr, BasicBlock::iterator InsertBefore, Instruction *MDFrom=nullptr)
Definition: Instructions.h:1899

llvm::ShuffleVectorInst
This instruction constructs a fixed permutation of two input vectors.
Definition: Instructions.h:2171

llvm::SmallBitVector
This is a 'bitvector' (really, a variable-sized bit array), optimized for the case when the array is ...
Definition: SmallBitVector.h:35

llvm::SmallBitVector::set
SmallBitVector & set()
Definition: SmallBitVector.h:366

llvm::SmallBitVector::test
bool test(unsigned Idx) const
Definition: SmallBitVector.h:472

llvm::SmallBitVector::all
bool all() const
Returns true if all bits are set.
Definition: SmallBitVector.h:216

llvm::SmallPtrSetImplBase::size
size_type size() const
Definition: SmallPtrSet.h:94

llvm::SmallPtrSetImpl::count
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
Definition: SmallPtrSet.h:360

llvm::SmallPtrSetImpl::insert
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
Definition: SmallPtrSet.h:342

llvm::SmallPtrSet
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or fewer elements.
Definition: SmallPtrSet.h:427

llvm::SmallVectorBase::empty
bool empty() const
Definition: SmallVector.h:94

llvm::SmallVectorBase::size
size_t size() const
Definition: SmallVector.h:91

llvm::SmallVectorImpl::reserve
void reserve(size_type N)
Definition: SmallVector.h:676

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:426

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1209

llvm::StoreInst
An instruction for storing to memory.
Definition: Instructions.h:317

llvm::StoreInst::setVolatile
void setVolatile(bool V)
Specify whether this is a volatile store or not.
Definition: Instructions.h:364

llvm::StoreInst::setAlignment
void setAlignment(Align Align)
Definition: Instructions.h:373

llvm::StoreInst::setOrdering
void setOrdering(AtomicOrdering Ordering)
Sets the ordering constraint of this store instruction.
Definition: Instructions.h:384

llvm::StructType
Class to represent struct types.
Definition: DerivedTypes.h:216

llvm::TargetLibraryInfoImpl::isCallingConvCCompatible
static bool isCallingConvCCompatible(CallBase *CI)
Returns true if call site / callee has cdecl-compatible calling conventions.
Definition: TargetLibraryInfo.cpp:151

llvm::TargetLibraryInfo
Provides information about what library functions are available for the current target.
Definition: TargetLibraryInfo.h:281

llvm::TruncInst
This class represents a truncation of integer types.
Definition: Instructions.h:5352

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::getIntegerBitWidth
unsigned getIntegerBitWidth() const

llvm::Type::getFltSemantics
const fltSemantics & getFltSemantics() const

llvm::Type::isIntOrIntVectorTy
bool isIntOrIntVectorTy() const
Return true if this is an integer type or a vector of integer types.
Definition: Type.h:234

llvm::Type::isPointerTy
bool isPointerTy() const
True if this is an instance of PointerType.
Definition: Type.h:255

llvm::Type::getPointerAddressSpace
unsigned getPointerAddressSpace() const
Get the address space of this pointer or pointer vector type.

llvm::Type::getScalarSizeInBits
unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.

llvm::Type::isStructTy
bool isStructTy() const
True if this is an instance of StructType.
Definition: Type.h:249

llvm::Type::getWithNewBitWidth
Type * getWithNewBitWidth(unsigned NewBitWidth) const
Given an integer or vector type, change the lane bitwidth to NewBitWidth, whilst keeping the old numb...

llvm::Type::getContext
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
Definition: Type.h:129

llvm::Type::canLosslesslyBitCastTo
bool canLosslesslyBitCastTo(Type *Ty) const
Return true if this type could be converted with a lossless BitCast to type 'Ty'.

llvm::Type::getInt32Ty
static IntegerType * getInt32Ty(LLVMContext &C)

llvm::Type::getInt64Ty
static IntegerType * getInt64Ty(LLVMContext &C)

llvm::Type::isIntegerTy
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition: Type.h:228

llvm::Type::isVoidTy
bool isVoidTy() const
Return true if this is 'void'.
Definition: Type.h:140

llvm::Type::getScalarType
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition: Type.h:348

llvm::UnaryOperator::CreateWithCopiedFlags
static UnaryOperator * CreateWithCopiedFlags(UnaryOps Opc, Value *V, Instruction *CopyO, const Twine &Name, BasicBlock::iterator InsertBefore)
Definition: InstrTypes.h:175

llvm::UndefValue::get
static UndefValue * get(Type *T)
Static factory methods - Return an 'undef' object of the specified type.
Definition: Constants.cpp:1808

llvm::Use
A Use represents the edge between a Value definition and its users.
Definition: Use.h:43

llvm::Use::set
void set(Value *Val)
Definition: Value.h:882

llvm::User
Definition: User.h:44

llvm::User::op_begin
op_iterator op_begin()
Definition: User.h:234

llvm::User::getOperandUse
const Use & getOperandUse(unsigned i) const
Definition: User.h:182

llvm::User::setOperand
void setOperand(unsigned i, Value *Val)
Definition: User.h:174

llvm::User::getOperand
Value * getOperand(unsigned i) const
Definition: User.h:169

llvm::VAEndInst
This represents the llvm.va_end intrinsic.
Definition: IntrinsicInst.h:1404

llvm::ValueHandleBase::ValueIsDeleted
static void ValueIsDeleted(Value *V)
Definition: Value.cpp:1201

llvm::ValueHandleBase::ValueIsRAUWd
static void ValueIsRAUWd(Value *Old, Value *New)
Definition: Value.cpp:1254

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition: Value.h:255

llvm::Value::MaximumAlignment
static constexpr uint64_t MaximumAlignment
Definition: Value.h:807

llvm::Value::setMetadata
void setMetadata(unsigned KindID, MDNode *Node)
Set a particular kind of metadata attachment.
Definition: Metadata.cpp:1487

llvm::Value::hasOneUse
bool hasOneUse() const
Return true if there is exactly one use of this value.
Definition: Value.h:434

llvm::Value::users
iterator_range< user_iterator > users()
Definition: Value.h:421

llvm::Value::dropDroppableUse
static void dropDroppableUse(Use &U)
Remove the droppable use U.
Definition: Value.cpp:217

llvm::Value::stripPointerCasts
const Value * stripPointerCasts() const
Strip off pointer casts, all-zero GEPs and address space casts.
Definition: Value.cpp:693

llvm::Value::use_empty
bool use_empty() const
Definition: Value.h:344

llvm::Value::getContext
LLVMContext & getContext() const
All values hold a context through their type.
Definition: Value.cpp:1074

llvm::Value::MaxAlignmentExponent
static constexpr unsigned MaxAlignmentExponent
The maximum alignment for instructions.
Definition: Value.h:806

llvm::Value::getName
StringRef getName() const
Return a constant reference to the value's name.
Definition: Value.cpp:309

llvm::Value::takeName
void takeName(Value *V)
Transfer the name from V to this value.
Definition: Value.cpp:383

llvm::VectorType
Base class of all SIMD vector types.
Definition: DerivedTypes.h:403

llvm::VectorType::getElementCount
ElementCount getElementCount() const
Return an ElementCount instance to represent the (possibly scalable) number of elements in the vector...
Definition: DerivedTypes.h:641

llvm::WithOverflowInst
Represents an op.with.overflow intrinsic.
Definition: IntrinsicInst.h:875

llvm::cl::opt
Definition: CommandLine.h:1430

llvm::details::FixedOrScalableQuantity< ElementCount, unsigned >::isKnownLT
static constexpr bool isKnownLT(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
Definition: TypeSize.h:215

llvm::details::FixedOrScalableQuantity< ElementCount, unsigned >::isKnownGT
static constexpr bool isKnownGT(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
Definition: TypeSize.h:222

llvm::ilist_node_impl::getIterator
self_iterator getIterator()
Definition: ilist_node.h:109

uint32_t

uint64_t

unsigned

DebugInfo.h

ErrorHandling.h

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:143

llvm::AArch64PACKey::IA
@ IA
Definition: AArch64BaseInfo.h:820

llvm::AMDGPU::HSAMD::Kernel::Key::Args
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
Definition: AMDGPUMetadata.h:395

llvm::AMDGPU::HSAMD::Kernel::Key::Attrs
constexpr char Attrs[]
Key for Kernel::Metadata::mAttrs.
Definition: AMDGPUMetadata.h:393

llvm::AttributeFuncs::ASK_UNSAFE_TO_DROP
@ ASK_UNSAFE_TO_DROP
Definition: Attributes.h:1235

llvm::AttributeFuncs::ASK_SAFE_TO_DROP
@ ASK_SAFE_TO_DROP
Definition: Attributes.h:1234

llvm::AttributeFuncs::typeIncompatible
AttributeMask typeIncompatible(Type *Ty, AttributeSafetyKind ASK=ASK_ALL)
Which attributes cannot be applied to a type.
Definition: Attributes.cpp:2021

llvm::BitmaskEnumDetail::Mask
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
Definition: BitmaskEnum.h:121

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34

llvm::Intrinsic::getDeclaration
Function * getDeclaration(Module *M, ID id, ArrayRef< Type * > Tys=std::nullopt)
Create or insert an LLVM Function declaration for an intrinsic, and return it.
Definition: Function.cpp:1471

llvm::M68k::MemAddrModeKind::V
@ V

llvm::M68k::MemAddrModeKind::L
@ L

llvm::MCID::Call
@ Call
Definition: MCInstrDesc.h:156

llvm::PatternMatch::m_AllOnes
cst_pred_ty< is_all_ones > m_AllOnes()
Match an integer or vector with all bits set.
Definition: PatternMatch.h:524

llvm::PatternMatch::m_And
BinaryOp_match< LHS, RHS, Instruction::And > m_And(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1206

llvm::PatternMatch::m_Add
BinaryOp_match< LHS, RHS, Instruction::Add > m_Add(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1092

llvm::PatternMatch::m_BinOp
class_match< BinaryOperator > m_BinOp()
Match an arbitrary binary operation and ignore it.
Definition: PatternMatch.h:100

llvm::PatternMatch::m_BitReverse
m_Intrinsic_Ty< Opnd0 >::Ty m_BitReverse(const Opnd0 &Op0)
Definition: PatternMatch.h:2526

llvm::PatternMatch::m_Constant
class_match< Constant > m_Constant()
Match an arbitrary Constant and ignore it.
Definition: PatternMatch.h:165

llvm::PatternMatch::m_c_And
BinaryOp_match< LHS, RHS, Instruction::And, true > m_c_And(const LHS &L, const RHS &R)
Matches an And with LHS and RHS in either order.
Definition: PatternMatch.h:2627

llvm::PatternMatch::m_Xor
BinaryOp_match< LHS, RHS, Instruction::Xor > m_Xor(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1218

llvm::PatternMatch::m_NSWSub
OverflowingBinaryOp_match< LHS, RHS, Instruction::Sub, OverflowingBinaryOperator::NoSignedWrap > m_NSWSub(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1279

llvm::PatternMatch::m_SpecificInt
specific_intval< false > m_SpecificInt(const APInt &V)
Match a specific integer value or vector with all elements equal to the value.
Definition: PatternMatch.h:972

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition: PatternMatch.h:49

llvm::PatternMatch::m_Instruction
bind_ty< Instruction > m_Instruction(Instruction *&I)
Match an instruction, capturing it if we match.
Definition: PatternMatch.h:816

llvm::PatternMatch::m_Specific
specificval_ty m_Specific(const Value *V)
Match if we have a specific specified value.
Definition: PatternMatch.h:875

llvm::PatternMatch::m_NSWNeg
OverflowingBinaryOp_match< cst_pred_ty< is_zero_int >, ValTy, Instruction::Sub, OverflowingBinaryOperator::NoSignedWrap > m_NSWNeg(const ValTy &V)
Matches a 'Neg' as 'sub nsw 0, V'.
Definition: PatternMatch.h:2658

llvm::PatternMatch::m_ConstantInt
class_match< ConstantInt > m_ConstantInt()
Match an arbitrary ConstantInt and ignore it.
Definition: PatternMatch.h:168

llvm::PatternMatch::m_One
cst_pred_ty< is_one > m_One()
Match an integer 1 or a vector with all elements equal to 1.
Definition: PatternMatch.h:592

llvm::PatternMatch::m_Select
ThreeOps_match< Cond, LHS, RHS, Instruction::Select > m_Select(const Cond &C, const LHS &L, const RHS &R)
Matches SelectInst.
Definition: PatternMatch.h:1683

llvm::PatternMatch::m_NegZeroFP
cstfp_pred_ty< is_neg_zero_fp > m_NegZeroFP()
Match a floating-point negative zero.
Definition: PatternMatch.h:782

llvm::PatternMatch::m_LogicalShift
BinOpPred_match< LHS, RHS, is_logical_shift_op > m_LogicalShift(const LHS &L, const RHS &R)
Matches logical shift operations.
Definition: PatternMatch.h:1495

llvm::PatternMatch::m_CombineAnd
match_combine_and< LTy, RTy > m_CombineAnd(const LTy &L, const RTy &R)
Combine two pattern matchers matching L && R.
Definition: PatternMatch.h:245

llvm::PatternMatch::m_SMin
MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty > m_SMin(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2224

llvm::PatternMatch::m_Trunc
CastOperator_match< OpTy, Instruction::Trunc > m_Trunc(const OpTy &Op)
Matches Trunc.
Definition: PatternMatch.h:1951

llvm::PatternMatch::m_c_Xor
BinaryOp_match< LHS, RHS, Instruction::Xor, true > m_c_Xor(const LHS &L, const RHS &R)
Matches an Xor with LHS and RHS in either order.
Definition: PatternMatch.h:2641

llvm::PatternMatch::m_Deferred
deferredval_ty< Value > m_Deferred(Value *const &V)
Like m_Specific(), but works if the specific value to match is determined as part of the same match()...
Definition: PatternMatch.h:893

llvm::PatternMatch::m_ZeroInt
cst_pred_ty< is_zero_int > m_ZeroInt()
Match an integer 0 or a vector with all elements equal to 0.
Definition: PatternMatch.h:599

llvm::PatternMatch::m_APIntAllowPoison
apint_match m_APIntAllowPoison(const APInt *&Res)
Match APInt while allowing poison in splat vector constants.
Definition: PatternMatch.h:305

llvm::PatternMatch::m_ICmp
CmpClass_match< LHS, RHS, ICmpInst, ICmpInst::Predicate > m_ICmp(ICmpInst::Predicate &Pred, const LHS &L, const RHS &R)
Definition: PatternMatch.h:1585

llvm::PatternMatch::m_ZExtOrSExtOrSelf
match_combine_or< match_combine_or< CastInst_match< OpTy, ZExtInst >, CastInst_match< OpTy, SExtInst > >, OpTy > m_ZExtOrSExtOrSelf(const OpTy &Op)
Definition: PatternMatch.h:2022

llvm::PatternMatch::m_OneUse
OneUse_match< T > m_OneUse(const T &SubPattern)
Definition: PatternMatch.h:67

llvm::PatternMatch::m_LogicalOr
auto m_LogicalOr()
Matches L || R where L and R are arbitrary values.
Definition: PatternMatch.h:2933

llvm::PatternMatch::m_Neg
BinaryOp_match< cst_pred_ty< is_zero_int >, ValTy, Instruction::Sub > m_Neg(const ValTy &V)
Matches a 'Neg' as 'sub 0, V'.
Definition: PatternMatch.h:2649

llvm::PatternMatch::m_Shuffle
TwoOps_match< V1_t, V2_t, Instruction::ShuffleVector > m_Shuffle(const V1_t &v1, const V2_t &v2)
Matches ShuffleVectorInst independently of mask value.
Definition: PatternMatch.h:1787

llvm::PatternMatch::m_ImmConstant
match_combine_and< class_match< Constant >, match_unless< constantexpr_match > > m_ImmConstant()
Match an arbitrary immediate Constant and ignore it.
Definition: PatternMatch.h:854

llvm::PatternMatch::m_FPExt
CastInst_match< OpTy, FPExtInst > m_FPExt(const OpTy &Op)
Definition: PatternMatch.h:2052

llvm::PatternMatch::m_ZExt
CastInst_match< OpTy, ZExtInst > m_ZExt(const OpTy &Op)
Matches ZExt.
Definition: PatternMatch.h:1983

llvm::PatternMatch::m_NUWShl
OverflowingBinaryOp_match< LHS, RHS, Instruction::Shl, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWShl(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1338

llvm::PatternMatch::m_UMax
MaxMin_match< ICmpInst, LHS, RHS, umax_pred_ty > m_UMax(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2230

llvm::PatternMatch::m_Cmp
class_match< CmpInst > m_Cmp()
Matches any compare instruction and ignores it.
Definition: PatternMatch.h:105

llvm::PatternMatch::m_NegatedPower2
cst_pred_ty< is_negated_power2 > m_NegatedPower2()
Match an integer or vector negated power-of-2.
Definition: PatternMatch.h:627

llvm::PatternMatch::m_FShl
m_Intrinsic_Ty< Opnd0, Opnd1, Opnd2 >::Ty m_FShl(const Opnd0 &Op0, const Opnd1 &Op1, const Opnd2 &Op2)
Definition: PatternMatch.h:2559

llvm::PatternMatch::m_c_MaxOrMin
match_combine_or< match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, smax_pred_ty, true >, MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty, true > >, match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, umax_pred_ty, true >, MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty, true > > > m_c_MaxOrMin(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2709

llvm::PatternMatch::m_UnOp
class_match< UnaryOperator > m_UnOp()
Match an arbitrary unary operation and ignore it.
Definition: PatternMatch.h:95

llvm::PatternMatch::m_NUWSub
OverflowingBinaryOp_match< LHS, RHS, Instruction::Sub, OverflowingBinaryOperator::NoUnsignedWrap > m_NUWSub(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1322

llvm::PatternMatch::m_SMax
MaxMin_match< ICmpInst, LHS, RHS, smax_pred_ty > m_SMax(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2218

llvm::PatternMatch::m_APInt
apint_match m_APInt(const APInt *&Res)
Match a ConstantInt or splatted ConstantVector, binding the specified pointer to the contained APInt.
Definition: PatternMatch.h:299

llvm::PatternMatch::m_NSWAddLike
match_combine_or< OverflowingBinaryOp_match< LHS, RHS, Instruction::Add, OverflowingBinaryOperator::NoSignedWrap >, DisjointOr_match< LHS, RHS > > m_NSWAddLike(const LHS &L, const RHS &R)
Match either "add nsw" or "or disjoint".
Definition: PatternMatch.h:1409

llvm::PatternMatch::m_Value
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
Definition: PatternMatch.h:92

llvm::PatternMatch::m_LShr
BinaryOp_match< LHS, RHS, Instruction::LShr > m_LShr(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1230

llvm::PatternMatch::m_Exact
Exact_match< T > m_Exact(const T &SubPattern)
Definition: PatternMatch.h:1542

llvm::PatternMatch::m_FNeg
FNeg_match< OpTy > m_FNeg(const OpTy &X)
Match 'fneg X' as 'fsub -0.0, X'.
Definition: PatternMatch.h:1146

llvm::PatternMatch::m_Shift
BinOpPred_match< LHS, RHS, is_shift_op > m_Shift(const LHS &L, const RHS &R)
Matches shift operations.
Definition: PatternMatch.h:1480

llvm::PatternMatch::m_PosZeroFP
cstfp_pred_ty< is_pos_zero_fp > m_PosZeroFP()
Match a floating-point positive zero.
Definition: PatternMatch.h:773

llvm::PatternMatch::m_Shl
BinaryOp_match< LHS, RHS, Instruction::Shl > m_Shl(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1224

llvm::PatternMatch::m_VecReverse
m_Intrinsic_Ty< Opnd0 >::Ty m_VecReverse(const Opnd0 &Op0)
Definition: PatternMatch.h:2581

llvm::PatternMatch::m_APFloat
apfloat_match m_APFloat(const APFloat *&Res)
Match a ConstantFP or splatted ConstantVector, binding the specified pointer to the contained APFloat...
Definition: PatternMatch.h:316

llvm::PatternMatch::m_LogicalAnd
auto m_LogicalAnd()
Matches L && R where L and R are arbitrary values.
Definition: PatternMatch.h:2915

llvm::PatternMatch::m_MaxOrMin
match_combine_or< match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, smax_pred_ty >, MaxMin_match< ICmpInst, LHS, RHS, smin_pred_ty > >, match_combine_or< MaxMin_match< ICmpInst, LHS, RHS, umax_pred_ty >, MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty > > > m_MaxOrMin(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2247

llvm::PatternMatch::m_FShr
m_Intrinsic_Ty< Opnd0, Opnd1, Opnd2 >::Ty m_FShr(const Opnd0 &Op0, const Opnd1 &Op1, const Opnd2 &Op2)
Definition: PatternMatch.h:2565

llvm::PatternMatch::m_SRem
BinaryOp_match< LHS, RHS, Instruction::SRem > m_SRem(const LHS &L, const RHS &R)
Definition: PatternMatch.h:1194

llvm::PatternMatch::m_Undef
auto m_Undef()
Match an arbitrary undef constant.
Definition: PatternMatch.h:152

llvm::PatternMatch::m_Not
BinaryOp_match< cst_pred_ty< is_all_ones >, ValTy, Instruction::Xor, true > m_Not(const ValTy &V)
Matches a 'Not' as 'xor V, -1' or 'xor -1, V'.
Definition: PatternMatch.h:2667

llvm::PatternMatch::m_BSwap
m_Intrinsic_Ty< Opnd0 >::Ty m_BSwap(const Opnd0 &Op0)
Definition: PatternMatch.h:2531

llvm::PatternMatch::m_SExt
CastInst_match< OpTy, SExtInst > m_SExt(const OpTy &Op)
Matches SExt.
Definition: PatternMatch.h:1977

llvm::PatternMatch::m_Zero
is_zero m_Zero()
Match any null constant or a vector with all elements equal to 0.
Definition: PatternMatch.h:612

llvm::PatternMatch::m_c_Or
BinaryOp_match< LHS, RHS, Instruction::Or, true > m_c_Or(const LHS &L, const RHS &R)
Matches an Or with LHS and RHS in either order.
Definition: PatternMatch.h:2634

llvm::PatternMatch::m_NUWAddLike
match_combine_or< OverflowingBinaryOp_match< LHS, RHS, Instruction::Add, OverflowingBinaryOperator::NoUnsignedWrap >, DisjointOr_match< LHS, RHS > > m_NUWAddLike(const LHS &L, const RHS &R)
Match either "add nuw" or "or disjoint".
Definition: PatternMatch.h:1419

llvm::PatternMatch::m_BitwiseLogic
BinOpPred_match< LHS, RHS, is_bitwiselogic_op > m_BitwiseLogic(const LHS &L, const RHS &R)
Matches bitwise logic operations.
Definition: PatternMatch.h:1502

llvm::PatternMatch::m_FAbs
m_Intrinsic_Ty< Opnd0 >::Ty m_FAbs(const Opnd0 &Op0)
Definition: PatternMatch.h:2536

llvm::PatternMatch::m_c_Mul
BinaryOp_match< LHS, RHS, Instruction::Mul, true > m_c_Mul(const LHS &L, const RHS &R)
Matches a Mul with LHS and RHS in either order.
Definition: PatternMatch.h:2620

llvm::PatternMatch::m_CopySign
m_Intrinsic_Ty< Opnd0, Opnd1 >::Ty m_CopySign(const Opnd0 &Op0, const Opnd1 &Op1)
Definition: PatternMatch.h:2575

llvm::PatternMatch::m_PtrToInt
CastOperator_match< OpTy, Instruction::PtrToInt > m_PtrToInt(const OpTy &Op)
Matches PtrToInt.
Definition: PatternMatch.h:1932

llvm::PatternMatch::m_UMin
MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty > m_UMin(const LHS &L, const RHS &R)
Definition: PatternMatch.h:2236

llvm::PatternMatch::m_CombineOr
match_combine_or< LTy, RTy > m_CombineOr(const LTy &L, const RTy &R)
Combine two pattern matchers matching L || R.
Definition: PatternMatch.h:239

llvm::SyncScope::SingleThread
@ SingleThread
Synchronized with respect to signal handlers executing in the same thread.
Definition: LLVMContext.h:54

llvm::SyncScope::System
@ System
Synchronized with respect to all concurrently executing threads.
Definition: LLVMContext.h:57

llvm::X86::FirstMacroFusionInstKind::AddSub
@ AddSub

llvm::at::getAssignmentMarkers
AssignmentMarkerRange getAssignmentMarkers(DIAssignID *ID)
Return a range of dbg.assign intrinsics which use ID as an operand.
Definition: DebugInfo.cpp:1895

llvm::at::getDVRAssignmentMarkers
SmallVector< DbgVariableRecord * > getDVRAssignmentMarkers(const Instruction *Inst)
Definition: DebugInfo.h:238

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:450

llvm::codeview::EncodedFramePtrReg::BasePtr
@ BasePtr

llvm::dwarf::Index
Index
Definition: Dwarf.h:872

llvm::logicalview::LVAttributeKind::Zero
@ Zero

llvm::numbers::e
constexpr double e
Definition: MathExtras.h:31

llvm::ore::NV
DiagnosticInfoOptimizationBase::Argument NV
Definition: OptimizationRemarkEmitter.h:136

llvm::pdb::PDB_SymType::Caller
@ Caller

llvm::pdb::PDB_SymType::Callee
@ Callee

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::EnableKnowledgeRetention
cl::opt< bool > EnableKnowledgeRetention

llvm::getInverseMinMaxIntrinsic
Intrinsic::ID getInverseMinMaxIntrinsic(Intrinsic::ID MinMaxID)
Definition: ValueTracking.cpp:8484

llvm::Log2_32_Ceil
unsigned Log2_32_Ceil(uint32_t Value)
Return the ceil log base 2 of the specified value, 32 if the value is zero.
Definition: MathExtras.h:337

llvm::Offset
@ Offset
Definition: DWP.cpp:456

llvm::OverflowResult
OverflowResult
Definition: ValueTracking.h:853

llvm::OverflowResult::NeverOverflows
@ NeverOverflows
Never overflows.

llvm::OverflowResult::AlwaysOverflowsHigh
@ AlwaysOverflowsHigh
Always overflows in the direction of signed/unsigned max value.

llvm::OverflowResult::AlwaysOverflowsLow
@ AlwaysOverflowsLow
Always overflows in the direction of signed/unsigned min value.

llvm::OverflowResult::MayOverflow
@ MayOverflow
May or may not overflow.

llvm::for_each
UnaryFunction for_each(R &&Range, UnaryFunction F)
Provide wrappers to std::for_each which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1715

llvm::simplifyFMulInst
Value * simplifyFMulInst(Value *LHS, Value *RHS, FastMathFlags FMF, const SimplifyQuery &Q, fp::ExceptionBehavior ExBehavior=fp::ebIgnore, RoundingMode Rounding=RoundingMode::NearestTiesToEven)
Given operands for an FMul, fold the result or return null.
Definition: InstructionSimplify.cpp:5813

llvm::isValidAssumeForContext
bool isValidAssumeForContext(const Instruction *I, const Instruction *CxtI, const DominatorTree *DT=nullptr, bool AllowEphemerals=false)
Return true if it is valid to use the assumptions provided by an assume intrinsic,...
Definition: ValueTracking.cpp:487

llvm::possiblyDemandedEltsInMask
APInt possiblyDemandedEltsInMask(Value *Mask)
Given a mask vector of the form <Y x i1>, return an APInt (of bitwidth Y) for each lane which may be ...
Definition: VectorUtils.cpp:1047

llvm::simplifyRetainedKnowledge
RetainedKnowledge simplifyRetainedKnowledge(AssumeInst *Assume, RetainedKnowledge RK, AssumptionCache *AC, DominatorTree *DT)
Canonicalize the RetainedKnowledge RK.
Definition: AssumeBundleBuilder.cpp:318

llvm::isRemovableAlloc
bool isRemovableAlloc(const CallBase *V, const TargetLibraryInfo *TLI)
Return true if this is a call to an allocation function that does not have side effects that we are r...
Definition: MemoryBuiltins.cpp:342

llvm::lowerObjectSizeCall
Value * lowerObjectSizeCall(IntrinsicInst *ObjectSize, const DataLayout &DL, const TargetLibraryInfo *TLI, bool MustSucceed)
Try to turn a call to @llvm.objectsize into an integer value of the given Type.
Definition: MemoryBuiltins.cpp:603

llvm::getAllocAlignment
Value * getAllocAlignment(const CallBase *V, const TargetLibraryInfo *TLI)
Gets the alignment argument for an aligned_alloc-like function, using either built-in knowledge based...
Definition: MemoryBuiltins.cpp:353

llvm::maximum
LLVM_READONLY APFloat maximum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 maximum semantics.
Definition: APFloat.h:1436

llvm::getUnderlyingObject
const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=6)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
Definition: ValueTracking.cpp:6312

llvm::simplifyCall
Value * simplifyCall(CallBase *Call, Value *Callee, ArrayRef< Value * > Args, const SimplifyQuery &Q)
Given a callsite, callee, and arguments, fold the result or return null.
Definition: InstructionSimplify.cpp:6903

llvm::ConstantFoldCompareInstOperands
Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
Definition: ConstantFolding.cpp:1190

llvm::isPowerOf2_64
constexpr bool isPowerOf2_64(uint64_t Value)
Return true if the argument is a power of two > 0 (64 bit edition.)
Definition: MathExtras.h:280

llvm::isAssumeWithEmptyBundle
bool isAssumeWithEmptyBundle(const AssumeInst &Assume)
Return true iff the operand bundles of the provided llvm.assume don't contain any valuable informat...
Definition: AssumeBundleQueries.cpp:128

llvm::getSplatValue
Value * getSplatValue(const Value *V)
Get splat value if the input is a splat vector or return nullptr.
Definition: VectorUtils.cpp:250

llvm::getKnowledgeFromBundle
RetainedKnowledge getKnowledgeFromBundle(AssumeInst &Assume, const CallBase::BundleOpInfo &BOI)
This extracts the Knowledge from an element of an operand bundle.
Definition: AssumeBundleQueries.cpp:99

llvm::getKnownAlignment
Align getKnownAlignment(Value *V, const DataLayout &DL, const Instruction *CxtI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr)
Try to infer an alignment for the specified pointer.
Definition: Local.h:242

llvm::isSplatValue
bool isSplatValue(const Value *V, int Index=-1, unsigned Depth=0)
Return true if each element of the vector value V is poisoned or equal to every other non-poisoned el...
Definition: VectorUtils.cpp:265

llvm::maxnum
LLVM_READONLY APFloat maxnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2019 maximumNumber semantics.
Definition: APFloat.h:1410

llvm::fneg
FPClassTest fneg(FPClassTest Mask)
Return the test mask which returns true if the value's sign bit is flipped.
Definition: FloatingPointMode.cpp:14

llvm::SelectPatternFlavor
SelectPatternFlavor
Specific patterns of select instructions we can match.
Definition: ValueTracking.h:1060

llvm::SPF_ABS
@ SPF_ABS
Absolute value.
Definition: ValueTracking.h:1068

llvm::SPF_NABS
@ SPF_NABS
Negated absolute value.
Definition: ValueTracking.h:1069

llvm::isPowerOf2_32
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition: MathExtras.h:275

llvm::isModSet
bool isModSet(const ModRefInfo MRI)
Definition: ModRef.h:48

llvm::ComplexDeinterleavingOperation::Splat
@ Splat

llvm::FPClassTest
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
Definition: FloatingPointMode.h:239

llvm::fcInf
@ fcInf
Definition: FloatingPointMode.h:254

llvm::fcNegSubnormal
@ fcNegSubnormal
Definition: FloatingPointMode.h:246

llvm::fcPosNormal
@ fcPosNormal
Definition: FloatingPointMode.h:250

llvm::fcNegZero
@ fcNegZero
Definition: FloatingPointMode.h:247

llvm::fcNegInf
@ fcNegInf
Definition: FloatingPointMode.h:244

llvm::fcSubnormal
@ fcSubnormal
Definition: FloatingPointMode.h:256

llvm::fcNone
@ fcNone
Definition: FloatingPointMode.h:240

llvm::fcPositive
@ fcPositive
Definition: FloatingPointMode.h:261

llvm::fcPosZero
@ fcPosZero
Definition: FloatingPointMode.h:248

llvm::fcNegNormal
@ fcNegNormal
Definition: FloatingPointMode.h:245

llvm::fcZero
@ fcZero
Definition: FloatingPointMode.h:257

llvm::fcNegative
@ fcNegative
Definition: FloatingPointMode.h:262

llvm::fcAllFlags
@ fcAllFlags
Definition: FloatingPointMode.h:264

llvm::fcPosSubnormal
@ fcPosSubnormal
Definition: FloatingPointMode.h:249

llvm::fcPosInf
@ fcPosInf
Definition: FloatingPointMode.h:251

llvm::fcNan
@ fcNan
Definition: FloatingPointMode.h:253

llvm::matchSelectPattern
SelectPatternResult matchSelectPattern(Value *V, Value *&LHS, Value *&RHS, Instruction::CastOps *CastOp=nullptr, unsigned Depth=0)
Pattern match integer [SU]MIN, [SU]MAX and ABS idioms, returning the kind and providing the out param...
Definition: ValueTracking.cpp:8406

llvm::NullPointerIsDefined
bool NullPointerIsDefined(const Function *F, unsigned AS=0)
Check whether null pointer dereferencing is considered undefined behavior for a given function or an ...
Definition: Function.cpp:2060

llvm::dbgs
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition: Debug.cpp:163

llvm::none_of
bool none_of(R &&Range, UnaryPredicate P)
Provide wrappers to std::none_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1736

llvm::isAtLeastOrStrongerThan
bool isAtLeastOrStrongerThan(AtomicOrdering AO, AtomicOrdering Other)
Definition: AtomicOrdering.h:106

llvm::buildAssumeFromKnowledge
AssumeInst * buildAssumeFromKnowledge(ArrayRef< RetainedKnowledge > Knowledge, Instruction *CtxI, AssumptionCache *AC=nullptr, DominatorTree *DT=nullptr)
Build and return a new assume created from the provided knowledge if the knowledge in the assume is f...
Definition: AssumeBundleBuilder.cpp:309

llvm::inverse_fabs
FPClassTest inverse_fabs(FPClassTest Mask)
Return the test mask which returns true after fabs is applied to the value.
Definition: FloatingPointMode.cpp:35

llvm::maskIsAllOneOrUndef
bool maskIsAllOneOrUndef(Value *Mask)
Given a mask vector of i1, return true if all of the elements of this predicate mask are known to be ...
Definition: VectorUtils.cpp:994

llvm::ConstantFoldBinaryOpOperands
Constant * ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL)
Attempt to constant fold a binary operation with the specified operands.
Definition: ConstantFolding.cpp:1302

llvm::isKnownNonZero
bool isKnownNonZero(const Value *V, const SimplifyQuery &Q, unsigned Depth=0)
Return true if the given value is known to be non-zero when defined.
Definition: ValueTracking.cpp:3122

llvm::PoisonMaskElem
constexpr int PoisonMaskElem
Definition: Instructions.h:2159

llvm::AtomicOrdering::Unordered
@ Unordered

llvm::ModRefInfo::Mod
@ Mod
The access may modify the value stored in memory.

llvm::simplifyFMAFMul
Value * simplifyFMAFMul(Value *LHS, Value *RHS, FastMathFlags FMF, const SimplifyQuery &Q, fp::ExceptionBehavior ExBehavior=fp::ebIgnore, RoundingMode Rounding=RoundingMode::NearestTiesToEven)
Given operands for the multiplication of a FMA, fold the result or return null.
Definition: InstructionSimplify.cpp:5821

llvm::IRMemLocation::Other
@ Other
Any other memory.

llvm::simplifyConstrainedFPCall
Value * simplifyConstrainedFPCall(CallBase *Call, const SimplifyQuery &Q)
Given a constrained FP intrinsic call, tries to compute its simplified version.
Definition: InstructionSimplify.cpp:6929

llvm::minnum
LLVM_READONLY APFloat minnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2019 minimumNumber semantics.
Definition: APFloat.h:1396

llvm::RecurKind::Mul
@ Mul
Product of integers.

llvm::RecurKind::None
@ None
Not a recurrence.

llvm::RecurKind::Add
@ Add
Sum of integers.

llvm::RecurKind::FAdd
@ FAdd
Sum of floats.

llvm::computeConstantRangeIncludingKnownBits
ConstantRange computeConstantRangeIncludingKnownBits(const WithCache< const Value * > &V, bool ForSigned, const SimplifyQuery &SQ)
Combine constant ranges from computeConstantRange() and computeKnownBits().
Definition: ValueTracking.cpp:6688

llvm::computeKnownBits
void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, unsigned Depth=0, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
Definition: ValueTracking.cpp:165

llvm::MinAlign
constexpr uint64_t MinAlign(uint64_t A, uint64_t B)
A and B are either alignments or offsets.
Definition: MathExtras.h:349

llvm::getFreedOperand
Value * getFreedOperand(const CallBase *CB, const TargetLibraryInfo *TLI)
If this is a call to a free function, return the freed operand.
Definition: MemoryBuiltins.cpp:558

llvm::isSafeToSpeculativelyExecute
bool isSafeToSpeculativelyExecute(const Instruction *I, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr)
Return true if the instruction does not have any effects besides calculating the result and does not ...
Definition: ValueTracking.cpp:6546

llvm::BitWidth
constexpr unsigned BitWidth
Definition: BitmaskEnum.h:191

llvm::isDereferenceablePointer
bool isDereferenceablePointer(const Value *V, Type *Ty, const DataLayout &DL, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr)
Return true if this is always a dereferenceable pointer.
Definition: Loads.cpp:221

llvm::is_contained
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
Definition: STLExtras.h:1879

llvm::getAllocSize
std::optional< APInt > getAllocSize(const CallBase *CB, const TargetLibraryInfo *TLI, function_ref< const Value *(const Value *)> Mapper=[](const Value *V) { return V;})
Return the size of the requested allocation.
Definition: MemoryBuiltins.cpp:379

llvm::computeKnownFPSignBit
std::optional< bool > computeKnownFPSignBit(const Value *V, unsigned Depth, const SimplifyQuery &SQ)
Return false if we can prove that the specified FP value's sign bit is 0.
Definition: ValueTracking.h:581

llvm::Log2
unsigned Log2(Align A)
Returns the log2 of the alignment.
Definition: Alignment.h:208

llvm::maskContainsAllOneOrUndef
bool maskContainsAllOneOrUndef(Value *Mask)
Given a mask vector of i1, return true if any of the elements of this predicate mask are known to be ...
Definition: VectorUtils.cpp:1020

llvm::alignDown
uint64_t alignDown(uint64_t Value, uint64_t Align, uint64_t Skew=0)
Returns the largest uint64_t that is less than or equal to Value and is congruent to Skew mod Align.
Definition: MathExtras.h:439

llvm::isImpliedByDomCondition
std::optional< bool > isImpliedByDomCondition(const Value *Cond, const Instruction *ContextI, const DataLayout &DL)
Return the boolean condition value in the context of the given instruction if it is known based on do...
Definition: ValueTracking.cpp:8981

llvm::minimum
LLVM_READONLY APFloat minimum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 minimum semantics.
Definition: APFloat.h:1423

llvm::isKnownNegation
bool isKnownNegation(const Value *X, const Value *Y, bool NeedNSW=false, bool AllowPoison=true)
Return true if the two given values are negations of each other.
Definition: ValueTracking.cpp:8074

llvm::Data
@ Data
Definition: SIMachineScheduler.h:55

llvm::isKnownNonNegative
bool isKnownNonNegative(const Value *V, const SimplifyQuery &SQ, unsigned Depth=0)
Returns true if the given value is known to be non-negative.
Definition: ValueTracking.cpp:284

std::swap
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition: BitVector.h:860

raw_ostream.h

NC
#define NC
Definition: regutils.h:42

llvm::AAMDNodes
A collection of metadata nodes that might be associated with a memory access used by the alias-analys...
Definition: Metadata.h:760

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::BitTracker
Definition: BitTracker.h:35

llvm::DenormalMode::IEEE
@ IEEE
IEEE-754 denormal numbers preserved.
Definition: FloatingPointMode.h:77

llvm::KnownBits
Definition: KnownBits.h:23

llvm::KnownBits::isNonNegative
bool isNonNegative() const
Returns true if this value is known to be non-negative.
Definition: KnownBits.h:104

llvm::KnownBits::countMinTrailingZeros
unsigned countMinTrailingZeros() const
Returns the minimum number of trailing zero bits.
Definition: KnownBits.h:238

llvm::KnownBits::countMaxTrailingZeros
unsigned countMaxTrailingZeros() const
Returns the maximum number of trailing zero bits possible.
Definition: KnownBits.h:270

llvm::KnownBits::countMaxPopulation
unsigned countMaxPopulation() const
Returns the maximum number of bits that could be one.
Definition: KnownBits.h:285

llvm::KnownBits::getBitWidth
unsigned getBitWidth() const
Get the bit width of this value.
Definition: KnownBits.h:40

llvm::KnownBits::isNonZero
bool isNonZero() const
Returns true if this value is known to be non-zero.
Definition: KnownBits.h:107

llvm::KnownBits::countMinLeadingZeros
unsigned countMinLeadingZeros() const
Returns the minimum number of leading zero bits.
Definition: KnownBits.h:244

llvm::KnownBits::isNegative
bool isNegative() const
Returns true if this value is known to be negative.
Definition: KnownBits.h:101

llvm::KnownBits::countMaxLeadingZeros
unsigned countMaxLeadingZeros() const
Returns the maximum number of leading zero bits possible.
Definition: KnownBits.h:276

llvm::KnownBits::One
APInt One
Definition: KnownBits.h:25

llvm::KnownBits::Zero
APInt Zero
Definition: KnownBits.h:24

llvm::KnownBits::countMinPopulation
unsigned countMinPopulation() const
Returns the number of bits known to be one.
Definition: KnownBits.h:282

llvm::KnownBits::isAllOnes
bool isAllOnes() const
Returns true if value is all one bits.
Definition: KnownBits.h:83

llvm::KnownFPClass
Definition: ValueTracking.h:249

llvm::KnownFPClass::KnownFPClasses
FPClassTest KnownFPClasses
Floating-point classes the value could be one of.
Definition: ValueTracking.h:251

llvm::MaybeAlign
This struct is a compact representation of a valid (power of two) or undefined (0) alignment.
Definition: Alignment.h:117

llvm::MaybeAlign::valueOrOne
Align valueOrOne() const
For convenience, returns a valid alignment or 1 if undefined.
Definition: Alignment.h:141

llvm::MinMax
Definition: AssumeBundleQueries.h:71

llvm::OperandBundleUse
A lightweight accessor for an operand bundle meant to be passed around by value.
Definition: InstrTypes.h:1389

llvm::OperandBundleUse::getTagName
StringRef getTagName() const
Return the tag of this operand bundle as a string.
Definition: InstrTypes.h:1408

llvm::OperandBundleUse::Inputs
ArrayRef< Use > Inputs
Definition: InstrTypes.h:1390

llvm::PatternMatch::m_Mask
Definition: PatternMatch.h:1735

llvm::PatternMatch::m_SpecificMask
Definition: PatternMatch.h:1750

llvm::RetainedKnowledge
Represents one piece of information held inside an operand bundle of an llvm.assume.
Definition: AssumeBundleQueries.h:100

llvm::RetainedKnowledge::AttrKind
Attribute::AttrKind AttrKind
Definition: AssumeBundleQueries.h:101

llvm::RetainedKnowledge::ArgValue
uint64_t ArgValue
Definition: AssumeBundleQueries.h:102

llvm::RetainedKnowledge::WasOn
Value * WasOn
Definition: AssumeBundleQueries.h:103

llvm::SelectPatternResult::Flavor
SelectPatternFlavor Flavor
Definition: ValueTracking.h:1084

llvm::SimplifyQuery
Definition: SimplifyQuery.h:60

llvm::SimplifyQuery::getWithInstruction
SimplifyQuery getWithInstruction(const Instruction *I) const
Definition: SimplifyQuery.h:96

llvm::UnderlyingObject
Definition: ScheduleDAGInstrs.h:110

llvm::cl::desc
Definition: CommandLine.h:416