File: src/gnu/usr.bin/clang/libLLVM/../../../llvm/llvm/lib/Analysis/VectorUtils.cpp
Warning: line 1180, column 11: Called C++ object pointer is null
1 | //===----------- VectorUtils.cpp - Vectorizer utility functions -----------===// | ||||||||||
2 | // | ||||||||||
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | ||||||||||
4 | // See https://llvm.org/LICENSE.txt for license information. | ||||||||||
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | ||||||||||
6 | // | ||||||||||
7 | //===----------------------------------------------------------------------===// | ||||||||||
8 | // | ||||||||||
9 | // This file defines vectorizer utilities. | ||||||||||
10 | // | ||||||||||
11 | //===----------------------------------------------------------------------===// | ||||||||||
12 | |||||||||||
13 | #include "llvm/Analysis/VectorUtils.h" | ||||||||||
14 | #include "llvm/ADT/EquivalenceClasses.h" | ||||||||||
15 | #include "llvm/Analysis/DemandedBits.h" | ||||||||||
16 | #include "llvm/Analysis/LoopInfo.h" | ||||||||||
17 | #include "llvm/Analysis/LoopIterator.h" | ||||||||||
18 | #include "llvm/Analysis/ScalarEvolution.h" | ||||||||||
19 | #include "llvm/Analysis/ScalarEvolutionExpressions.h" | ||||||||||
20 | #include "llvm/Analysis/TargetTransformInfo.h" | ||||||||||
21 | #include "llvm/Analysis/ValueTracking.h" | ||||||||||
22 | #include "llvm/IR/Constants.h" | ||||||||||
23 | #include "llvm/IR/GetElementPtrTypeIterator.h" | ||||||||||
24 | #include "llvm/IR/IRBuilder.h" | ||||||||||
25 | #include "llvm/IR/PatternMatch.h" | ||||||||||
26 | #include "llvm/IR/Value.h" | ||||||||||
27 | #include "llvm/Support/CommandLine.h" | ||||||||||
28 | |||||||||||
29 | #define DEBUG_TYPE "vectorutils" | ||||||||||
30 | |||||||||||
31 | using namespace llvm; | ||||||||||
32 | using namespace llvm::PatternMatch; | ||||||||||
33 | |||||||||||
34 | /// Maximum factor for an interleaved memory access. | ||||||||||
35 | static cl::opt<unsigned> MaxInterleaveGroupFactor( | ||||||||||
36 | "max-interleave-group-factor", cl::Hidden, | ||||||||||
37 | cl::desc("Maximum factor for an interleaved access group (default = 8)"), | ||||||||||
38 | cl::init(8)); | ||||||||||
39 | |||||||||||
40 | /// Return true if all of the intrinsic's arguments and return type are scalars | ||||||||||
41 | /// for the scalar form of the intrinsic, and vectors for the vector form of the | ||||||||||
42 | /// intrinsic (except operands that are marked as always being scalar by | ||||||||||
43 | /// hasVectorInstrinsicScalarOpd). | ||||||||||
44 | bool llvm::isTriviallyVectorizable(Intrinsic::ID ID) { | ||||||||||
45 | switch (ID) { | ||||||||||
46 | case Intrinsic::abs: // Begin integer bit-manipulation. | ||||||||||
47 | case Intrinsic::bswap: | ||||||||||
48 | case Intrinsic::bitreverse: | ||||||||||
49 | case Intrinsic::ctpop: | ||||||||||
50 | case Intrinsic::ctlz: | ||||||||||
51 | case Intrinsic::cttz: | ||||||||||
52 | case Intrinsic::fshl: | ||||||||||
53 | case Intrinsic::fshr: | ||||||||||
54 | case Intrinsic::smax: | ||||||||||
55 | case Intrinsic::smin: | ||||||||||
56 | case Intrinsic::umax: | ||||||||||
57 | case Intrinsic::umin: | ||||||||||
58 | case Intrinsic::sadd_sat: | ||||||||||
59 | case Intrinsic::ssub_sat: | ||||||||||
60 | case Intrinsic::uadd_sat: | ||||||||||
61 | case Intrinsic::usub_sat: | ||||||||||
62 | case Intrinsic::smul_fix: | ||||||||||
63 | case Intrinsic::smul_fix_sat: | ||||||||||
64 | case Intrinsic::umul_fix: | ||||||||||
65 | case Intrinsic::umul_fix_sat: | ||||||||||
66 | case Intrinsic::sqrt: // Begin floating-point. | ||||||||||
67 | case Intrinsic::sin: | ||||||||||
68 | case Intrinsic::cos: | ||||||||||
69 | case Intrinsic::exp: | ||||||||||
70 | case Intrinsic::exp2: | ||||||||||
71 | case Intrinsic::log: | ||||||||||
72 | case Intrinsic::log10: | ||||||||||
73 | case Intrinsic::log2: | ||||||||||
74 | case Intrinsic::fabs: | ||||||||||
75 | case Intrinsic::minnum: | ||||||||||
76 | case Intrinsic::maxnum: | ||||||||||
77 | case Intrinsic::minimum: | ||||||||||
78 | case Intrinsic::maximum: | ||||||||||
79 | case Intrinsic::copysign: | ||||||||||
80 | case Intrinsic::floor: | ||||||||||
81 | case Intrinsic::ceil: | ||||||||||
82 | case Intrinsic::trunc: | ||||||||||
83 | case Intrinsic::rint: | ||||||||||
84 | case Intrinsic::nearbyint: | ||||||||||
85 | case Intrinsic::round: | ||||||||||
86 | case Intrinsic::roundeven: | ||||||||||
87 | case Intrinsic::pow: | ||||||||||
88 | case Intrinsic::fma: | ||||||||||
89 | case Intrinsic::fmuladd: | ||||||||||
90 | case Intrinsic::powi: | ||||||||||
91 | case Intrinsic::canonicalize: | ||||||||||
92 | return true; | ||||||||||
93 | default: | ||||||||||
94 | return false; | ||||||||||
95 | } | ||||||||||
96 | } | ||||||||||
97 | |||||||||||
98 | /// Identifies if the vector form of the intrinsic has a scalar operand. | ||||||||||
99 | bool llvm::hasVectorInstrinsicScalarOpd(Intrinsic::ID ID, | ||||||||||
100 | unsigned ScalarOpdIdx) { | ||||||||||
101 | switch (ID) { | ||||||||||
102 | case Intrinsic::abs: | ||||||||||
103 | case Intrinsic::ctlz: | ||||||||||
104 | case Intrinsic::cttz: | ||||||||||
105 | case Intrinsic::powi: | ||||||||||
106 | return (ScalarOpdIdx == 1); | ||||||||||
107 | case Intrinsic::smul_fix: | ||||||||||
108 | case Intrinsic::smul_fix_sat: | ||||||||||
109 | case Intrinsic::umul_fix: | ||||||||||
110 | case Intrinsic::umul_fix_sat: | ||||||||||
111 | return (ScalarOpdIdx == 2); | ||||||||||
112 | default: | ||||||||||
113 | return false; | ||||||||||
114 | } | ||||||||||
115 | } | ||||||||||
116 | |||||||||||
117 | bool llvm::hasVectorInstrinsicOverloadedScalarOpd(Intrinsic::ID ID, | ||||||||||
118 | unsigned ScalarOpdIdx) { | ||||||||||
119 | switch (ID) { | ||||||||||
120 | case Intrinsic::powi: | ||||||||||
121 | return (ScalarOpdIdx == 1); | ||||||||||
122 | default: | ||||||||||
123 | return false; | ||||||||||
124 | } | ||||||||||
125 | } | ||||||||||
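// Illustrative example: for llvm.powi the exponent operand (index 1) stays scalar
// in the vector form, so hasVectorInstrinsicScalarOpd(Intrinsic::powi, 1) and
// hasVectorInstrinsicOverloadedScalarOpd(Intrinsic::powi, 1) both return true,
// while operand 0 (the base) is widened to a vector.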
126 | |||||||||||
127 | /// Returns intrinsic ID for call. | ||||||||||
128 | /// For the given call instruction, find the corresponding intrinsic and | ||||||||||
129 | /// return its ID; if no mapping exists, return not_intrinsic. | ||||||||||
130 | Intrinsic::ID llvm::getVectorIntrinsicIDForCall(const CallInst *CI, | ||||||||||
131 | const TargetLibraryInfo *TLI) { | ||||||||||
132 | Intrinsic::ID ID = getIntrinsicForCallSite(*CI, TLI); | ||||||||||
133 | if (ID == Intrinsic::not_intrinsic) | ||||||||||
134 | return Intrinsic::not_intrinsic; | ||||||||||
135 | |||||||||||
136 | if (isTriviallyVectorizable(ID) || ID == Intrinsic::lifetime_start || | ||||||||||
137 | ID == Intrinsic::lifetime_end || ID == Intrinsic::assume || | ||||||||||
138 | ID == Intrinsic::experimental_noalias_scope_decl || | ||||||||||
139 | ID == Intrinsic::sideeffect || ID == Intrinsic::pseudoprobe) | ||||||||||
140 | return ID; | ||||||||||
141 | return Intrinsic::not_intrinsic; | ||||||||||
142 | } | ||||||||||
143 | |||||||||||
144 | /// Find the operand of the GEP that should be checked for consecutive | ||||||||||
145 | /// stores. This ignores trailing indices that have no effect on the final | ||||||||||
146 | /// pointer. | ||||||||||
147 | unsigned llvm::getGEPInductionOperand(const GetElementPtrInst *Gep) { | ||||||||||
148 | const DataLayout &DL = Gep->getModule()->getDataLayout(); | ||||||||||
149 | unsigned LastOperand = Gep->getNumOperands() - 1; | ||||||||||
150 | TypeSize GEPAllocSize = DL.getTypeAllocSize(Gep->getResultElementType()); | ||||||||||
151 | |||||||||||
152 | // Walk backwards and try to peel off zeros. | ||||||||||
153 | while (LastOperand > 1 && match(Gep->getOperand(LastOperand), m_Zero())) { | ||||||||||
154 | // Find the type we're currently indexing into. | ||||||||||
155 | gep_type_iterator GEPTI = gep_type_begin(Gep); | ||||||||||
156 | std::advance(GEPTI, LastOperand - 2); | ||||||||||
157 | |||||||||||
158 | // If it's a type with the same allocation size as the result of the GEP we | ||||||||||
159 | // can peel off the zero index. | ||||||||||
160 | if (DL.getTypeAllocSize(GEPTI.getIndexedType()) != GEPAllocSize) | ||||||||||
161 | break; | ||||||||||
162 | --LastOperand; | ||||||||||
163 | } | ||||||||||
164 | |||||||||||
165 | return LastOperand; | ||||||||||
166 | } | ||||||||||
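// Illustrative example (hypothetical IR): for
//   %p = getelementptr { double }, { double }* %A, i64 %i, i32 0
// the trailing zero indexes a single-element struct whose alloc size matches that
// of the result element type (double), so it is peeled off and operand 1 (%i) is
// returned as the induction operand; for
//   %q = getelementptr [4 x i32], [4 x i32]* %B, i64 %i, i64 0
// the array's alloc size (16) differs from the element size (4), so the zero is
// kept and operand 2 is returned.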
167 | |||||||||||
168 | /// If the argument is a GEP, then returns the operand identified by | ||||||||||
169 | /// getGEPInductionOperand. However, if there is some other non-loop-invariant | ||||||||||
170 | /// operand, it returns that instead. | ||||||||||
171 | Value *llvm::stripGetElementPtr(Value *Ptr, ScalarEvolution *SE, Loop *Lp) { | ||||||||||
172 | GetElementPtrInst *GEP = dyn_cast<GetElementPtrInst>(Ptr); | ||||||||||
173 | if (!GEP) | ||||||||||
174 | return Ptr; | ||||||||||
175 | |||||||||||
176 | unsigned InductionOperand = getGEPInductionOperand(GEP); | ||||||||||
177 | |||||||||||
178 | // Check that all of the gep indices are uniform except for our induction | ||||||||||
179 | // operand. | ||||||||||
180 | for (unsigned i = 0, e = GEP->getNumOperands(); i != e; ++i) | ||||||||||
181 | if (i != InductionOperand && | ||||||||||
182 | !SE->isLoopInvariant(SE->getSCEV(GEP->getOperand(i)), Lp)) | ||||||||||
183 | return Ptr; | ||||||||||
184 | return GEP->getOperand(InductionOperand); | ||||||||||
185 | } | ||||||||||
186 | |||||||||||
187 | /// If a value has only one user that is a CastInst, return it. | ||||||||||
188 | Value *llvm::getUniqueCastUse(Value *Ptr, Loop *Lp, Type *Ty) { | ||||||||||
189 | Value *UniqueCast = nullptr; | ||||||||||
190 | for (User *U : Ptr->users()) { | ||||||||||
191 | CastInst *CI = dyn_cast<CastInst>(U); | ||||||||||
192 | if (CI && CI->getType() == Ty) { | ||||||||||
193 | if (!UniqueCast) | ||||||||||
194 | UniqueCast = CI; | ||||||||||
195 | else | ||||||||||
196 | return nullptr; | ||||||||||
197 | } | ||||||||||
198 | } | ||||||||||
199 | return UniqueCast; | ||||||||||
200 | } | ||||||||||
201 | |||||||||||
202 | /// Get the stride of a pointer access in a loop. Looks for symbolic | ||||||||||
203 | /// strides "a[i*stride]". Returns the symbolic stride, or null otherwise. | ||||||||||
204 | Value *llvm::getStrideFromPointer(Value *Ptr, ScalarEvolution *SE, Loop *Lp) { | ||||||||||
205 | auto *PtrTy = dyn_cast<PointerType>(Ptr->getType()); | ||||||||||
206 | if (!PtrTy || PtrTy->isAggregateType()) | ||||||||||
207 | return nullptr; | ||||||||||
208 | |||||||||||
209 | // Try to strip away a GEP instruction to make the pointer (actually, the | ||||||||||
210 | // index at this point) easier to analyze. If OrigPtr is equal to Ptr we are | ||||||||||
211 | // analyzing the pointer; otherwise, we are analyzing the index. | ||||||||||
212 | Value *OrigPtr = Ptr; | ||||||||||
213 | |||||||||||
214 | // The size of the pointer access. | ||||||||||
215 | int64_t PtrAccessSize = 1; | ||||||||||
216 | |||||||||||
217 | Ptr = stripGetElementPtr(Ptr, SE, Lp); | ||||||||||
218 | const SCEV *V = SE->getSCEV(Ptr); | ||||||||||
219 | |||||||||||
220 | if (Ptr != OrigPtr) | ||||||||||
221 | // Strip off casts. | ||||||||||
222 | while (const SCEVIntegralCastExpr *C = dyn_cast<SCEVIntegralCastExpr>(V)) | ||||||||||
223 | V = C->getOperand(); | ||||||||||
224 | |||||||||||
225 | const SCEVAddRecExpr *S = dyn_cast<SCEVAddRecExpr>(V); | ||||||||||
226 | if (!S) | ||||||||||
227 | return nullptr; | ||||||||||
228 | |||||||||||
229 | V = S->getStepRecurrence(*SE); | ||||||||||
230 | if (!V) | ||||||||||
231 | return nullptr; | ||||||||||
232 | |||||||||||
233 | // Strip off the size of access multiplication if we are still analyzing the | ||||||||||
234 | // pointer. | ||||||||||
235 | if (OrigPtr == Ptr) { | ||||||||||
236 | if (const SCEVMulExpr *M = dyn_cast<SCEVMulExpr>(V)) { | ||||||||||
237 | if (M->getOperand(0)->getSCEVType() != scConstant) | ||||||||||
238 | return nullptr; | ||||||||||
239 | |||||||||||
240 | const APInt &APStepVal = cast<SCEVConstant>(M->getOperand(0))->getAPInt(); | ||||||||||
241 | |||||||||||
242 | // Huge step value - give up. | ||||||||||
243 | if (APStepVal.getBitWidth() > 64) | ||||||||||
244 | return nullptr; | ||||||||||
245 | |||||||||||
246 | int64_t StepVal = APStepVal.getSExtValue(); | ||||||||||
247 | if (PtrAccessSize != StepVal) | ||||||||||
248 | return nullptr; | ||||||||||
249 | V = M->getOperand(1); | ||||||||||
250 | } | ||||||||||
251 | } | ||||||||||
252 | |||||||||||
253 | // Strip off casts. | ||||||||||
254 | Type *StripedOffRecurrenceCast = nullptr; | ||||||||||
255 | if (const SCEVIntegralCastExpr *C = dyn_cast<SCEVIntegralCastExpr>(V)) { | ||||||||||
256 | StripedOffRecurrenceCast = C->getType(); | ||||||||||
257 | V = C->getOperand(); | ||||||||||
258 | } | ||||||||||
259 | |||||||||||
260 | // Look for the loop invariant symbolic value. | ||||||||||
261 | const SCEVUnknown *U = dyn_cast<SCEVUnknown>(V); | ||||||||||
262 | if (!U) | ||||||||||
263 | return nullptr; | ||||||||||
264 | |||||||||||
265 | Value *Stride = U->getValue(); | ||||||||||
266 | if (!Lp->isLoopInvariant(Stride)) | ||||||||||
267 | return nullptr; | ||||||||||
268 | |||||||||||
269 | // If we have stripped off the recurrence cast we have to make sure that we | ||||||||||
270 | // return the value that is used in this loop so that we can replace it later. | ||||||||||
271 | if (StripedOffRecurrenceCast) | ||||||||||
272 | Stride = getUniqueCastUse(Stride, Lp, StripedOffRecurrenceCast); | ||||||||||
273 | |||||||||||
274 | return Stride; | ||||||||||
275 | } | ||||||||||
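// Illustrative example (hypothetical IR; %A, %stride, %mul are placeholder names):
// for %p = getelementptr double, double* %A, i64 %mul with %mul = i * %stride,
// stripGetElementPtr returns the index %mul; its SCEV is an add recurrence whose
// step is the loop-invariant SCEVUnknown %stride, so %stride (or its unique
// in-loop cast, if one was stripped) is returned as the symbolic stride.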
276 | |||||||||||
277 | /// Given a vector and an element number, see if the scalar value is | ||||||||||
278 | /// already around as a register, for example if it were inserted then extracted | ||||||||||
279 | /// from the vector. | ||||||||||
280 | Value *llvm::findScalarElement(Value *V, unsigned EltNo) { | ||||||||||
281 | assert(V->getType()->isVectorTy() && "Not looking at a vector?"); | ||||||||||
282 | VectorType *VTy = cast<VectorType>(V->getType()); | ||||||||||
283 | // For a fixed-length vector, return undef for an out-of-range access. | ||||||||||
284 | if (auto *FVTy = dyn_cast<FixedVectorType>(VTy)) { | ||||||||||
285 | unsigned Width = FVTy->getNumElements(); | ||||||||||
286 | if (EltNo >= Width) | ||||||||||
287 | return UndefValue::get(FVTy->getElementType()); | ||||||||||
288 | } | ||||||||||
289 | |||||||||||
290 | if (Constant *C = dyn_cast<Constant>(V)) | ||||||||||
291 | return C->getAggregateElement(EltNo); | ||||||||||
292 | |||||||||||
293 | if (InsertElementInst *III = dyn_cast<InsertElementInst>(V)) { | ||||||||||
294 | // If this is an insert to a variable element, we don't know what it is. | ||||||||||
295 | if (!isa<ConstantInt>(III->getOperand(2))) | ||||||||||
296 | return nullptr; | ||||||||||
297 | unsigned IIElt = cast<ConstantInt>(III->getOperand(2))->getZExtValue(); | ||||||||||
298 | |||||||||||
299 | // If this is an insert to the element we are looking for, return the | ||||||||||
300 | // inserted value. | ||||||||||
301 | if (EltNo == IIElt) | ||||||||||
302 | return III->getOperand(1); | ||||||||||
303 | |||||||||||
304 | // Guard against infinite loop on malformed, unreachable IR. | ||||||||||
305 | if (III == III->getOperand(0)) | ||||||||||
306 | return nullptr; | ||||||||||
307 | |||||||||||
308 | // Otherwise, the insertelement doesn't modify the value, recurse on its | ||||||||||
309 | // vector input. | ||||||||||
310 | return findScalarElement(III->getOperand(0), EltNo); | ||||||||||
311 | } | ||||||||||
312 | |||||||||||
313 | ShuffleVectorInst *SVI = dyn_cast<ShuffleVectorInst>(V); | ||||||||||
314 | // Restrict the following transformation to fixed-length vector. | ||||||||||
315 | if (SVI && isa<FixedVectorType>(SVI->getType())) { | ||||||||||
316 | unsigned LHSWidth = | ||||||||||
317 | cast<FixedVectorType>(SVI->getOperand(0)->getType())->getNumElements(); | ||||||||||
318 | int InEl = SVI->getMaskValue(EltNo); | ||||||||||
319 | if (InEl < 0) | ||||||||||
320 | return UndefValue::get(VTy->getElementType()); | ||||||||||
321 | if (InEl < (int)LHSWidth) | ||||||||||
322 | return findScalarElement(SVI->getOperand(0), InEl); | ||||||||||
323 | return findScalarElement(SVI->getOperand(1), InEl - LHSWidth); | ||||||||||
324 | } | ||||||||||
325 | |||||||||||
326 | // Extract a value from a vector add operation with a constant zero. | ||||||||||
327 | // TODO: Use getBinOpIdentity() to generalize this. | ||||||||||
328 | Value *Val; Constant *C; | ||||||||||
329 | if (match(V, m_Add(m_Value(Val), m_Constant(C)))) | ||||||||||
330 | if (Constant *Elt = C->getAggregateElement(EltNo)) | ||||||||||
331 | if (Elt->isNullValue()) | ||||||||||
332 | return findScalarElement(Val, EltNo); | ||||||||||
333 | |||||||||||
334 | // Otherwise, we don't know. | ||||||||||
335 | return nullptr; | ||||||||||
336 | } | ||||||||||
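// Illustrative example (hypothetical IR): given
//   %v = insertelement <4 x float> %w, float %x, i32 2
// findScalarElement(%v, 2) returns %x, findScalarElement(%v, 0) recurses into %w,
// and an out-of-range index such as 7 yields undef for this fixed-length type.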
337 | |||||||||||
338 | int llvm::getSplatIndex(ArrayRef<int> Mask) { | ||||||||||
339 | int SplatIndex = -1; | ||||||||||
340 | for (int M : Mask) { | ||||||||||
341 | // Ignore invalid (undefined) mask elements. | ||||||||||
342 | if (M < 0) | ||||||||||
343 | continue; | ||||||||||
344 | |||||||||||
345 | // There can be only 1 non-negative mask element value if this is a splat. | ||||||||||
346 | if (SplatIndex != -1 && SplatIndex != M) | ||||||||||
347 | return -1; | ||||||||||
348 | |||||||||||
349 | // Initialize the splat index to the 1st non-negative mask element. | ||||||||||
350 | SplatIndex = M; | ||||||||||
351 | } | ||||||||||
352 | assert((SplatIndex == -1 || SplatIndex >= 0) && "Negative index?"); | ||||||||||
353 | return SplatIndex; | ||||||||||
354 | } | ||||||||||
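// Illustrative example: getSplatIndex({3, -1, 3, 3}) returns 3 because all defined
// mask elements agree, while getSplatIndex({0, 1, 0, 1}) returns -1.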
355 | |||||||||||
356 | /// Get splat value if the input is a splat vector or return nullptr. | ||||||||||
357 | /// This function is not fully general. It checks only 2 cases: | ||||||||||
358 | /// the input value is (1) a splat constant vector or (2) a sequence | ||||||||||
359 | /// of instructions that broadcasts a scalar at element 0. | ||||||||||
360 | Value *llvm::getSplatValue(const Value *V) { | ||||||||||
361 | if (isa<VectorType>(V->getType())) | ||||||||||
362 | if (auto *C = dyn_cast<Constant>(V)) | ||||||||||
363 | return C->getSplatValue(); | ||||||||||
364 | |||||||||||
365 | // shuf (inselt ?, Splat, 0), ?, <0, undef, 0, ...> | ||||||||||
366 | Value *Splat; | ||||||||||
367 | if (match(V, | ||||||||||
368 | m_Shuffle(m_InsertElt(m_Value(), m_Value(Splat), m_ZeroInt()), | ||||||||||
369 | m_Value(), m_ZeroMask()))) | ||||||||||
370 | return Splat; | ||||||||||
371 | |||||||||||
372 | return nullptr; | ||||||||||
373 | } | ||||||||||
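// Illustrative example (hypothetical IR): the common broadcast idiom
//   %ins   = insertelement <4 x i32> undef, i32 %s, i32 0
//   %splat = shufflevector <4 x i32> %ins, <4 x i32> undef, <4 x i32> zeroinitializer
// matches the shuffle pattern above, so getSplatValue(%splat) returns %s.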
374 | |||||||||||
375 | bool llvm::isSplatValue(const Value *V, int Index, unsigned Depth) { | ||||||||||
376 | assert(Depth <= MaxAnalysisRecursionDepth && "Limit Search Depth"); | ||||||||||
377 | |||||||||||
378 | if (isa<VectorType>(V->getType())) { | ||||||||||
379 | if (isa<UndefValue>(V)) | ||||||||||
380 | return true; | ||||||||||
381 | // FIXME: We can allow undefs, but if Index was specified, we may want to | ||||||||||
382 | // check that the constant is defined at that index. | ||||||||||
383 | if (auto *C = dyn_cast<Constant>(V)) | ||||||||||
384 | return C->getSplatValue() != nullptr; | ||||||||||
385 | } | ||||||||||
386 | |||||||||||
387 | if (auto *Shuf = dyn_cast<ShuffleVectorInst>(V)) { | ||||||||||
388 | // FIXME: We can safely allow undefs here. If Index was specified, we will | ||||||||||
389 | // check that the mask elt is defined at the required index. | ||||||||||
390 | if (!is_splat(Shuf->getShuffleMask())) | ||||||||||
391 | return false; | ||||||||||
392 | |||||||||||
393 | // Match any index. | ||||||||||
394 | if (Index == -1) | ||||||||||
395 | return true; | ||||||||||
396 | |||||||||||
397 | // Match a specific element. The mask should be defined at and match the | ||||||||||
398 | // specified index. | ||||||||||
399 | return Shuf->getMaskValue(Index) == Index; | ||||||||||
400 | } | ||||||||||
401 | |||||||||||
402 | // The remaining tests are all recursive, so bail out if we hit the limit. | ||||||||||
403 | if (Depth++ == MaxAnalysisRecursionDepth) | ||||||||||
404 | return false; | ||||||||||
405 | |||||||||||
406 | // If both operands of a binop are splats, the result is a splat. | ||||||||||
407 | Value *X, *Y, *Z; | ||||||||||
408 | if (match(V, m_BinOp(m_Value(X), m_Value(Y)))) | ||||||||||
409 | return isSplatValue(X, Index, Depth) && isSplatValue(Y, Index, Depth); | ||||||||||
410 | |||||||||||
411 | // If all operands of a select are splats, the result is a splat. | ||||||||||
412 | if (match(V, m_Select(m_Value(X), m_Value(Y), m_Value(Z)))) | ||||||||||
413 | return isSplatValue(X, Index, Depth) && isSplatValue(Y, Index, Depth) && | ||||||||||
414 | isSplatValue(Z, Index, Depth); | ||||||||||
415 | |||||||||||
416 | // TODO: Add support for unary ops (fneg), casts, intrinsics (overflow ops). | ||||||||||
417 | |||||||||||
418 | return false; | ||||||||||
419 | } | ||||||||||
420 | |||||||||||
421 | void llvm::narrowShuffleMaskElts(int Scale, ArrayRef<int> Mask, | ||||||||||
422 | SmallVectorImpl<int> &ScaledMask) { | ||||||||||
423 | assert(Scale > 0 && "Unexpected scaling factor"); | ||||||||||
424 | |||||||||||
425 | // Fast-path: if no scaling, then it is just a copy. | ||||||||||
426 | if (Scale == 1) { | ||||||||||
427 | ScaledMask.assign(Mask.begin(), Mask.end()); | ||||||||||
428 | return; | ||||||||||
429 | } | ||||||||||
430 | |||||||||||
431 | ScaledMask.clear(); | ||||||||||
432 | for (int MaskElt : Mask) { | ||||||||||
433 | if (MaskElt >= 0) { | ||||||||||
434 | assert(((uint64_t)Scale * MaskElt + (Scale - 1)) <= INT32_MAX && | ||||||||||
435 | "Overflowed 32-bits"); | ||||||||||
436 | } | ||||||||||
437 | for (int SliceElt = 0; SliceElt != Scale; ++SliceElt) | ||||||||||
438 | ScaledMask.push_back(MaskElt < 0 ? MaskElt : Scale * MaskElt + SliceElt); | ||||||||||
439 | } | ||||||||||
440 | } | ||||||||||
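// Illustrative example: narrowShuffleMaskElts(2, {0, 2, -1}, ScaledMask) produces
// {0, 1, 4, 5, -1, -1}: each defined element M expands to the Scale consecutive
// narrow elements starting at Scale * M, and sentinel values are replicated.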
441 | |||||||||||
442 | bool llvm::widenShuffleMaskElts(int Scale, ArrayRef<int> Mask, | ||||||||||
443 | SmallVectorImpl<int> &ScaledMask) { | ||||||||||
444 | assert(Scale > 0 && "Unexpected scaling factor"); | ||||||||||
445 | |||||||||||
446 | // Fast-path: if no scaling, then it is just a copy. | ||||||||||
447 | if (Scale == 1) { | ||||||||||
448 | ScaledMask.assign(Mask.begin(), Mask.end()); | ||||||||||
449 | return true; | ||||||||||
450 | } | ||||||||||
451 | |||||||||||
452 | // We must map the original elements down evenly to a type with fewer elements. | ||||||||||
453 | int NumElts = Mask.size(); | ||||||||||
454 | if (NumElts % Scale != 0) | ||||||||||
455 | return false; | ||||||||||
456 | |||||||||||
457 | ScaledMask.clear(); | ||||||||||
458 | ScaledMask.reserve(NumElts / Scale); | ||||||||||
459 | |||||||||||
460 | // Step through the input mask by splitting into Scale-sized slices. | ||||||||||
461 | do { | ||||||||||
462 | ArrayRef<int> MaskSlice = Mask.take_front(Scale); | ||||||||||
463 | assert((int)MaskSlice.size() == Scale && "Expected Scale-sized slice."); | ||||||||||
464 | |||||||||||
465 | // The first element of the slice determines how we evaluate this slice. | ||||||||||
466 | int SliceFront = MaskSlice.front(); | ||||||||||
467 | if (SliceFront < 0) { | ||||||||||
468 | // Negative values (undef or other "sentinel" values) must be equal across | ||||||||||
469 | // the entire slice. | ||||||||||
470 | if (!is_splat(MaskSlice)) | ||||||||||
471 | return false; | ||||||||||
472 | ScaledMask.push_back(SliceFront); | ||||||||||
473 | } else { | ||||||||||
474 | // A positive mask element must be cleanly divisible. | ||||||||||
475 | if (SliceFront % Scale != 0) | ||||||||||
476 | return false; | ||||||||||
477 | // Elements of the slice must be consecutive. | ||||||||||
478 | for (int i = 1; i < Scale; ++i) | ||||||||||
479 | if (MaskSlice[i] != SliceFront + i) | ||||||||||
480 | return false; | ||||||||||
481 | ScaledMask.push_back(SliceFront / Scale); | ||||||||||
482 | } | ||||||||||
483 | Mask = Mask.drop_front(Scale); | ||||||||||
484 | } while (!Mask.empty()); | ||||||||||
485 | |||||||||||
486 | assert((int)ScaledMask.size() * Scale == NumElts && "Unexpected scaled mask"); | ||||||||||
487 | |||||||||||
488 | // All elements of the original mask can be scaled down to map to the elements | ||||||||||
489 | // of a mask with wider elements. | ||||||||||
490 | return true; | ||||||||||
491 | } | ||||||||||
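// Illustrative example: widenShuffleMaskElts(2, {0, 1, 6, 7}, ScaledMask) succeeds
// with {0, 3}, whereas {0, 2, 4, 6} fails because the slice {0, 2} is not a run of
// consecutive elements.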
492 | |||||||||||
493 | MapVector<Instruction *, uint64_t> | ||||||||||
494 | llvm::computeMinimumValueSizes(ArrayRef<BasicBlock *> Blocks, DemandedBits &DB, | ||||||||||
495 | const TargetTransformInfo *TTI) { | ||||||||||
496 | |||||||||||
497 | // DemandedBits will give us every value's live-out bits. But we want | ||||||||||
498 | // to ensure no extra casts would need to be inserted, so every DAG | ||||||||||
499 | // of connected values must have the same minimum bitwidth. | ||||||||||
500 | EquivalenceClasses<Value *> ECs; | ||||||||||
501 | SmallVector<Value *, 16> Worklist; | ||||||||||
502 | SmallPtrSet<Value *, 4> Roots; | ||||||||||
503 | SmallPtrSet<Value *, 16> Visited; | ||||||||||
504 | DenseMap<Value *, uint64_t> DBits; | ||||||||||
505 | SmallPtrSet<Instruction *, 4> InstructionSet; | ||||||||||
506 | MapVector<Instruction *, uint64_t> MinBWs; | ||||||||||
507 | |||||||||||
508 | // Determine the roots. We work bottom-up, from truncs or icmps. | ||||||||||
509 | bool SeenExtFromIllegalType = false; | ||||||||||
510 | for (auto *BB : Blocks) | ||||||||||
511 | for (auto &I : *BB) { | ||||||||||
512 | InstructionSet.insert(&I); | ||||||||||
513 | |||||||||||
514 | if (TTI && (isa<ZExtInst>(&I) || isa<SExtInst>(&I)) && | ||||||||||
515 | !TTI->isTypeLegal(I.getOperand(0)->getType())) | ||||||||||
516 | SeenExtFromIllegalType = true; | ||||||||||
517 | |||||||||||
518 | // Only deal with non-vector integers up to 64-bits wide. | ||||||||||
519 | if ((isa<TruncInst>(&I) || isa<ICmpInst>(&I)) && | ||||||||||
520 | !I.getType()->isVectorTy() && | ||||||||||
521 | I.getOperand(0)->getType()->getScalarSizeInBits() <= 64) { | ||||||||||
522 | // Don't make work for ourselves. If we know the loaded type is legal, | ||||||||||
523 | // don't add it to the worklist. | ||||||||||
524 | if (TTI && isa<TruncInst>(&I) && TTI->isTypeLegal(I.getType())) | ||||||||||
525 | continue; | ||||||||||
526 | |||||||||||
527 | Worklist.push_back(&I); | ||||||||||
528 | Roots.insert(&I); | ||||||||||
529 | } | ||||||||||
530 | } | ||||||||||
531 | // Early exit. | ||||||||||
532 | if (Worklist.empty() || (TTI && !SeenExtFromIllegalType)) | ||||||||||
533 | return MinBWs; | ||||||||||
534 | |||||||||||
535 | // Now proceed breadth-first, unioning values together. | ||||||||||
536 | while (!Worklist.empty()) { | ||||||||||
537 | Value *Val = Worklist.pop_back_val(); | ||||||||||
538 | Value *Leader = ECs.getOrInsertLeaderValue(Val); | ||||||||||
539 | |||||||||||
540 | if (Visited.count(Val)) | ||||||||||
541 | continue; | ||||||||||
542 | Visited.insert(Val); | ||||||||||
543 | |||||||||||
544 | // Non-instructions terminate a chain successfully. | ||||||||||
545 | if (!isa<Instruction>(Val)) | ||||||||||
546 | continue; | ||||||||||
547 | Instruction *I = cast<Instruction>(Val); | ||||||||||
548 | |||||||||||
549 | // If we encounter a type that is larger than 64 bits, we can't represent | ||||||||||
550 | // it so bail out. | ||||||||||
551 | if (DB.getDemandedBits(I).getBitWidth() > 64) | ||||||||||
552 | return MapVector<Instruction *, uint64_t>(); | ||||||||||
553 | |||||||||||
554 | uint64_t V = DB.getDemandedBits(I).getZExtValue(); | ||||||||||
555 | DBits[Leader] |= V; | ||||||||||
556 | DBits[I] = V; | ||||||||||
557 | |||||||||||
558 | // Casts, loads and instructions outside of our range terminate a chain | ||||||||||
559 | // successfully. | ||||||||||
560 | if (isa<SExtInst>(I) || isa<ZExtInst>(I) || isa<LoadInst>(I) || | ||||||||||
561 | !InstructionSet.count(I)) | ||||||||||
562 | continue; | ||||||||||
563 | |||||||||||
564 | // Unsafe casts terminate a chain unsuccessfully. We can't do anything | ||||||||||
565 | // useful with bitcasts, ptrtoints or inttoptrs and it'd be unsafe to | ||||||||||
566 | // transform anything that relies on them. | ||||||||||
567 | if (isa<BitCastInst>(I) || isa<PtrToIntInst>(I) || isa<IntToPtrInst>(I) || | ||||||||||
568 | !I->getType()->isIntegerTy()) { | ||||||||||
569 | DBits[Leader] |= ~0ULL; | ||||||||||
570 | continue; | ||||||||||
571 | } | ||||||||||
572 | |||||||||||
573 | // We don't modify the types of PHIs. Reductions will already have been | ||||||||||
574 | // truncated if possible, and inductions' sizes will have been chosen by | ||||||||||
575 | // indvars. | ||||||||||
576 | if (isa<PHINode>(I)) | ||||||||||
577 | continue; | ||||||||||
578 | |||||||||||
579 | if (DBits[Leader] == ~0ULL) | ||||||||||
580 | // All bits demanded, no point continuing. | ||||||||||
581 | continue; | ||||||||||
582 | |||||||||||
583 | for (Value *O : cast<User>(I)->operands()) { | ||||||||||
584 | ECs.unionSets(Leader, O); | ||||||||||
585 | Worklist.push_back(O); | ||||||||||
586 | } | ||||||||||
587 | } | ||||||||||
588 | |||||||||||
589 | // Now we've discovered all values, walk them to see if there are | ||||||||||
590 | // any users we didn't see. If there are, we can't optimize that | ||||||||||
591 | // chain. | ||||||||||
592 | for (auto &I : DBits) | ||||||||||
593 | for (auto *U : I.first->users()) | ||||||||||
594 | if (U->getType()->isIntegerTy() && DBits.count(U) == 0) | ||||||||||
595 | DBits[ECs.getOrInsertLeaderValue(I.first)] |= ~0ULL; | ||||||||||
596 | |||||||||||
597 | for (auto I = ECs.begin(), E = ECs.end(); I != E; ++I) { | ||||||||||
598 | uint64_t LeaderDemandedBits = 0; | ||||||||||
599 | for (Value *M : llvm::make_range(ECs.member_begin(I), ECs.member_end())) | ||||||||||
600 | LeaderDemandedBits |= DBits[M]; | ||||||||||
601 | |||||||||||
602 | uint64_t MinBW = (sizeof(LeaderDemandedBits) * 8) - | ||||||||||
603 | llvm::countLeadingZeros(LeaderDemandedBits); | ||||||||||
604 | // Round up to a power of 2 | ||||||||||
605 | if (!isPowerOf2_64((uint64_t)MinBW)) | ||||||||||
606 | MinBW = NextPowerOf2(MinBW); | ||||||||||
607 | |||||||||||
608 | // We don't modify the types of PHIs. Reductions will already have been | ||||||||||
609 | // truncated if possible, and inductions' sizes will have been chosen by | ||||||||||
610 | // indvars. | ||||||||||
611 | // If we are required to shrink a PHI, abandon this entire equivalence class. | ||||||||||
612 | bool Abort = false; | ||||||||||
613 | for (Value *M : llvm::make_range(ECs.member_begin(I), ECs.member_end())) | ||||||||||
614 | if (isa<PHINode>(M) && MinBW < M->getType()->getScalarSizeInBits()) { | ||||||||||
615 | Abort = true; | ||||||||||
616 | break; | ||||||||||
617 | } | ||||||||||
618 | if (Abort) | ||||||||||
619 | continue; | ||||||||||
620 | |||||||||||
621 | for (Value *M : llvm::make_range(ECs.member_begin(I), ECs.member_end())) { | ||||||||||
622 | if (!isa<Instruction>(M)) | ||||||||||
623 | continue; | ||||||||||
624 | Type *Ty = M->getType(); | ||||||||||
625 | if (Roots.count(M)) | ||||||||||
626 | Ty = cast<Instruction>(M)->getOperand(0)->getType(); | ||||||||||
627 | if (MinBW < Ty->getScalarSizeInBits()) | ||||||||||
628 | MinBWs[cast<Instruction>(M)] = MinBW; | ||||||||||
629 | } | ||||||||||
630 | } | ||||||||||
631 | |||||||||||
632 | return MinBWs; | ||||||||||
633 | } | ||||||||||
634 | |||||||||||
635 | /// Add all access groups in @p AccGroups to @p List. | ||||||||||
636 | template <typename ListT> | ||||||||||
637 | static void addToAccessGroupList(ListT &List, MDNode *AccGroups) { | ||||||||||
638 | // Interpret an access group as a list containing itself. | ||||||||||
639 | if (AccGroups->getNumOperands() == 0) { | ||||||||||
640 | assert(isValidAsAccessGroup(AccGroups) && "Node must be an access group"); | ||||||||||
641 | List.insert(AccGroups); | ||||||||||
642 | return; | ||||||||||
643 | } | ||||||||||
644 | |||||||||||
645 | for (auto &AccGroupListOp : AccGroups->operands()) { | ||||||||||
646 | auto *Item = cast<MDNode>(AccGroupListOp.get()); | ||||||||||
647 | assert(isValidAsAccessGroup(Item) && "List item must be an access group"); | ||||||||||
648 | List.insert(Item); | ||||||||||
649 | } | ||||||||||
650 | } | ||||||||||
651 | |||||||||||
652 | MDNode *llvm::uniteAccessGroups(MDNode *AccGroups1, MDNode *AccGroups2) { | ||||||||||
653 | if (!AccGroups1) | ||||||||||
654 | return AccGroups2; | ||||||||||
655 | if (!AccGroups2) | ||||||||||
656 | return AccGroups1; | ||||||||||
657 | if (AccGroups1 == AccGroups2) | ||||||||||
658 | return AccGroups1; | ||||||||||
659 | |||||||||||
660 | SmallSetVector<Metadata *, 4> Union; | ||||||||||
661 | addToAccessGroupList(Union, AccGroups1); | ||||||||||
662 | addToAccessGroupList(Union, AccGroups2); | ||||||||||
663 | |||||||||||
664 | if (Union.size() == 0) | ||||||||||
665 | return nullptr; | ||||||||||
666 | if (Union.size() == 1) | ||||||||||
667 | return cast<MDNode>(Union.front()); | ||||||||||
668 | |||||||||||
669 | LLVMContext &Ctx = AccGroups1->getContext(); | ||||||||||
670 | return MDNode::get(Ctx, Union.getArrayRef()); | ||||||||||
671 | } | ||||||||||
672 | |||||||||||
673 | MDNode *llvm::intersectAccessGroups(const Instruction *Inst1, | ||||||||||
674 | const Instruction *Inst2) { | ||||||||||
675 | bool MayAccessMem1 = Inst1->mayReadOrWriteMemory(); | ||||||||||
676 | bool MayAccessMem2 = Inst2->mayReadOrWriteMemory(); | ||||||||||
677 | |||||||||||
678 | if (!MayAccessMem1 && !MayAccessMem2) | ||||||||||
679 | return nullptr; | ||||||||||
680 | if (!MayAccessMem1) | ||||||||||
681 | return Inst2->getMetadata(LLVMContext::MD_access_group); | ||||||||||
682 | if (!MayAccessMem2) | ||||||||||
683 | return Inst1->getMetadata(LLVMContext::MD_access_group); | ||||||||||
684 | |||||||||||
685 | MDNode *MD1 = Inst1->getMetadata(LLVMContext::MD_access_group); | ||||||||||
686 | MDNode *MD2 = Inst2->getMetadata(LLVMContext::MD_access_group); | ||||||||||
687 | if (!MD1 || !MD2) | ||||||||||
688 | return nullptr; | ||||||||||
689 | if (MD1 == MD2) | ||||||||||
690 | return MD1; | ||||||||||
691 | |||||||||||
692 | // Use set for scalable 'contains' check. | ||||||||||
693 | SmallPtrSet<Metadata *, 4> AccGroupSet2; | ||||||||||
694 | addToAccessGroupList(AccGroupSet2, MD2); | ||||||||||
695 | |||||||||||
696 | SmallVector<Metadata *, 4> Intersection; | ||||||||||
697 | if (MD1->getNumOperands() == 0) { | ||||||||||
698 | assert(isValidAsAccessGroup(MD1) && "Node must be an access group"); | ||||||||||
699 | if (AccGroupSet2.count(MD1)) | ||||||||||
700 | Intersection.push_back(MD1); | ||||||||||
701 | } else { | ||||||||||
702 | for (const MDOperand &Node : MD1->operands()) { | ||||||||||
703 | auto *Item = cast<MDNode>(Node.get()); | ||||||||||
704 | assert(isValidAsAccessGroup(Item) && "List item must be an access group"); | ||||||||||
705 | if (AccGroupSet2.count(Item)) | ||||||||||
706 | Intersection.push_back(Item); | ||||||||||
707 | } | ||||||||||
708 | } | ||||||||||
709 | |||||||||||
710 | if (Intersection.size() == 0) | ||||||||||
711 | return nullptr; | ||||||||||
712 | if (Intersection.size() == 1) | ||||||||||
713 | return cast<MDNode>(Intersection.front()); | ||||||||||
714 | |||||||||||
715 | LLVMContext &Ctx = Inst1->getContext(); | ||||||||||
716 | return MDNode::get(Ctx, Intersection); | ||||||||||
717 | } | ||||||||||
718 | |||||||||||
719 | /// \returns \p I after propagating metadata from \p VL. | ||||||||||
720 | Instruction *llvm::propagateMetadata(Instruction *Inst, ArrayRef<Value *> VL) { | ||||||||||
721 | if (VL.empty()) | ||||||||||
722 | return Inst; | ||||||||||
723 | Instruction *I0 = cast<Instruction>(VL[0]); | ||||||||||
724 | SmallVector<std::pair<unsigned, MDNode *>, 4> Metadata; | ||||||||||
725 | I0->getAllMetadataOtherThanDebugLoc(Metadata); | ||||||||||
726 | |||||||||||
727 | for (auto Kind : {LLVMContext::MD_tbaa, LLVMContext::MD_alias_scope, | ||||||||||
728 | LLVMContext::MD_noalias, LLVMContext::MD_fpmath, | ||||||||||
729 | LLVMContext::MD_nontemporal, LLVMContext::MD_invariant_load, | ||||||||||
730 | LLVMContext::MD_access_group}) { | ||||||||||
731 | MDNode *MD = I0->getMetadata(Kind); | ||||||||||
732 | |||||||||||
733 | for (int J = 1, E = VL.size(); MD && J != E; ++J) { | ||||||||||
734 | const Instruction *IJ = cast<Instruction>(VL[J]); | ||||||||||
735 | MDNode *IMD = IJ->getMetadata(Kind); | ||||||||||
736 | switch (Kind) { | ||||||||||
737 | case LLVMContext::MD_tbaa: | ||||||||||
738 | MD = MDNode::getMostGenericTBAA(MD, IMD); | ||||||||||
739 | break; | ||||||||||
740 | case LLVMContext::MD_alias_scope: | ||||||||||
741 | MD = MDNode::getMostGenericAliasScope(MD, IMD); | ||||||||||
742 | break; | ||||||||||
743 | case LLVMContext::MD_fpmath: | ||||||||||
744 | MD = MDNode::getMostGenericFPMath(MD, IMD); | ||||||||||
745 | break; | ||||||||||
746 | case LLVMContext::MD_noalias: | ||||||||||
747 | case LLVMContext::MD_nontemporal: | ||||||||||
748 | case LLVMContext::MD_invariant_load: | ||||||||||
749 | MD = MDNode::intersect(MD, IMD); | ||||||||||
750 | break; | ||||||||||
751 | case LLVMContext::MD_access_group: | ||||||||||
752 | MD = intersectAccessGroups(Inst, IJ); | ||||||||||
753 | break; | ||||||||||
754 | default: | ||||||||||
755 | llvm_unreachable("unhandled metadata"); | ||||||||||
756 | } | ||||||||||
757 | } | ||||||||||
758 | |||||||||||
759 | Inst->setMetadata(Kind, MD); | ||||||||||
760 | } | ||||||||||
761 | |||||||||||
762 | return Inst; | ||||||||||
763 | } | ||||||||||
764 | |||||||||||
765 | Constant * | ||||||||||
766 | llvm::createBitMaskForGaps(IRBuilderBase &Builder, unsigned VF, | ||||||||||
767 | const InterleaveGroup<Instruction> &Group) { | ||||||||||
768 | // All 1's means mask is not needed. | ||||||||||
769 | if (Group.getNumMembers() == Group.getFactor()) | ||||||||||
770 | return nullptr; | ||||||||||
771 | |||||||||||
772 | // TODO: support reversed access. | ||||||||||
773 | assert(!Group.isReverse() && "Reversed group not supported."); | ||||||||||
774 | |||||||||||
775 | SmallVector<Constant *, 16> Mask; | ||||||||||
776 | for (unsigned i = 0; i < VF; i++) | ||||||||||
777 | for (unsigned j = 0; j < Group.getFactor(); ++j) { | ||||||||||
778 | unsigned HasMember = Group.getMember(j) ? 1 : 0; | ||||||||||
779 | Mask.push_back(Builder.getInt1(HasMember)); | ||||||||||
780 | } | ||||||||||
781 | |||||||||||
782 | return ConstantVector::get(Mask); | ||||||||||
783 | } | ||||||||||
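// Illustrative example (hypothetical group): for an interleave group of factor 3
// whose members occupy indices 0 and 2 (index 1 is a gap) and VF = 2, the returned
// mask is <i1 1, i1 0, i1 1, i1 1, i1 0, i1 1>.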
784 | |||||||||||
785 | llvm::SmallVector<int, 16> | ||||||||||
786 | llvm::createReplicatedMask(unsigned ReplicationFactor, unsigned VF) { | ||||||||||
787 | SmallVector<int, 16> MaskVec; | ||||||||||
788 | for (unsigned i = 0; i < VF; i++) | ||||||||||
789 | for (unsigned j = 0; j < ReplicationFactor; j++) | ||||||||||
790 | MaskVec.push_back(i); | ||||||||||
791 | |||||||||||
792 | return MaskVec; | ||||||||||
793 | } | ||||||||||
794 | |||||||||||
795 | llvm::SmallVector<int, 16> llvm::createInterleaveMask(unsigned VF, | ||||||||||
796 | unsigned NumVecs) { | ||||||||||
797 | SmallVector<int, 16> Mask; | ||||||||||
798 | for (unsigned i = 0; i < VF; i++) | ||||||||||
799 | for (unsigned j = 0; j < NumVecs; j++) | ||||||||||
800 | Mask.push_back(j * VF + i); | ||||||||||
801 | |||||||||||
802 | return Mask; | ||||||||||
803 | } | ||||||||||
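// Illustrative example: createInterleaveMask(4, 2) returns <0, 4, 1, 5, 2, 6, 3, 7>,
// which picks lane i of each of the two concatenated input vectors in turn.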
804 | |||||||||||
805 | llvm::SmallVector<int, 16> | ||||||||||
806 | llvm::createStrideMask(unsigned Start, unsigned Stride, unsigned VF) { | ||||||||||
807 | SmallVector<int, 16> Mask; | ||||||||||
808 | for (unsigned i = 0; i < VF; i++) | ||||||||||
809 | Mask.push_back(Start + i * Stride); | ||||||||||
810 | |||||||||||
811 | return Mask; | ||||||||||
812 | } | ||||||||||
813 | |||||||||||
814 | llvm::SmallVector<int, 16> llvm::createSequentialMask(unsigned Start, | ||||||||||
815 | unsigned NumInts, | ||||||||||
816 | unsigned NumUndefs) { | ||||||||||
817 | SmallVector<int, 16> Mask; | ||||||||||
818 | for (unsigned i = 0; i < NumInts; i++) | ||||||||||
819 | Mask.push_back(Start + i); | ||||||||||
820 | |||||||||||
821 | for (unsigned i = 0; i < NumUndefs; i++) | ||||||||||
822 | Mask.push_back(-1); | ||||||||||
823 | |||||||||||
824 | return Mask; | ||||||||||
825 | } | ||||||||||
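// Illustrative example: createSequentialMask(0, 4, 2) returns <0, 1, 2, 3, -1, -1>;
// the trailing -1 (undef) lanes are how concatenateTwoVectors below pads a narrower
// second operand.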
826 | |||||||||||
827 | /// A helper function for concatenating vectors. This function concatenates two | ||||||||||
828 | /// vectors having the same element type. If the second vector has fewer | ||||||||||
829 | /// elements than the first, it is padded with undefs. | ||||||||||
830 | static Value *concatenateTwoVectors(IRBuilderBase &Builder, Value *V1, | ||||||||||
831 | Value *V2) { | ||||||||||
832 | VectorType *VecTy1 = dyn_cast<VectorType>(V1->getType()); | ||||||||||
833 | VectorType *VecTy2 = dyn_cast<VectorType>(V2->getType()); | ||||||||||
834 | assert(VecTy1 && VecTy2 && | ||||||||||
835 | VecTy1->getScalarType() == VecTy2->getScalarType() && | ||||||||||
836 | "Expect two vectors with the same element type"); | ||||||||||
837 | |||||||||||
838 | unsigned NumElts1 = cast<FixedVectorType>(VecTy1)->getNumElements(); | ||||||||||
839 | unsigned NumElts2 = cast<FixedVectorType>(VecTy2)->getNumElements(); | ||||||||||
840 | assert(NumElts1 >= NumElts2 && "Unexpect the first vector has less elements"); | ||||||||||
841 | |||||||||||
842 | if (NumElts1 > NumElts2) { | ||||||||||
843 | // Extend with UNDEFs. | ||||||||||
844 | V2 = Builder.CreateShuffleVector( | ||||||||||
845 | V2, createSequentialMask(0, NumElts2, NumElts1 - NumElts2)); | ||||||||||
846 | } | ||||||||||
847 | |||||||||||
848 | return Builder.CreateShuffleVector( | ||||||||||
849 | V1, V2, createSequentialMask(0, NumElts1 + NumElts2, 0)); | ||||||||||
850 | } | ||||||||||
851 | |||||||||||
852 | Value *llvm::concatenateVectors(IRBuilderBase &Builder, | ||||||||||
853 | ArrayRef<Value *> Vecs) { | ||||||||||
854 | unsigned NumVecs = Vecs.size(); | ||||||||||
855 | assert(NumVecs > 1 && "Should be at least two vectors"); | ||||||||||
856 | |||||||||||
857 | SmallVector<Value *, 8> ResList; | ||||||||||
858 | ResList.append(Vecs.begin(), Vecs.end()); | ||||||||||
859 | do { | ||||||||||
860 | SmallVector<Value *, 8> TmpList; | ||||||||||
861 | for (unsigned i = 0; i < NumVecs - 1; i += 2) { | ||||||||||
862 | Value *V0 = ResList[i], *V1 = ResList[i + 1]; | ||||||||||
863 | assert((V0->getType() == V1->getType() || i == NumVecs - 2) && | ||||||||||
864 | "Only the last vector may have a different type"); | ||||||||||
865 | |||||||||||
866 | TmpList.push_back(concatenateTwoVectors(Builder, V0, V1)); | ||||||||||
867 | } | ||||||||||
868 | |||||||||||
869 | // Push the last vector if the total number of vectors is odd. | ||||||||||
870 | if (NumVecs % 2 != 0) | ||||||||||
871 | TmpList.push_back(ResList[NumVecs - 1]); | ||||||||||
872 | |||||||||||
873 | ResList = TmpList; | ||||||||||
874 | NumVecs = ResList.size(); | ||||||||||
875 | } while (NumVecs > 1); | ||||||||||
876 | |||||||||||
877 | return ResList[0]; | ||||||||||
878 | } | ||||||||||
879 | |||||||||||
880 | bool llvm::maskIsAllZeroOrUndef(Value *Mask) { | ||||||||||
881 | assert(isa<VectorType>(Mask->getType()) && | ||||||||||
882 | isa<IntegerType>(Mask->getType()->getScalarType()) && | ||||||||||
883 | cast<IntegerType>(Mask->getType()->getScalarType())->getBitWidth() == | ||||||||||
884 | 1 && | ||||||||||
885 | "Mask must be a vector of i1"); | ||||||||||
886 | |||||||||||
887 | auto *ConstMask = dyn_cast<Constant>(Mask); | ||||||||||
888 | if (!ConstMask) | ||||||||||
889 | return false; | ||||||||||
890 | if (ConstMask->isNullValue() || isa<UndefValue>(ConstMask)) | ||||||||||
891 | return true; | ||||||||||
892 | if (isa<ScalableVectorType>(ConstMask->getType())) | ||||||||||
893 | return false; | ||||||||||
894 | for (unsigned | ||||||||||
895 | I = 0, | ||||||||||
896 | E = cast<FixedVectorType>(ConstMask->getType())->getNumElements(); | ||||||||||
897 | I != E; ++I) { | ||||||||||
898 | if (auto *MaskElt = ConstMask->getAggregateElement(I)) | ||||||||||
899 | if (MaskElt->isNullValue() || isa<UndefValue>(MaskElt)) | ||||||||||
900 | continue; | ||||||||||
901 | return false; | ||||||||||
902 | } | ||||||||||
903 | return true; | ||||||||||
904 | } | ||||||||||
905 | |||||||||||
906 | bool llvm::maskIsAllOneOrUndef(Value *Mask) { | ||||||||||
907 | assert(isa<VectorType>(Mask->getType()) && | ||||||||||
908 | isa<IntegerType>(Mask->getType()->getScalarType()) && | ||||||||||
909 | cast<IntegerType>(Mask->getType()->getScalarType())->getBitWidth() == | ||||||||||
910 | 1 && | ||||||||||
911 | "Mask must be a vector of i1"); | ||||||||||
912 | |||||||||||
913 | auto *ConstMask = dyn_cast<Constant>(Mask); | ||||||||||
914 | if (!ConstMask) | ||||||||||
915 | return false; | ||||||||||
916 | if (ConstMask->isAllOnesValue() || isa<UndefValue>(ConstMask)) | ||||||||||
917 | return true; | ||||||||||
918 | if (isa<ScalableVectorType>(ConstMask->getType())) | ||||||||||
919 | return false; | ||||||||||
920 | for (unsigned | ||||||||||
921 | I = 0, | ||||||||||
922 | E = cast<FixedVectorType>(ConstMask->getType())->getNumElements(); | ||||||||||
923 | I != E; ++I) { | ||||||||||
924 | if (auto *MaskElt = ConstMask->getAggregateElement(I)) | ||||||||||
925 | if (MaskElt->isAllOnesValue() || isa<UndefValue>(MaskElt)) | ||||||||||
926 | continue; | ||||||||||
927 | return false; | ||||||||||
928 | } | ||||||||||
929 | return true; | ||||||||||
930 | } | ||||||||||
931 | |||||||||||
932 | /// TODO: This is a lot like known bits, but for | ||||||||||
933 | /// vectors. Is there something we can common this with? | ||||||||||
934 | APInt llvm::possiblyDemandedEltsInMask(Value *Mask) { | ||||||||||
935 | assert(isa<FixedVectorType>(Mask->getType()) && | ||||||||||
936 | isa<IntegerType>(Mask->getType()->getScalarType()) && | ||||||||||
937 | cast<IntegerType>(Mask->getType()->getScalarType())->getBitWidth() == | ||||||||||
938 | 1 && | ||||||||||
939 | "Mask must be a fixed width vector of i1"); | ||||||||||
940 | |||||||||||
941 | const unsigned VWidth = | ||||||||||
942 | cast<FixedVectorType>(Mask->getType())->getNumElements(); | ||||||||||
943 | APInt DemandedElts = APInt::getAllOnesValue(VWidth); | ||||||||||
944 | if (auto *CV = dyn_cast<ConstantVector>(Mask)) | ||||||||||
945 | for (unsigned i = 0; i < VWidth; i++) | ||||||||||
946 | if (CV->getAggregateElement(i)->isNullValue()) | ||||||||||
947 | DemandedElts.clearBit(i); | ||||||||||
948 | return DemandedElts; | ||||||||||
949 | } | ||||||||||
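// Illustrative example: for the constant mask <i1 1, i1 0, i1 1, i1 1> the result
// is 0b1101 (bit 1 cleared); any non-constant mask conservatively demands all lanes.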
950 | |||||||||||
951 | bool InterleavedAccessInfo::isStrided(int Stride) { | ||||||||||
952 | unsigned Factor = std::abs(Stride); | ||||||||||
953 | return Factor >= 2 && Factor <= MaxInterleaveGroupFactor; | ||||||||||
954 | } | ||||||||||
955 | |||||||||||
956 | void InterleavedAccessInfo::collectConstStrideAccesses( | ||||||||||
957 | MapVector<Instruction *, StrideDescriptor> &AccessStrideInfo, | ||||||||||
958 | const ValueToValueMap &Strides) { | ||||||||||
959 | auto &DL = TheLoop->getHeader()->getModule()->getDataLayout(); | ||||||||||
960 | |||||||||||
961 | // Since it's desired that the load/store instructions be maintained in | ||||||||||
962 | // "program order" for the interleaved access analysis, we have to visit the | ||||||||||
963 | // blocks in the loop in reverse postorder (i.e., in a topological order). | ||||||||||
964 | // Such an ordering will ensure that any load/store that may be executed | ||||||||||
965 | // before a second load/store will precede the second load/store in | ||||||||||
966 | // AccessStrideInfo. | ||||||||||
967 | LoopBlocksDFS DFS(TheLoop); | ||||||||||
968 | DFS.perform(LI); | ||||||||||
969 | for (BasicBlock *BB : make_range(DFS.beginRPO(), DFS.endRPO())) | ||||||||||
970 | for (auto &I : *BB) { | ||||||||||
971 | Value *Ptr = getLoadStorePointerOperand(&I); | ||||||||||
972 | if (!Ptr) | ||||||||||
973 | continue; | ||||||||||
974 | Type *ElementTy = getLoadStoreType(&I); | ||||||||||
975 | |||||||||||
976 | // We don't check wrapping here because we don't know yet if Ptr will be | ||||||||||
977 | // part of a full group or a group with gaps. Checking wrapping for all | ||||||||||
978 | // pointers (even those that end up in groups with no gaps) will be overly | ||||||||||
979 | // conservative. For full groups, wrapping should be ok since if we would | ||||||||||
980 | // wrap around the address space we would do a memory access at nullptr | ||||||||||
981 | // even without the transformation. The wrapping checks are therefore | ||||||||||
982 | // deferred until after we've formed the interleaved groups. | ||||||||||
983 | int64_t Stride = getPtrStride(PSE, Ptr, TheLoop, Strides, | ||||||||||
984 | /*Assume=*/true, /*ShouldCheckWrap=*/false); | ||||||||||
985 | |||||||||||
986 | const SCEV *Scev = replaceSymbolicStrideSCEV(PSE, Strides, Ptr); | ||||||||||
987 | uint64_t Size = DL.getTypeAllocSize(ElementTy); | ||||||||||
988 | AccessStrideInfo[&I] = StrideDescriptor(Stride, Scev, Size, | ||||||||||
989 | getLoadStoreAlignment(&I)); | ||||||||||
990 | } | ||||||||||
991 | } | ||||||||||
992 | |||||||||||
993 | // Analyze interleaved accesses and collect them into interleaved load and | ||||||||||
994 | // store groups. | ||||||||||
995 | // | ||||||||||
996 | // When generating code for an interleaved load group, we effectively hoist all | ||||||||||
997 | // loads in the group to the location of the first load in program order. When | ||||||||||
998 | // generating code for an interleaved store group, we sink all stores to the | ||||||||||
999 | // location of the last store. This code motion can change the order of load | ||||||||||
1000 | // and store instructions and may break dependences. | ||||||||||
1001 | // | ||||||||||
1002 | // The code generation strategy mentioned above ensures that we won't violate | ||||||||||
1003 | // any write-after-read (WAR) dependences. | ||||||||||
1004 | // | ||||||||||
1005 | // E.g., for the WAR dependence: a = A[i]; // (1) | ||||||||||
1006 | // A[i] = b; // (2) | ||||||||||
1007 | // | ||||||||||
1008 | // The store group of (2) is always inserted at or below (2), and the load | ||||||||||
1009 | // group of (1) is always inserted at or above (1). Thus, the instructions will | ||||||||||
1010 | // never be reordered. All other dependences are checked to ensure the | ||||||||||
1011 | // correctness of the instruction reordering. | ||||||||||
1012 | // | ||||||||||
1013 | // The algorithm visits all memory accesses in the loop in bottom-up program | ||||||||||
1014 | // order. Program order is established by traversing the blocks in the loop in | ||||||||||
1015 | // reverse postorder when collecting the accesses. | ||||||||||
1016 | // | ||||||||||
1017 | // We visit the memory accesses in bottom-up order because it can simplify the | ||||||||||
1018 | // construction of store groups in the presence of write-after-write (WAW) | ||||||||||
1019 | // dependences. | ||||||||||
1020 | // | ||||||||||
1021 | // E.g., for the WAW dependence: A[i] = a; // (1) | ||||||||||
1022 | // A[i] = b; // (2) | ||||||||||
1023 | // A[i + 1] = c; // (3) | ||||||||||
1024 | // | ||||||||||
1025 | // We will first create a store group with (3) and (2). (1) can't be added to | ||||||||||
1026 | // this group because it and (2) are dependent. However, (1) can be grouped | ||||||||||
1027 | // with other accesses that may precede it in program order. Note that a | ||||||||||
1028 | // bottom-up order does not imply that WAW dependences should not be checked. | ||||||||||
1029 | void InterleavedAccessInfo::analyzeInterleaving( | ||||||||||
1030 | bool EnablePredicatedInterleavedMemAccesses) { | ||||||||||
1031 | LLVM_DEBUG(dbgs() << "LV: Analyzing interleaved accesses...\n"); | ||||||||||
1032 | const ValueToValueMap &Strides = LAI->getSymbolicStrides(); | ||||||||||
1033 | |||||||||||
1034 | // Holds all accesses with a constant stride. | ||||||||||
1035 | MapVector<Instruction *, StrideDescriptor> AccessStrideInfo; | ||||||||||
1036 | collectConstStrideAccesses(AccessStrideInfo, Strides); | ||||||||||
1037 | |||||||||||
1038 | if (AccessStrideInfo.empty()) | ||||||||||
1039 | return; | ||||||||||
1040 | |||||||||||
1041 | // Collect the dependences in the loop. | ||||||||||
1042 | collectDependences(); | ||||||||||
1043 | |||||||||||
1044 | // Holds all interleaved store groups temporarily. | ||||||||||
1045 | SmallSetVector<InterleaveGroup<Instruction> *, 4> StoreGroups; | ||||||||||
1046 | // Holds all interleaved load groups temporarily. | ||||||||||
1047 | SmallSetVector<InterleaveGroup<Instruction> *, 4> LoadGroups; | ||||||||||
1048 | |||||||||||
1049 | // Search in bottom-up program order for pairs of accesses (A and B) that can | ||||||||||
1050 | // form interleaved load or store groups. In the algorithm below, access A | ||||||||||
1051 | // precedes access B in program order. We initialize a group for B in the | ||||||||||
1052 | // outer loop of the algorithm, and then in the inner loop, we attempt to | ||||||||||
1053 | // insert each A into B's group if: | ||||||||||
1054 | // | ||||||||||
1055 | // 1. A and B have the same stride, | ||||||||||
1056 | // 2. A and B have the same memory object size, and | ||||||||||
1057 | // 3. A belongs in B's group according to its distance from B. | ||||||||||
1058 | // | ||||||||||
1059 | // Special care is taken to ensure group formation will not break any | ||||||||||
1060 | // dependences. | ||||||||||
1061 | for (auto BI = AccessStrideInfo.rbegin(), E = AccessStrideInfo.rend(); | ||||||||||
1062 | BI != E; ++BI) { | ||||||||||
1063 | Instruction *B = BI->first; | ||||||||||
1064 | StrideDescriptor DesB = BI->second; | ||||||||||
1065 | |||||||||||
1066 | // Initialize a group for B if it has an allowable stride. Even if we don't | ||||||||||
1067 | // create a group for B, we continue with the bottom-up algorithm to ensure | ||||||||||
1068 | // we don't break any of B's dependences. | ||||||||||
1069 | InterleaveGroup<Instruction> *Group = nullptr; | ||||||||||
1070 | if (isStrided(DesB.Stride) && | ||||||||||
1071 | (!isPredicated(B->getParent()) || EnablePredicatedInterleavedMemAccesses)) { | ||||||||||
1072 | Group = getInterleaveGroup(B); | ||||||||||
1073 | if (!Group) { | ||||||||||
1074 | LLVM_DEBUG(dbgs() << "LV: Creating an interleave group with:" << *B | ||||||||||
1075 | << '\n'); | ||||||||||
1076 | Group = createInterleaveGroup(B, DesB.Stride, DesB.Alignment); | ||||||||||
1077 | } | ||||||||||
1078 | if (B->mayWriteToMemory()) | ||||||||||
1079 | StoreGroups.insert(Group); | ||||||||||
1080 | else | ||||||||||
1081 | LoadGroups.insert(Group); | ||||||||||
1082 | } | ||||||||||
1083 | |||||||||||
1084 | for (auto AI = std::next(BI); AI != E; ++AI) { | ||||||||||
1085 | Instruction *A = AI->first; | ||||||||||
1086 | StrideDescriptor DesA = AI->second; | ||||||||||
1087 | |||||||||||
1088 | // Our code motion strategy implies that we can't have dependences | ||||||||||
1089 | // between accesses in an interleaved group and other accesses located | ||||||||||
1090 | // between the first and last member of the group. Note that this also | ||||||||||
1091 | // means that a group can't have more than one member at a given offset. | ||||||||||
1092 | // The accesses in a group can have dependences with other accesses, but | ||||||||||
1093 | // we must ensure we don't extend the boundaries of the group such that | ||||||||||
1094 | // we encompass those dependent accesses. | ||||||||||
1095 | // | ||||||||||
1096 | // For example, assume we have the sequence of accesses shown below in a | ||||||||||
1097 | // stride-2 loop: | ||||||||||
1098 | // | ||||||||||
1099 | // (1, 2) is a group | A[i] = a; // (1) | ||||||||||
1100 | // | A[i-1] = b; // (2) | | ||||||||||
1101 | // A[i-3] = c; // (3) | ||||||||||
1102 | // A[i] = d; // (4) | (2, 4) is not a group | ||||||||||
1103 | // | ||||||||||
1104 | // Because accesses (2) and (3) are dependent, we can group (2) with (1) | ||||||||||
1105 | // but not with (4). If we did, the dependent access (3) would be within | ||||||||||
1106 | // the boundaries of the (2, 4) group. | ||||||||||
1107 | if (!canReorderMemAccessesForInterleavedGroups(&*AI, &*BI)) { | ||||||||||
1108 | // If a dependence exists and A is already in a group, we know that A | ||||||||||
1109 | // must be a store since A precedes B and WAR dependences are allowed. | ||||||||||
1110 | // Thus, A would be sunk below B. We release A's group to prevent this | ||||||||||
1111 | // illegal code motion. A will then be free to form another group with | ||||||||||
1112 | // instructions that precede it. | ||||||||||
1113 | if (isInterleaved(A)) { | ||||||||||
1114 | InterleaveGroup<Instruction> *StoreGroup = getInterleaveGroup(A); | ||||||||||
1115 | |||||||||||
1116 | LLVM_DEBUG(dbgs() << "LV: Invalidated store group due to "do { } while (false) | ||||||||||
1117 | "dependence between " << *A << " and "<< *B << '\n')do { } while (false); | ||||||||||
1118 | |||||||||||
1119 | StoreGroups.remove(StoreGroup); | ||||||||||
1120 | releaseGroup(StoreGroup); | ||||||||||
1121 | } | ||||||||||
1122 | |||||||||||
1123 | // If a dependence exists and A is not already in a group (or it was | ||||||||||
1124 | // and we just released it), B might be hoisted above A (if B is a | ||||||||||
1125 | // load) or another store might be sunk below A (if B is a store). In | ||||||||||
1126 | // either case, we can't add additional instructions to B's group. B | ||||||||||
1127 | // will only form a group with instructions that it precedes. | ||||||||||
1128 | break; | ||||||||||
1129 | } | ||||||||||
1130 | |||||||||||
1131 | // At this point, we've checked for illegal code motion. If either A or B | ||||||||||
1132 | // isn't strided, there's nothing left to do. | ||||||||||
1133 | if (!isStrided(DesA.Stride) || !isStrided(DesB.Stride)) | ||||||||||
1134 | continue; | ||||||||||
1135 | |||||||||||
1136 | // Ignore A if it's already in a group or isn't the same kind of memory | ||||||||||
1137 | // operation as B. | ||||||||||
1138 | // Note that mayReadFromMemory() isn't mutually exclusive with | ||||||||||
1139 | // mayWriteToMemory() in the case of atomic loads. We shouldn't see those | ||||||||||
1140 | // here; canVectorizeMemory() should have returned false - except when | ||||||||||
1141 | // we asked for optimization remarks. | ||||||||||
1142 | if (isInterleaved(A) || | ||||||||||
1143 | (A->mayReadFromMemory() != B->mayReadFromMemory()) || | ||||||||||
1144 | (A->mayWriteToMemory() != B->mayWriteToMemory())) | ||||||||||
1145 | continue; | ||||||||||
1146 | |||||||||||
1147 | // Check rules 1 and 2. Ignore A if its stride or size is different from | ||||||||||
1148 | // that of B. | ||||||||||
1149 | if (DesA.Stride != DesB.Stride || DesA.Size != DesB.Size) | ||||||||||
1150 | continue; | ||||||||||
1151 | |||||||||||
1152 | // Ignore A if the memory objects of A and B don't belong to the same | ||||||||||
1153 | // address space. | ||||||||||
1154 | if (getLoadStoreAddressSpace(A) != getLoadStoreAddressSpace(B)) | ||||||||||
1155 | continue; | ||||||||||
1156 | |||||||||||
1157 | // Calculate the distance from A to B. | ||||||||||
1158 | const SCEVConstant *DistToB = dyn_cast<SCEVConstant>( | ||||||||||
1159 | PSE.getSE()->getMinusSCEV(DesA.Scev, DesB.Scev)); | ||||||||||
1160 | if (!DistToB) | ||||||||||
1161 | continue; | ||||||||||
1162 | int64_t DistanceToB = DistToB->getAPInt().getSExtValue(); | ||||||||||
1163 | |||||||||||
1164 | // Check rule 3. Ignore A if its distance to B is not a multiple of the | ||||||||||
1165 | // size. | ||||||||||
1166 | if (DistanceToB % static_cast<int64_t>(DesB.Size)) | ||||||||||
1167 | continue; | ||||||||||
1168 | |||||||||||
1169 | // All members of a predicated interleave-group must have the same predicate, | ||||||||||
1170 | // and currently must reside in the same BB. | ||||||||||
1171 | BasicBlock *BlockA = A->getParent(); | ||||||||||
1172 | BasicBlock *BlockB = B->getParent(); | ||||||||||
1173 | if ((isPredicated(BlockA) || isPredicated(BlockB)) && | ||||||||||
1174 | (!EnablePredicatedInterleavedMemAccesses || BlockA != BlockB)) | ||||||||||
1175 | continue; | ||||||||||
1176 | |||||||||||
1177 | // The index of A is the index of B plus A's distance to B in multiples | ||||||||||
1178 | // of the size. | ||||||||||
1179 | int IndexA = | ||||||||||
1180 | Group->getIndex(B) + DistanceToB / static_cast<int64_t>(DesB.Size); | ||||||||||
1181 | |||||||||||
1182 | // Try to insert A into B's group. | ||||||||||
1183 | if (Group->insertMember(A, IndexA, DesA.Alignment)) { | ||||||||||
1184 | LLVM_DEBUG(dbgs() << "LV: Inserted:" << *A << '\n'do { } while (false) | ||||||||||
1185 | << " into the interleave group with" << *Bdo { } while (false) | ||||||||||
1186 | << '\n')do { } while (false); | ||||||||||
1187 | InterleaveGroupMap[A] = Group; | ||||||||||
1188 | |||||||||||
1189 | // Set the first load in program order as the insert position. | ||||||||||
1190 | if (A->mayReadFromMemory()) | ||||||||||
1191 | Group->setInsertPos(A); | ||||||||||
1192 | } | ||||||||||
1193 | } // Iteration over A accesses. | ||||||||||
1194 | } // Iteration over B accesses. | ||||||||||
1195 | |||||||||||
1196 | // Remove interleaved store groups with gaps. | ||||||||||
1197 | for (auto *Group : StoreGroups) | ||||||||||
1198 | if (Group->getNumMembers() != Group->getFactor()) { | ||||||||||
1199 | LLVM_DEBUG(do { } while (false) | ||||||||||
1200 | dbgs() << "LV: Invalidate candidate interleaved store group due "do { } while (false) | ||||||||||
1201 | "to gaps.\n")do { } while (false); | ||||||||||
1202 | releaseGroup(Group); | ||||||||||
1203 | } | ||||||||||
1204 | // Remove interleaved groups with gaps (currently only loads) whose memory | ||||||||||
1205 | // accesses may wrap around. We have to revisit the getPtrStride analysis, | ||||||||||
1206 | // this time with ShouldCheckWrap=true, since collectConstStrideAccesses does | ||||||||||
1207 | // not check wrapping (see documentation there). | ||||||||||
1208 | // FORNOW we use Assume=false; | ||||||||||
1209 | // TODO: Change to Assume=true but making sure we don't exceed the threshold | ||||||||||
1210 | // of runtime SCEV assumptions checks (thereby potentially failing to | ||||||||||
1211 | // vectorize altogether). | ||||||||||
1212 | // Additional optional optimizations: | ||||||||||
1213 | // TODO: If we are peeling the loop and we know that the first pointer doesn't | ||||||||||
1214 | // wrap then we can deduce that all pointers in the group don't wrap. | ||||||||||
1215 | // This means that we can forcefully peel the loop in order to only have to | ||||||||||
1216 | // check the first pointer for no-wrap. When we change to use Assume=true | ||||||||||
1217 | // we'll only need at most one runtime check per interleaved group. | ||||||||||
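As a sketch of what a gapped load group looks like at the source level (illustrative only, not taken from this file):

    // Factor-2 load group with a gap: only slot 0 is read. The widened load
    // would also touch A[2*I + 1], so it must not wrap past the allocation,
    // or the last iteration has to run in a scalar epilogue.
    int SumEven(const int *A, int N) {
      int Sum = 0;
      for (int I = 0; I < N; ++I)
        Sum += A[2 * I];
      return Sum;
    }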
1218 | for (auto *Group : LoadGroups) { | ||||||||||
1219 | // Case 1: A full group. We can skip the checks; for full groups, if the wide | ||||||||||
1220 | // load would wrap around the address space we would do a memory access at | ||||||||||
1221 | // nullptr even without the transformation. | ||||||||||
1222 | if (Group->getNumMembers() == Group->getFactor()) | ||||||||||
1223 | continue; | ||||||||||
1224 | |||||||||||
1225 | // Case 2: If first and last members of the group don't wrap this implies | ||||||||||
1226 | // that all the pointers in the group don't wrap. | ||||||||||
1227 | // So we check only group member 0 (which is always guaranteed to exist), | ||||||||||
1228 | // and group member Factor - 1; if the latter doesn't exist we rely on | ||||||||||
1229 | // peeling (if it is a non-reversed access -- see Case 3). | ||||||||||
1230 | Value *FirstMemberPtr = getLoadStorePointerOperand(Group->getMember(0)); | ||||||||||
1231 | if (!getPtrStride(PSE, FirstMemberPtr, TheLoop, Strides, /*Assume=*/false, | ||||||||||
1232 | /*ShouldCheckWrap=*/true)) { | ||||||||||
1233 | LLVM_DEBUG(do { } while (false) | ||||||||||
1234 | dbgs() << "LV: Invalidate candidate interleaved group due to "do { } while (false) | ||||||||||
1235 | "first group member potentially pointer-wrapping.\n")do { } while (false); | ||||||||||
1236 | releaseGroup(Group); | ||||||||||
1237 | continue; | ||||||||||
1238 | } | ||||||||||
1239 | Instruction *LastMember = Group->getMember(Group->getFactor() - 1); | ||||||||||
1240 | if (LastMember) { | ||||||||||
1241 | Value *LastMemberPtr = getLoadStorePointerOperand(LastMember); | ||||||||||
1242 | if (!getPtrStride(PSE, LastMemberPtr, TheLoop, Strides, /*Assume=*/false, | ||||||||||
1243 | /*ShouldCheckWrap=*/true)) { | ||||||||||
1244 | LLVM_DEBUG(do { } while (false) | ||||||||||
1245 | dbgs() << "LV: Invalidate candidate interleaved group due to "do { } while (false) | ||||||||||
1246 | "last group member potentially pointer-wrapping.\n")do { } while (false); | ||||||||||
1247 | releaseGroup(Group); | ||||||||||
1248 | } | ||||||||||
1249 | } else { | ||||||||||
1250 | // Case 3: A non-reversed interleaved load group with gaps: We need | ||||||||||
1251 | // to execute at least one scalar epilogue iteration. This will ensure | ||||||||||
1252 | // we don't speculatively access memory out-of-bounds. We only need | ||||||||||
1253 | // to look for a member at index factor - 1, since every group must have | ||||||||||
1254 | // a member at index zero. | ||||||||||
1255 | if (Group->isReverse()) { | ||||||||||
1256 | LLVM_DEBUG(do { } while (false) | ||||||||||
1257 | dbgs() << "LV: Invalidate candidate interleaved group due to "do { } while (false) | ||||||||||
1258 | "a reverse access with gaps.\n")do { } while (false); | ||||||||||
1259 | releaseGroup(Group); | ||||||||||
1260 | continue; | ||||||||||
1261 | } | ||||||||||
1262 | LLVM_DEBUG(do { } while (false) | ||||||||||
1263 | dbgs() << "LV: Interleaved group requires epilogue iteration.\n")do { } while (false); | ||||||||||
1264 | RequiresScalarEpilogue = true; | ||||||||||
1265 | } | ||||||||||
1266 | } | ||||||||||
1267 | } | ||||||||||
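A minimal sketch of how a client could walk the groups this analysis leaves behind; IAI, I, and process are illustrative names, not part of this file.

    // Look up the group (if any) that instruction I was placed in and visit
    // every occupied slot; gaps show up as null members.
    if (const InterleaveGroup<Instruction> *G = IAI.getInterleaveGroup(I))
      for (unsigned Idx = 0; Idx < G->getFactor(); ++Idx)
        if (Instruction *Member = G->getMember(Idx))
          process(Member, Idx); // hypothetical consumer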
1268 | |||||||||||
1269 | void InterleavedAccessInfo::invalidateGroupsRequiringScalarEpilogue() { | ||||||||||
1270 | // If no group had triggered the requirement to create an epilogue loop, | ||||||||||
1271 | // there is nothing to do. | ||||||||||
1272 | if (!requiresScalarEpilogue()) | ||||||||||
1273 | return; | ||||||||||
1274 | |||||||||||
1275 | bool ReleasedGroup = false; | ||||||||||
1276 | // Release groups requiring scalar epilogues. Note that this also removes them | ||||||||||
1277 | // from InterleaveGroups. | ||||||||||
1278 | for (auto *Group : make_early_inc_range(InterleaveGroups)) { | ||||||||||
1279 | if (!Group->requiresScalarEpilogue()) | ||||||||||
1280 | continue; | ||||||||||
1281 | LLVM_DEBUG(do { } while (false) | ||||||||||
1282 | dbgs()do { } while (false) | ||||||||||
1283 | << "LV: Invalidate candidate interleaved group due to gaps that "do { } while (false) | ||||||||||
1284 | "require a scalar epilogue (not allowed under optsize) and cannot "do { } while (false) | ||||||||||
1285 | "be masked (not enabled). \n")do { } while (false); | ||||||||||
1286 | releaseGroup(Group); | ||||||||||
1287 | ReleasedGroup = true; | ||||||||||
1288 | } | ||||||||||
1289 | assert(ReleasedGroup && "At least one group must be invalidated, as a "((void)0) | ||||||||||
1290 | "scalar epilogue was required")((void)0); | ||||||||||
1291 | (void)ReleasedGroup; | ||||||||||
1292 | RequiresScalarEpilogue = false; | ||||||||||
1293 | } | ||||||||||
1294 | |||||||||||
1295 | template <typename InstT> | ||||||||||
1296 | void InterleaveGroup<InstT>::addMetadata(InstT *NewInst) const { | ||||||||||
1297 | llvm_unreachable("addMetadata can only be used for Instruction")__builtin_unreachable(); | ||||||||||
1298 | } | ||||||||||
1299 | |||||||||||
1300 | namespace llvm { | ||||||||||
1301 | template <> | ||||||||||
1302 | void InterleaveGroup<Instruction>::addMetadata(Instruction *NewInst) const { | ||||||||||
1303 | SmallVector<Value *, 4> VL; | ||||||||||
1304 | std::transform(Members.begin(), Members.end(), std::back_inserter(VL), | ||||||||||
1305 | [](std::pair<int, Instruction *> p) { return p.second; }); | ||||||||||
1306 | propagateMetadata(NewInst, VL); | ||||||||||
1307 | } | ||||||||||
1308 | } | ||||||||||
1309 | |||||||||||
1310 | std::string VFABI::mangleTLIVectorName(StringRef VectorName, | ||||||||||
1311 | StringRef ScalarName, unsigned numArgs, | ||||||||||
1312 | ElementCount VF) { | ||||||||||
1313 | SmallString<256> Buffer; | ||||||||||
1314 | llvm::raw_svector_ostream Out(Buffer); | ||||||||||
1315 | Out << "_ZGV" << VFABI::_LLVM_ << "N"; | ||||||||||
1316 | if (VF.isScalable()) | ||||||||||
1317 | Out << 'x'; | ||||||||||
1318 | else | ||||||||||
1319 | Out << VF.getFixedValue(); | ||||||||||
1320 | for (unsigned I = 0; I < numArgs; ++I) | ||||||||||
1321 | Out << "v"; | ||||||||||
1322 | Out << "_" << ScalarName << "(" << VectorName << ")"; | ||||||||||
1323 | return std::string(Out.str()); | ||||||||||
1324 | } | ||||||||||
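A worked example of the string this produces, using placeholder TLI names ("sinf"/"vsinf" are only for illustration):

    // Fixed VF of 4 and one argument mangled as "v":
    //   "_ZGV" + "_LLVM_" + "N" + "4" + "v" + "_sinf(vsinf)"
    //   == "_ZGV_LLVM_N4v_sinf(vsinf)"
    std::string S = VFABI::mangleTLIVectorName("vsinf", "sinf", /*numArgs=*/1,
                                               ElementCount::getFixed(4));
    // With a scalable VF the <vlen> digit becomes 'x':
    //   "_ZGV_LLVM_Nxv_sinf(vsinf)".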
1325 | |||||||||||
1326 | void VFABI::getVectorVariantNames( | ||||||||||
1327 | const CallInst &CI, SmallVectorImpl<std::string> &VariantMappings) { | ||||||||||
1328 | const StringRef S = | ||||||||||
1329 | CI.getAttribute(AttributeList::FunctionIndex, VFABI::MappingsAttrName) | ||||||||||
1330 | .getValueAsString(); | ||||||||||
1331 | if (S.empty()) | ||||||||||
1332 | return; | ||||||||||
1333 | |||||||||||
1334 | SmallVector<StringRef, 8> ListAttr; | ||||||||||
1335 | S.split(ListAttr, ","); | ||||||||||
1336 | |||||||||||
1337 | for (auto &S : SetVector<StringRef>(ListAttr.begin(), ListAttr.end())) { | ||||||||||
1338 | #ifndef NDEBUG1 | ||||||||||
1339 | LLVM_DEBUG(dbgs() << "VFABI: adding mapping '" << S << "'\n")do { } while (false); | ||||||||||
1340 | Optional<VFInfo> Info = VFABI::tryDemangleForVFABI(S, *(CI.getModule())); | ||||||||||
1341 | assert(Info.hasValue() && "Invalid name for a VFABI variant.")((void)0); | ||||||||||
1342 | assert(CI.getModule()->getFunction(Info.getValue().VectorName) &&((void)0) | ||||||||||
1343 | "Vector function is missing.")((void)0); | ||||||||||
1344 | #endif | ||||||||||
1345 | VariantMappings.push_back(std::string(S)); | ||||||||||
1346 | } | ||||||||||
1347 | } | ||||||||||
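A usage sketch, assuming CI is a CallInst whose "vector-function-abi-variant" attribute carries two (illustrative) mangled names separated by a comma:

    //   "_ZGV_LLVM_N2v_foo(foo_vec2),_ZGV_LLVM_N4v_foo(foo_vec4)"
    SmallVector<std::string, 8> Variants;
    VFABI::getVectorVariantNames(CI, Variants);
    // Variants now holds the two mangled strings, split on ','; if the
    // attribute is absent, the vector is simply left empty.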
1348 | |||||||||||
1349 | bool VFShape::hasValidParameterList() const { | ||||||||||
1350 | for (unsigned Pos = 0, NumParams = Parameters.size(); Pos < NumParams; | ||||||||||
1351 | ++Pos) { | ||||||||||
1352 | assert(Parameters[Pos].ParamPos == Pos && "Broken parameter list.")((void)0); | ||||||||||
1353 | |||||||||||
1354 | switch (Parameters[Pos].ParamKind) { | ||||||||||
1355 | default: // Nothing to check. | ||||||||||
1356 | break; | ||||||||||
1357 | case VFParamKind::OMP_Linear: | ||||||||||
1358 | case VFParamKind::OMP_LinearRef: | ||||||||||
1359 | case VFParamKind::OMP_LinearVal: | ||||||||||
1360 | case VFParamKind::OMP_LinearUVal: | ||||||||||
1361 | // Compile time linear steps must be non-zero. | ||||||||||
1362 | if (Parameters[Pos].LinearStepOrPos == 0) | ||||||||||
1363 | return false; | ||||||||||
1364 | break; | ||||||||||
1365 | case VFParamKind::OMP_LinearPos: | ||||||||||
1366 | case VFParamKind::OMP_LinearRefPos: | ||||||||||
1367 | case VFParamKind::OMP_LinearValPos: | ||||||||||
1368 | case VFParamKind::OMP_LinearUValPos: | ||||||||||
1369 | // The runtime linear step must refer to some other | ||||||||||
1370 | // parameter in the signature. | ||||||||||
1371 | if (Parameters[Pos].LinearStepOrPos >= int(NumParams)) | ||||||||||
1372 | return false; | ||||||||||
1373 | // The linear step parameter must be marked as uniform. | ||||||||||
1374 | if (Parameters[Parameters[Pos].LinearStepOrPos].ParamKind != | ||||||||||
1375 | VFParamKind::OMP_Uniform) | ||||||||||
1376 | return false; | ||||||||||
1377 | // The linear step parameter can't point at itself. | ||||||||||
1378 | if (Parameters[Pos].LinearStepOrPos == int(Pos)) | ||||||||||
1379 | return false; | ||||||||||
1380 | break; | ||||||||||
1381 | case VFParamKind::GlobalPredicate: | ||||||||||
1382 | // The global predicate must be unique. It can be placed anywhere in the | ||||||||||
1383 | // signature. | ||||||||||
1384 | for (unsigned NextPos = Pos + 1; NextPos < NumParams; ++NextPos) | ||||||||||
1385 | if (Parameters[NextPos].ParamKind == VFParamKind::GlobalPredicate) | ||||||||||
1386 | return false; | ||||||||||
1387 | break; | ||||||||||
1388 | } | ||||||||||
1389 | } | ||||||||||
1390 | return true; | ||||||||||
1391 | } |
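A minimal sketch of a parameter list these rules accept, built by hand for illustration: parameter 0 is linear with its runtime step held in parameter 1, so parameter 1 must be OMP_Uniform and must not be position 0 itself.

    VFShape Shape;
    Shape.VF = ElementCount::getFixed(4);
    Shape.Parameters = {
        VFParameter({0, VFParamKind::OMP_LinearPos, /*LinearStepOrPos=*/1}),
        VFParameter({1, VFParamKind::OMP_Uniform})};
    bool Valid = Shape.hasValidParameterList(); // true for this list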
1 | // -*- C++ -*- |
2 | //===----------------------------------------------------------------------===// |
3 | // |
4 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
5 | // See https://llvm.org/LICENSE.txt for license information. |
6 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
7 | // |
8 | //===----------------------------------------------------------------------===// |
9 | |
10 | #ifndef _LIBCPP___ITERATOR_REVERSE_ITERATOR_H |
11 | #define _LIBCPP___ITERATOR_REVERSE_ITERATOR_H |
12 | |
13 | #include <__config> |
14 | #include <__iterator/iterator.h> |
15 | #include <__iterator/iterator_traits.h> |
16 | #include <__memory/addressof.h> |
17 | #include <type_traits> |
18 | |
19 | #if !defined(_LIBCPP_HAS_NO_PRAGMA_SYSTEM_HEADER) |
20 | #pragma GCC system_header |
21 | #endif |
22 | |
23 | _LIBCPP_PUSH_MACROSpush_macro("min") push_macro("max") |
24 | #include <__undef_macros> |
25 | |
26 | _LIBCPP_BEGIN_NAMESPACE_STDnamespace std { inline namespace __1 { |
27 | |
28 | template <class _Tp, class = void> |
29 | struct __is_stashing_iterator : false_type {}; |
30 | |
31 | template <class _Tp> |
32 | struct __is_stashing_iterator<_Tp, typename __void_t<typename _Tp::__stashing_iterator_tag>::type> |
33 | : true_type {}; |
34 | |
35 | _LIBCPP_SUPPRESS_DEPRECATED_PUSHGCC diagnostic push GCC diagnostic ignored "-Wdeprecated" GCC diagnostic ignored "-Wdeprecated-declarations" |
36 | template <class _Iter> |
37 | class _LIBCPP_TEMPLATE_VIS__attribute__ ((__type_visibility__("default"))) reverse_iterator |
38 | #if _LIBCPP_STD_VER14 <= 14 || !defined(_LIBCPP_ABI_NO_ITERATOR_BASES) |
39 | : public iterator<typename iterator_traits<_Iter>::iterator_category, |
40 | typename iterator_traits<_Iter>::value_type, |
41 | typename iterator_traits<_Iter>::difference_type, |
42 | typename iterator_traits<_Iter>::pointer, |
43 | typename iterator_traits<_Iter>::reference> |
44 | #endif |
45 | { |
46 | _LIBCPP_SUPPRESS_DEPRECATED_POPGCC diagnostic pop |
47 | private: |
48 | #ifndef _LIBCPP_ABI_NO_ITERATOR_BASES |
49 | _Iter __t; // no longer used as of LWG #2360, not removed due to ABI break |
50 | #endif |
51 | |
52 | static_assert(!__is_stashing_iterator<_Iter>::value, |
53 | "The specified iterator type cannot be used with reverse_iterator; " |
54 | "Using stashing iterators with reverse_iterator causes undefined behavior"); |
55 | |
56 | protected: |
57 | _Iter current; |
58 | public: |
59 | typedef _Iter iterator_type; |
60 | typedef typename iterator_traits<_Iter>::difference_type difference_type; |
61 | typedef typename iterator_traits<_Iter>::reference reference; |
62 | typedef typename iterator_traits<_Iter>::pointer pointer; |
63 | typedef _If<__is_cpp17_random_access_iterator<_Iter>::value, |
64 | random_access_iterator_tag, |
65 | typename iterator_traits<_Iter>::iterator_category> iterator_category; |
66 | typedef typename iterator_traits<_Iter>::value_type value_type; |
67 | |
68 | #if _LIBCPP_STD_VER14 > 17 |
69 | typedef _If<__is_cpp17_random_access_iterator<_Iter>::value, |
70 | random_access_iterator_tag, |
71 | bidirectional_iterator_tag> iterator_concept; |
72 | #endif |
73 | |
74 | #ifndef _LIBCPP_ABI_NO_ITERATOR_BASES |
75 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
76 | reverse_iterator() : __t(), current() {} |
77 | |
78 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
79 | explicit reverse_iterator(_Iter __x) : __t(__x), current(__x) {} |
80 | |
81 | template <class _Up, class = _EnableIf< |
82 | !is_same<_Up, _Iter>::value && is_convertible<_Up const&, _Iter>::value |
83 | > > |
84 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
85 | reverse_iterator(const reverse_iterator<_Up>& __u) |
86 | : __t(__u.base()), current(__u.base()) |
87 | { } |
88 | |
89 | template <class _Up, class = _EnableIf< |
90 | !is_same<_Up, _Iter>::value && |
91 | is_convertible<_Up const&, _Iter>::value && |
92 | is_assignable<_Up const&, _Iter>::value |
93 | > > |
94 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
95 | reverse_iterator& operator=(const reverse_iterator<_Up>& __u) { |
96 | __t = current = __u.base(); |
97 | return *this; |
98 | } |
99 | #else |
100 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
101 | reverse_iterator() : current() {} |
102 | |
103 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
104 | explicit reverse_iterator(_Iter __x) : current(__x) {} |
105 | |
106 | template <class _Up, class = _EnableIf< |
107 | !is_same<_Up, _Iter>::value && is_convertible<_Up const&, _Iter>::value |
108 | > > |
109 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
110 | reverse_iterator(const reverse_iterator<_Up>& __u) |
111 | : current(__u.base()) |
112 | { } |
113 | |
114 | template <class _Up, class = _EnableIf< |
115 | !is_same<_Up, _Iter>::value && |
116 | is_convertible<_Up const&, _Iter>::value && |
117 | is_assignable<_Up const&, _Iter>::value |
118 | > > |
119 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
120 | reverse_iterator& operator=(const reverse_iterator<_Up>& __u) { |
121 | current = __u.base(); |
122 | return *this; |
123 | } |
124 | #endif |
125 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
126 | _Iter base() const {return current;} |
127 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
128 | reference operator*() const {_Iter __tmp = current; return *--__tmp;} |
129 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
130 | pointer operator->() const {return _VSTDstd::__1::addressof(operator*());} |
131 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
132 | reverse_iterator& operator++() {--current; return *this;} |
133 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
134 | reverse_iterator operator++(int) {reverse_iterator __tmp(*this); --current; return __tmp;} |
135 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
136 | reverse_iterator& operator--() {++current; return *this;} |
137 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
138 | reverse_iterator operator--(int) {reverse_iterator __tmp(*this); ++current; return __tmp;} |
139 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
140 | reverse_iterator operator+ (difference_type __n) const {return reverse_iterator(current - __n);} |
141 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
142 | reverse_iterator& operator+=(difference_type __n) {current -= __n; return *this;} |
143 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
144 | reverse_iterator operator- (difference_type __n) const {return reverse_iterator(current + __n);} |
145 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
146 | reverse_iterator& operator-=(difference_type __n) {current += __n; return *this;} |
147 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
148 | reference operator[](difference_type __n) const {return *(*this + __n);} |
149 | }; |
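A small usage sketch of the adaptor defined above: the stored `current` iterator sits one position past the element the reverse_iterator observably refers to.

    #include <cassert>
    #include <vector>

    void reverse_iterator_demo() {
      std::vector<int> v{1, 2, 3};
      std::reverse_iterator<std::vector<int>::iterator> r(v.end());
      assert(*r == 3);             // operator* dereferences *--tmp
      assert(r.base() == v.end()); // base() is one past the referenced element
      ++r;                         // decrements current; now refers to 2
      assert(*(r + 1) == 1);       // operator+ subtracts from current
    }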
150 | |
151 | template <class _Iter1, class _Iter2> |
152 | inline _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
153 | bool |
154 | operator==(const reverse_iterator<_Iter1>& __x, const reverse_iterator<_Iter2>& __y) |
155 | { |
156 | return __x.base() == __y.base(); |
157 | } |
158 | |
159 | template <class _Iter1, class _Iter2> |
160 | inline _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
161 | bool |
162 | operator<(const reverse_iterator<_Iter1>& __x, const reverse_iterator<_Iter2>& __y) |
163 | { |
164 | return __x.base() > __y.base(); |
165 | } |
166 | |
167 | template <class _Iter1, class _Iter2> |
168 | inline _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
169 | bool |
170 | operator!=(const reverse_iterator<_Iter1>& __x, const reverse_iterator<_Iter2>& __y) |
171 | { |
172 | return __x.base() != __y.base(); |
173 | } |
174 | |
175 | template <class _Iter1, class _Iter2> |
176 | inline _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
177 | bool |
178 | operator>(const reverse_iterator<_Iter1>& __x, const reverse_iterator<_Iter2>& __y) |
179 | { |
180 | return __x.base() < __y.base(); |
181 | } |
182 | |
183 | template <class _Iter1, class _Iter2> |
184 | inline _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
185 | bool |
186 | operator>=(const reverse_iterator<_Iter1>& __x, const reverse_iterator<_Iter2>& __y) |
187 | { |
188 | return __x.base() <= __y.base(); |
189 | } |
190 | |
191 | template <class _Iter1, class _Iter2> |
192 | inline _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
193 | bool |
194 | operator<=(const reverse_iterator<_Iter1>& __x, const reverse_iterator<_Iter2>& __y) |
195 | { |
196 | return __x.base() >= __y.base(); |
197 | } |
198 | |
199 | #ifndef _LIBCPP_CXX03_LANG |
200 | template <class _Iter1, class _Iter2> |
201 | inline _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
202 | auto |
203 | operator-(const reverse_iterator<_Iter1>& __x, const reverse_iterator<_Iter2>& __y) |
204 | -> decltype(__y.base() - __x.base()) |
205 | { |
206 | return __y.base() - __x.base(); |
207 | } |
208 | #else |
209 | template <class _Iter1, class _Iter2> |
210 | inline _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) |
211 | typename reverse_iterator<_Iter1>::difference_type |
212 | operator-(const reverse_iterator<_Iter1>& __x, const reverse_iterator<_Iter2>& __y) |
213 | { |
214 | return __y.base() - __x.base(); |
215 | } |
216 | #endif |
217 | |
218 | template <class _Iter> |
219 | inline _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
220 | reverse_iterator<_Iter> |
221 | operator+(typename reverse_iterator<_Iter>::difference_type __n, const reverse_iterator<_Iter>& __x) |
222 | { |
223 | return reverse_iterator<_Iter>(__x.base() - __n); |
224 | } |
225 | |
226 | #if _LIBCPP_STD_VER14 > 11 |
227 | template <class _Iter> |
228 | inline _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_AFTER_CXX14 |
229 | reverse_iterator<_Iter> make_reverse_iterator(_Iter __i) |
230 | { |
231 | return reverse_iterator<_Iter>(__i); |
232 | } |
233 | #endif |
234 | |
235 | _LIBCPP_END_NAMESPACE_STD} } |
236 | |
237 | _LIBCPP_POP_MACROSpop_macro("min") pop_macro("max") |
238 | |
239 | #endif // _LIBCPP___ITERATOR_REVERSE_ITERATOR_H |
1 | // -*- C++ -*- |
2 | //===----------------------------------------------------------------------===// |
3 | // |
4 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
5 | // See https://llvm.org/LICENSE.txt for license information. |
6 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
7 | // |
8 | //===----------------------------------------------------------------------===// |
9 | |
10 | #ifndef _LIBCPP___ITERATOR_WRAP_ITER_H |
11 | #define _LIBCPP___ITERATOR_WRAP_ITER_H |
12 | |
13 | #include <__config> |
14 | #include <__debug> |
15 | #include <__iterator/iterator_traits.h> |
16 | #include <__memory/pointer_traits.h> // __to_address |
17 | #include <type_traits> |
18 | |
19 | #if !defined(_LIBCPP_HAS_NO_PRAGMA_SYSTEM_HEADER) |
20 | #pragma GCC system_header |
21 | #endif |
22 | |
23 | _LIBCPP_PUSH_MACROSpush_macro("min") push_macro("max") |
24 | #include <__undef_macros> |
25 | |
26 | _LIBCPP_BEGIN_NAMESPACE_STDnamespace std { inline namespace __1 { |
27 | |
28 | template <class _Iter> |
29 | class __wrap_iter |
30 | { |
31 | public: |
32 | typedef _Iter iterator_type; |
33 | typedef typename iterator_traits<iterator_type>::value_type value_type; |
34 | typedef typename iterator_traits<iterator_type>::difference_type difference_type; |
35 | typedef typename iterator_traits<iterator_type>::pointer pointer; |
36 | typedef typename iterator_traits<iterator_type>::reference reference; |
37 | typedef typename iterator_traits<iterator_type>::iterator_category iterator_category; |
38 | #if _LIBCPP_STD_VER14 > 17 |
39 | typedef contiguous_iterator_tag iterator_concept; |
40 | #endif |
41 | |
42 | private: |
43 | iterator_type __i; |
44 | public: |
45 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr __wrap_iter() _NOEXCEPTnoexcept |
46 | #if _LIBCPP_STD_VER14 > 11 |
47 | : __i{} |
48 | #endif |
49 | { |
50 | #if _LIBCPP_DEBUG_LEVEL0 == 2 |
51 | __get_db()->__insert_i(this); |
52 | #endif |
53 | } |
54 | template <class _Up> _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
55 | __wrap_iter(const __wrap_iter<_Up>& __u, |
56 | typename enable_if<is_convertible<_Up, iterator_type>::value>::type* = nullptr) _NOEXCEPTnoexcept |
57 | : __i(__u.base()) |
58 | { |
59 | #if _LIBCPP_DEBUG_LEVEL0 == 2 |
60 | __get_db()->__iterator_copy(this, &__u); |
61 | #endif |
62 | } |
63 | #if _LIBCPP_DEBUG_LEVEL0 == 2 |
64 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
65 | __wrap_iter(const __wrap_iter& __x) |
66 | : __i(__x.base()) |
67 | { |
68 | __get_db()->__iterator_copy(this, &__x); |
69 | } |
70 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
71 | __wrap_iter& operator=(const __wrap_iter& __x) |
72 | { |
73 | if (this != &__x) |
74 | { |
75 | __get_db()->__iterator_copy(this, &__x); |
76 | __i = __x.__i; |
77 | } |
78 | return *this; |
79 | } |
80 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
81 | ~__wrap_iter() |
82 | { |
83 | __get_db()->__erase_i(this); |
84 | } |
85 | #endif |
86 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr reference operator*() const _NOEXCEPTnoexcept |
87 | { |
88 | #if _LIBCPP_DEBUG_LEVEL0 == 2 |
89 | _LIBCPP_ASSERT(__get_const_db()->__dereferenceable(this),((void)0) |
90 | "Attempted to dereference a non-dereferenceable iterator")((void)0); |
91 | #endif |
92 | return *__i; |
93 | } |
94 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr pointer operator->() const _NOEXCEPTnoexcept |
95 | { |
96 | #if _LIBCPP_DEBUG_LEVEL0 == 2 |
97 | _LIBCPP_ASSERT(__get_const_db()->__dereferenceable(this),((void)0) |
98 | "Attempted to dereference a non-dereferenceable iterator")((void)0); |
99 | #endif |
100 | return _VSTDstd::__1::__to_address(__i); |
101 | } |
102 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr __wrap_iter& operator++() _NOEXCEPTnoexcept |
103 | { |
104 | #if _LIBCPP_DEBUG_LEVEL0 == 2 |
105 | _LIBCPP_ASSERT(__get_const_db()->__dereferenceable(this),((void)0) |
106 | "Attempted to increment a non-incrementable iterator")((void)0); |
107 | #endif |
108 | ++__i; |
109 | return *this; |
110 | } |
111 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr __wrap_iter operator++(int) _NOEXCEPTnoexcept |
112 | {__wrap_iter __tmp(*this); ++(*this); return __tmp;} |
113 | |
114 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr __wrap_iter& operator--() _NOEXCEPTnoexcept |
115 | { |
116 | #if _LIBCPP_DEBUG_LEVEL0 == 2 |
117 | _LIBCPP_ASSERT(__get_const_db()->__decrementable(this),((void)0) |
118 | "Attempted to decrement a non-decrementable iterator")((void)0); |
119 | #endif |
120 | --__i; |
121 | return *this; |
122 | } |
123 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr __wrap_iter operator--(int) _NOEXCEPTnoexcept |
124 | {__wrap_iter __tmp(*this); --(*this); return __tmp;} |
125 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr __wrap_iter operator+ (difference_type __n) const _NOEXCEPTnoexcept |
126 | {__wrap_iter __w(*this); __w += __n; return __w;} |
127 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr __wrap_iter& operator+=(difference_type __n) _NOEXCEPTnoexcept |
128 | { |
129 | #if _LIBCPP_DEBUG_LEVEL0 == 2 |
130 | _LIBCPP_ASSERT(__get_const_db()->__addable(this, __n),((void)0) |
131 | "Attempted to add/subtract an iterator outside its valid range")((void)0); |
132 | #endif |
133 | __i += __n; |
134 | return *this; |
135 | } |
136 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr __wrap_iter operator- (difference_type __n) const _NOEXCEPTnoexcept |
137 | {return *this + (-__n);} |
138 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr __wrap_iter& operator-=(difference_type __n) _NOEXCEPTnoexcept |
139 | {*this += -__n; return *this;} |
140 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr reference operator[](difference_type __n) const _NOEXCEPTnoexcept |
141 | { |
142 | #if _LIBCPP_DEBUG_LEVEL0 == 2 |
143 | _LIBCPP_ASSERT(__get_const_db()->__subscriptable(this, __n),((void)0) |
144 | "Attempted to subscript an iterator outside its valid range")((void)0); |
145 | #endif |
146 | return __i[__n]; |
147 | } |
148 | |
149 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr iterator_type base() const _NOEXCEPTnoexcept {return __i;} |
150 | |
151 | private: |
152 | #if _LIBCPP_DEBUG_LEVEL0 == 2 |
153 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr __wrap_iter(const void* __p, iterator_type __x) : __i(__x) |
154 | { |
155 | __get_db()->__insert_ic(this, __p); |
156 | } |
157 | #else |
158 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr __wrap_iter(iterator_type __x) _NOEXCEPTnoexcept : __i(__x) {} |
159 | #endif |
160 | |
161 | template <class _Up> friend class __wrap_iter; |
162 | template <class _CharT, class _Traits, class _Alloc> friend class basic_string; |
163 | template <class _Tp, class _Alloc> friend class _LIBCPP_TEMPLATE_VIS__attribute__ ((__type_visibility__("default"))) vector; |
164 | template <class _Tp, size_t> friend class _LIBCPP_TEMPLATE_VIS__attribute__ ((__type_visibility__("default"))) span; |
165 | }; |
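An illustrative sketch of how this wrapper behaves in practice (assuming libc++, where vector<int>::iterator is a __wrap_iter over int*): every operation forwards to the wrapped pointer, plus the optional debug-mode checks above.

    #include <cassert>
    #include <vector>

    void wrap_iter_demo() {
      std::vector<int> v{10, 20, 30};
      auto It = v.begin() + 1;      // under libc++: a __wrap_iter<int*>
      assert(*It == 20);            // operator* returns *__i
      assert(&*It == v.data() + 1); // arithmetic maps directly onto the pointer
    }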
166 | |
167 | template <class _Iter1> |
168 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
169 | bool operator==(const __wrap_iter<_Iter1>& __x, const __wrap_iter<_Iter1>& __y) _NOEXCEPTnoexcept |
170 | { |
171 | return __x.base() == __y.base(); |
172 | } |
173 | |
174 | template <class _Iter1, class _Iter2> |
175 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
176 | bool operator==(const __wrap_iter<_Iter1>& __x, const __wrap_iter<_Iter2>& __y) _NOEXCEPTnoexcept |
177 | { |
178 | return __x.base() == __y.base(); |
179 | } |
180 | |
181 | template <class _Iter1> |
182 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
183 | bool operator<(const __wrap_iter<_Iter1>& __x, const __wrap_iter<_Iter1>& __y) _NOEXCEPTnoexcept |
184 | { |
185 | #if _LIBCPP_DEBUG_LEVEL0 == 2 |
186 | _LIBCPP_ASSERT(__get_const_db()->__less_than_comparable(&__x, &__y),((void)0) |
187 | "Attempted to compare incomparable iterators")((void)0); |
188 | #endif |
189 | return __x.base() < __y.base(); |
190 | } |
191 | |
192 | template <class _Iter1, class _Iter2> |
193 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
194 | bool operator<(const __wrap_iter<_Iter1>& __x, const __wrap_iter<_Iter2>& __y) _NOEXCEPTnoexcept |
195 | { |
196 | #if _LIBCPP_DEBUG_LEVEL0 == 2 |
197 | _LIBCPP_ASSERT(__get_const_db()->__less_than_comparable(&__x, &__y),((void)0) |
198 | "Attempted to compare incomparable iterators")((void)0); |
199 | #endif |
200 | return __x.base() < __y.base(); |
201 | } |
202 | |
203 | template <class _Iter1> |
204 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
205 | bool operator!=(const __wrap_iter<_Iter1>& __x, const __wrap_iter<_Iter1>& __y) _NOEXCEPTnoexcept |
206 | { |
207 | return !(__x == __y); |
208 | } |
209 | |
210 | template <class _Iter1, class _Iter2> |
211 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
212 | bool operator!=(const __wrap_iter<_Iter1>& __x, const __wrap_iter<_Iter2>& __y) _NOEXCEPTnoexcept |
213 | { |
214 | return !(__x == __y); |
215 | } |
216 | |
217 | template <class _Iter1> |
218 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
219 | bool operator>(const __wrap_iter<_Iter1>& __x, const __wrap_iter<_Iter1>& __y) _NOEXCEPTnoexcept |
220 | { |
221 | return __y < __x; |
222 | } |
223 | |
224 | template <class _Iter1, class _Iter2> |
225 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
226 | bool operator>(const __wrap_iter<_Iter1>& __x, const __wrap_iter<_Iter2>& __y) _NOEXCEPTnoexcept |
227 | { |
228 | return __y < __x; |
229 | } |
230 | |
231 | template <class _Iter1> |
232 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
233 | bool operator>=(const __wrap_iter<_Iter1>& __x, const __wrap_iter<_Iter1>& __y) _NOEXCEPTnoexcept |
234 | { |
235 | return !(__x < __y); |
236 | } |
237 | |
238 | template <class _Iter1, class _Iter2> |
239 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
240 | bool operator>=(const __wrap_iter<_Iter1>& __x, const __wrap_iter<_Iter2>& __y) _NOEXCEPTnoexcept |
241 | { |
242 | return !(__x < __y); |
243 | } |
244 | |
245 | template <class _Iter1> |
246 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
247 | bool operator<=(const __wrap_iter<_Iter1>& __x, const __wrap_iter<_Iter1>& __y) _NOEXCEPTnoexcept |
248 | { |
249 | return !(__y < __x); |
250 | } |
251 | |
252 | template <class _Iter1, class _Iter2> |
253 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
254 | bool operator<=(const __wrap_iter<_Iter1>& __x, const __wrap_iter<_Iter2>& __y) _NOEXCEPTnoexcept |
255 | { |
256 | return !(__y < __x); |
257 | } |
258 | |
259 | template <class _Iter1, class _Iter2> |
260 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
261 | #ifndef _LIBCPP_CXX03_LANG |
262 | auto operator-(const __wrap_iter<_Iter1>& __x, const __wrap_iter<_Iter2>& __y) _NOEXCEPTnoexcept |
263 | -> decltype(__x.base() - __y.base()) |
264 | #else |
265 | typename __wrap_iter<_Iter1>::difference_type |
266 | operator-(const __wrap_iter<_Iter1>& __x, const __wrap_iter<_Iter2>& __y) _NOEXCEPTnoexcept |
267 | #endif // C++03 |
268 | { |
269 | #if _LIBCPP_DEBUG_LEVEL0 == 2 |
270 | _LIBCPP_ASSERT(__get_const_db()->__less_than_comparable(&__x, &__y),((void)0) |
271 | "Attempted to subtract incompatible iterators")((void)0); |
272 | #endif |
273 | return __x.base() - __y.base(); |
274 | } |
275 | |
276 | template <class _Iter1> |
277 | _LIBCPP_INLINE_VISIBILITY__attribute__ ((__visibility__("hidden"))) __attribute__ ((__exclude_from_explicit_instantiation__ )) _LIBCPP_CONSTEXPR_IF_NODEBUGconstexpr |
278 | __wrap_iter<_Iter1> operator+(typename __wrap_iter<_Iter1>::difference_type __n, __wrap_iter<_Iter1> __x) _NOEXCEPTnoexcept |
279 | { |
280 | __x += __n; |
281 | return __x; |
282 | } |
283 | |
284 | #if _LIBCPP_STD_VER14 <= 17 |
285 | template <class _It> |
286 | struct __is_cpp17_contiguous_iterator<__wrap_iter<_It> > : true_type {}; |
287 | #endif |
288 | |
289 | template <class _Iter> |
290 | _LIBCPP_CONSTEXPRconstexpr |
291 | decltype(_VSTDstd::__1::__to_address(declval<_Iter>())) |
292 | __to_address(__wrap_iter<_Iter> __w) _NOEXCEPTnoexcept { |
293 | return _VSTDstd::__1::__to_address(__w.base()); |
294 | } |
295 | |
296 | _LIBCPP_END_NAMESPACE_STD} } |
297 | |
298 | _LIBCPP_POP_MACROSpop_macro("min") pop_macro("max") |
299 | |
300 | #endif // _LIBCPP___ITERATOR_WRAP_ITER_H |
1 | //===- llvm/Analysis/VectorUtils.h - Vector utilities -----------*- C++ -*-===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | // |
9 | // This file defines some vectorizer utilities. |
10 | // |
11 | //===----------------------------------------------------------------------===// |
12 | |
13 | #ifndef LLVM_ANALYSIS_VECTORUTILS_H |
14 | #define LLVM_ANALYSIS_VECTORUTILS_H |
15 | |
16 | #include "llvm/ADT/MapVector.h" |
17 | #include "llvm/ADT/SmallVector.h" |
18 | #include "llvm/Analysis/LoopAccessAnalysis.h" |
19 | #include "llvm/Support/CheckedArithmetic.h" |
20 | |
21 | namespace llvm { |
22 | class TargetLibraryInfo; |
23 | |
24 | /// Describes the type of Parameters |
25 | enum class VFParamKind { |
26 | Vector, // No semantic information. |
27 | OMP_Linear, // declare simd linear(i) |
28 | OMP_LinearRef, // declare simd linear(ref(i)) |
29 | OMP_LinearVal, // declare simd linear(val(i)) |
30 | OMP_LinearUVal, // declare simd linear(uval(i)) |
31 | OMP_LinearPos, // declare simd linear(i:c) uniform(c) |
32 | OMP_LinearValPos, // declare simd linear(val(i:c)) uniform(c) |
33 | OMP_LinearRefPos, // declare simd linear(ref(i:c)) uniform(c) |
34 | OMP_LinearUValPos, // declare simd linear(uval(i:c)) uniform(c) |
35 | OMP_Uniform, // declare simd uniform(i) |
36 | GlobalPredicate, // Global logical predicate that acts on all lanes |
37 | // of the input and output mask concurrently. For |
38 | // example, it is implied by the `M` token in the |
39 | // Vector Function ABI mangled name. |
40 | Unknown |
41 | }; |
42 | |
43 | /// Describes the type of Instruction Set Architecture |
44 | enum class VFISAKind { |
45 | AdvancedSIMD, // AArch64 Advanced SIMD (NEON) |
46 | SVE, // AArch64 Scalable Vector Extension |
47 | SSE, // x86 SSE |
48 | AVX, // x86 AVX |
49 | AVX2, // x86 AVX2 |
50 | AVX512, // x86 AVX512 |
51 | LLVM, // LLVM internal ISA for functions that are not |
52 | // attached to an existing ABI via name mangling. |
53 | Unknown // Unknown ISA |
54 | }; |
55 | |
56 | /// Encapsulates information needed to describe a parameter. |
57 | /// |
58 | /// The description of the parameter is not linked directly to |
59 | /// OpenMP or any other vector function description. This structure |
60 | /// is extendible to handle other paradigms that describe vector |
61 | /// functions and their parameters. |
62 | struct VFParameter { |
63 | unsigned ParamPos; // Parameter Position in Scalar Function. |
64 | VFParamKind ParamKind; // Kind of Parameter. |
65 | int LinearStepOrPos = 0; // Step or Position of the Parameter. |
66 | Align Alignment = Align(); // Optional alignment in bytes, defaulted to 1. |
67 | |
68 | // Comparison operator. |
69 | bool operator==(const VFParameter &Other) const { |
70 | return std::tie(ParamPos, ParamKind, LinearStepOrPos, Alignment) == |
71 | std::tie(Other.ParamPos, Other.ParamKind, Other.LinearStepOrPos, |
72 | Other.Alignment); |
73 | } |
74 | }; |
75 | |
76 | /// Contains the information about the kind of vectorization |
77 | /// available. |
78 | /// |
79 | /// This object is independent of the paradigm used to |
80 | /// represent vector functions. In particular, it is not attached to |
81 | /// any target-specific ABI. |
82 | struct VFShape { |
83 | ElementCount VF; // Vectorization factor. |
84 | SmallVector<VFParameter, 8> Parameters; // List of parameter information. |
85 | // Comparison operator. |
86 | bool operator==(const VFShape &Other) const { |
87 | return std::tie(VF, Parameters) == std::tie(Other.VF, Other.Parameters); |
88 | } |
89 | |
90 | /// Update the parameter in position P.ParamPos to P. |
91 | void updateParam(VFParameter P) { |
92 | assert(P.ParamPos < Parameters.size() && "Invalid parameter position.")((void)0); |
93 | Parameters[P.ParamPos] = P; |
94 | assert(hasValidParameterList() && "Invalid parameter list")((void)0); |
95 | } |
96 | |
97 | // Retrieve the VFShape that can be used to map a (scalar) function to itself, |
98 | // with VF = 1. |
99 | static VFShape getScalarShape(const CallInst &CI) { |
100 | return VFShape::get(CI, ElementCount::getFixed(1), |
101 | /*HasGlobalPredicate*/ false); |
102 | } |
103 | |
104 | // Retrieve the basic vectorization shape of the function, where all |
105 | // parameters are mapped to VFParamKind::Vector with \p EC |
106 | // lanes. \p HasGlobalPred specifies whether the function has a Global |
107 | // Predicate argument. |
108 | static VFShape get(const CallInst &CI, ElementCount EC, bool HasGlobalPred) { |
109 | SmallVector<VFParameter, 8> Parameters; |
110 | for (unsigned I = 0; I < CI.arg_size(); ++I) |
111 | Parameters.push_back(VFParameter({I, VFParamKind::Vector})); |
112 | if (HasGlobalPred) |
113 | Parameters.push_back( |
114 | VFParameter({CI.arg_size(), VFParamKind::GlobalPredicate})); |
115 | |
116 | return {EC, Parameters}; |
117 | } |
118 | /// Sanity check on the Parameters in the VFShape. |
119 | bool hasValidParameterList() const; |
120 | }; |
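For example, assuming CI is a call with two arguments, the predicated 4-lane shape produced by VFShape::get maps both arguments to VFParamKind::Vector and appends a trailing GlobalPredicate parameter:

    VFShape S = VFShape::get(CI, ElementCount::getFixed(4),
                             /*HasGlobalPred=*/true);
    // S.VF == ElementCount::getFixed(4)
    // S.Parameters == { {0, Vector}, {1, Vector}, {2, GlobalPredicate} }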
121 | |
122 | /// Holds the VFShape for a specific scalar to vector function mapping. |
123 | struct VFInfo { |
124 | VFShape Shape; /// Classification of the vector function. |
125 | std::string ScalarName; /// Scalar Function Name. |
126 | std::string VectorName; /// Vector Function Name associated to this VFInfo. |
127 | VFISAKind ISA; /// Instruction Set Architecture. |
128 | }; |
129 | |
130 | namespace VFABI { |
131 | /// LLVM Internal VFABI ISA token for vector functions. |
132 | static constexpr char const *_LLVM_ = "_LLVM_"; |
133 | /// Prefix for internal name redirection for vector function that |
134 | /// tells the compiler to scalarize the call using the scalar name |
135 | /// of the function. For example, a mangled name like |
136 | /// `_ZGV_LLVM_N2v_foo(_LLVM_Scalarize_foo)` would tell the |
137 | /// vectorizer to vectorize the scalar call `foo`, and to scalarize |
138 | /// it once vectorization is done. |
139 | static constexpr char const *_LLVM_Scalarize_ = "_LLVM_Scalarize_"; |
140 | |
141 | /// Function to construct a VFInfo out of a mangled name in the |
142 | /// following format: |
143 | /// |
144 | /// <VFABI_name>{(<redirection>)} |
145 | /// |
146 | /// where <VFABI_name> is the name of the vector function, mangled according |
147 | /// to the rules described in the Vector Function ABI of the target vector |
148 | /// extension (or <isa> from now on). The <VFABI_name> is in the following |
149 | /// format: |
150 | /// |
151 | /// _ZGV<isa><mask><vlen><parameters>_<scalarname>[(<redirection>)] |
152 | /// |
153 | /// This method supports demangling rules for the following <isa>: |
154 | /// |
155 | /// * AArch64: https://developer.arm.com/docs/101129/latest |
156 | /// |
157 | /// * x86 (libmvec): https://sourceware.org/glibc/wiki/libmvec and |
158 | /// https://sourceware.org/glibc/wiki/libmvec?action=AttachFile&do=view&target=VectorABI.txt |
159 | /// |
160 | /// \param MangledName -> input string in the format |
161 | /// _ZGV<isa><mask><vlen><parameters>_<scalarname>[(<redirection>)]. |
162 | /// \param M -> Module used to retrieve information about the vector |
163 | /// function that cannot be retrieved from the mangled |
164 | /// name. At the moment, this parameter is needed only to retrieve the |
165 | /// Vectorization Factor of scalable vector functions from their |
166 | /// respective IR declarations. |
167 | Optional<VFInfo> tryDemangleForVFABI(StringRef MangledName, const Module &M); |
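A demangling sketch for an LLVM-internal name (the symbols are illustrative; M is assumed to be the enclosing Module and to declare "foo_vec2"):

    Optional<VFInfo> Info =
        VFABI::tryDemangleForVFABI("_ZGV_LLVM_N2v_foo(foo_vec2)", M);
    // On success: Info->ScalarName == "foo", Info->VectorName == "foo_vec2",
    // Info->Shape.VF == ElementCount::getFixed(2), and the single parameter
    // is VFParamKind::Vector.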
168 | |
169 | /// This routine mangles the given VectorName according to the LangRef |
170 | /// specification for vector-function-abi-variant attribute and is specific to |
171 | /// the TLI mappings. It is the responsibility of the caller to make sure that |
172 | /// this is only used if all parameters in the vector function are vector type. |
173 | /// This returned string holds scalar-to-vector mapping: |
174 | /// _ZGV<isa><mask><vlen><vparams>_<scalarname>(<vectorname>) |
175 | /// |
176 | /// where: |
177 | /// |
178 | /// <isa> = "_LLVM_" |
179 | /// <mask> = "N". Note: TLI does not support masked interfaces. |
180 | /// <vlen> = Number of concurrent lanes, stored in the `VectorizationFactor` |
181 | /// field of the `VecDesc` struct. If the number of lanes is scalable |
182 | /// then 'x' is printed instead. |
183 | /// <vparams> = "v", as many as are the numArgs. |
184 | /// <scalarname> = the name of the scalar function. |
185 | /// <vectorname> = the name of the vector function. |
186 | std::string mangleTLIVectorName(StringRef VectorName, StringRef ScalarName, |
187 | unsigned numArgs, ElementCount VF); |
188 | |
189 | /// Retrieve the `VFParamKind` from a string token. |
190 | VFParamKind getVFParamKindFromString(const StringRef Token); |
191 | |
192 | // Name of the attribute where the variant mappings are stored. |
193 | static constexpr char const *MappingsAttrName = "vector-function-abi-variant"; |
194 | |
195 | /// Populates a set of strings representing the Vector Function ABI variants |
196 | /// associated to the CallInst CI. If the CI does not contain the |
197 | /// vector-function-abi-variant attribute, we return without populating |
198 | /// VariantMappings, i.e. callers of getVectorVariantNames need not check for |
199 | /// the presence of the attribute (see InjectTLIMappings). |
200 | void getVectorVariantNames(const CallInst &CI, |
201 | SmallVectorImpl<std::string> &VariantMappings); |
202 | } // end namespace VFABI |
203 | |
204 | /// The Vector Function Database. |
205 | /// |
206 | /// Helper class used to find the vector functions associated to a |
207 | /// scalar CallInst. |
208 | class VFDatabase { |
209 | /// The Module of the CallInst CI. |
210 | const Module *M; |
211 | /// The CallInst instance being queried for scalar to vector mappings. |
212 | const CallInst &CI; |
213 | /// List of vector functions descriptors associated to the call |
214 | /// instruction. |
215 | const SmallVector<VFInfo, 8> ScalarToVectorMappings; |
216 | |
217 | /// Retrieve the scalar-to-vector mappings associated to the rules of |
218 | /// a Vector Function ABI. |
219 | static void getVFABIMappings(const CallInst &CI, |
220 | SmallVectorImpl<VFInfo> &Mappings) { |
221 | if (!CI.getCalledFunction()) |
222 | return; |
223 | |
224 | const StringRef ScalarName = CI.getCalledFunction()->getName(); |
225 | |
226 | SmallVector<std::string, 8> ListOfStrings; |
227 | // The check for the vector-function-abi-variant attribute is done when |
228 | // retrieving the vector variant names here. |
229 | VFABI::getVectorVariantNames(CI, ListOfStrings); |
230 | if (ListOfStrings.empty()) |
231 | return; |
232 | for (const auto &MangledName : ListOfStrings) { |
233 | const Optional<VFInfo> Shape = |
234 | VFABI::tryDemangleForVFABI(MangledName, *(CI.getModule())); |
235 | // A match is found via scalar and vector names, and also by |
236 | // ensuring that the variant described in the attribute has a |
237 | // corresponding definition or declaration of the vector |
238 | // function in the Module M. |
239 | if (Shape.hasValue() && (Shape.getValue().ScalarName == ScalarName)) { |
240 | assert(CI.getModule()->getFunction(Shape.getValue().VectorName) &&
241 | "Vector function is missing.");
242 | Mappings.push_back(Shape.getValue()); |
243 | } |
244 | } |
245 | } |
246 | |
247 | public: |
248 | /// Retrieve all the VFInfo instances associated to the CallInst CI. |
249 | static SmallVector<VFInfo, 8> getMappings(const CallInst &CI) { |
250 | SmallVector<VFInfo, 8> Ret; |
251 | |
252 | // Get mappings from the Vector Function ABI variants. |
253 | getVFABIMappings(CI, Ret); |
254 | |
255 | // Other non-VFABI variants should be retrieved here. |
256 | |
257 | return Ret; |
258 | } |
259 | |
260 | /// Constructor, requires a CallInst instance. |
261 | VFDatabase(CallInst &CI) |
262 | : M(CI.getModule()), CI(CI), |
263 | ScalarToVectorMappings(VFDatabase::getMappings(CI)) {} |
264 | /// \defgroup VFDatabase query interface. |
265 | /// |
266 | /// @{ |
267 | /// Retrieve the Function with VFShape \p Shape. |
268 | Function *getVectorizedFunction(const VFShape &Shape) const { |
269 | if (Shape == VFShape::getScalarShape(CI)) |
270 | return CI.getCalledFunction(); |
271 | |
272 | for (const auto &Info : ScalarToVectorMappings) |
273 | if (Info.Shape == Shape) |
274 | return M->getFunction(Info.VectorName); |
275 | |
276 | return nullptr; |
277 | } |
278 | /// @} |
279 | }; |
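// A minimal usage sketch of the database above. The function name is
// illustrative, and it assumes `Call` targets a function carrying the
// "vector-function-abi-variant" attribute and that VFShape::get (declared
// earlier in this header) is available.
inline Function *sketchLookupFourLaneVariant(CallInst &Call) {
  VFDatabase DB(Call);
  // Ask for an unmasked 4-lane shape of the same call.
  VFShape Shape =
      VFShape::get(Call, ElementCount::getFixed(4), /*HasGlobalPred=*/false);
  // Returns the vector Function declared/defined in the module, or nullptr
  // if no such mapping was recorded.
  return DB.getVectorizedFunction(Shape);
}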
280 | |
281 | template <typename T> class ArrayRef; |
282 | class DemandedBits; |
283 | class GetElementPtrInst; |
284 | template <typename InstTy> class InterleaveGroup; |
285 | class IRBuilderBase; |
286 | class Loop; |
287 | class ScalarEvolution; |
288 | class TargetTransformInfo; |
289 | class Type; |
290 | class Value; |
291 | |
292 | namespace Intrinsic { |
293 | typedef unsigned ID; |
294 | } |
295 | |
296 | /// A helper function for converting Scalar types to vector types. If |
297 | /// the incoming type is void, we return void. If the EC represents a |
298 | /// scalar, we return the scalar type. |
299 | inline Type *ToVectorTy(Type *Scalar, ElementCount EC) { |
300 | if (Scalar->isVoidTy() || Scalar->isMetadataTy() || EC.isScalar()) |
301 | return Scalar; |
302 | return VectorType::get(Scalar, EC); |
303 | } |
304 | |
305 | inline Type *ToVectorTy(Type *Scalar, unsigned VF) { |
306 | return ToVectorTy(Scalar, ElementCount::getFixed(VF)); |
307 | } |
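// For illustration (Ctx being some LLVMContext):
//   ToVectorTy(Type::getInt32Ty(Ctx), 4)              --> <4 x i32>
//   ToVectorTy(Type::getInt32Ty(Ctx),
//              ElementCount::getScalable(2))          --> <vscale x 2 x i32>
//   ToVectorTy(Type::getVoidTy(Ctx), 4)               --> void, returned as-is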
308 | |
309 | /// Identify if the intrinsic is trivially vectorizable. |
310 | /// This method returns true if the intrinsic's argument types are all scalars |
311 | /// for the scalar form of the intrinsic and all vectors (or scalars handled by |
312 | /// hasVectorInstrinsicScalarOpd) for the vector form of the intrinsic. |
313 | bool isTriviallyVectorizable(Intrinsic::ID ID); |
314 | |
315 | /// Identifies if the vector form of the intrinsic has a scalar operand. |
316 | bool hasVectorInstrinsicScalarOpd(Intrinsic::ID ID, unsigned ScalarOpdIdx); |
317 | |
318 | /// Identifies if the vector form of the intrinsic has a scalar operand that has |
319 | /// an overloaded type. |
320 | bool hasVectorInstrinsicOverloadedScalarOpd(Intrinsic::ID ID, |
321 | unsigned ScalarOpdIdx); |
322 | |
323 | /// Returns the intrinsic ID for the call.
324 | /// For the given call instruction it finds the corresponding intrinsic and
325 | /// returns its intrinsic ID; if no mapping is found, it returns not_intrinsic.
326 | Intrinsic::ID getVectorIntrinsicIDForCall(const CallInst *CI, |
327 | const TargetLibraryInfo *TLI); |
328 | |
329 | /// Find the operand of the GEP that should be checked for consecutive |
330 | /// stores. This ignores trailing indices that have no effect on the final |
331 | /// pointer. |
332 | unsigned getGEPInductionOperand(const GetElementPtrInst *Gep); |
333 | |
334 | /// If the argument is a GEP, then returns the operand identified by |
335 | /// getGEPInductionOperand. However, if there is some other non-loop-invariant |
336 | /// operand, it returns that instead. |
337 | Value *stripGetElementPtr(Value *Ptr, ScalarEvolution *SE, Loop *Lp); |
338 | |
339 | /// If a value has only one user that is a CastInst, return it. |
340 | Value *getUniqueCastUse(Value *Ptr, Loop *Lp, Type *Ty); |
341 | |
342 | /// Get the stride of a pointer access in a loop. Looks for symbolic |
343 | /// strides "a[i*stride]". Returns the symbolic stride, or null otherwise. |
344 | Value *getStrideFromPointer(Value *Ptr, ScalarEvolution *SE, Loop *Lp); |
345 | |
346 | /// Given a vector and an element number, see if the scalar value is |
347 | /// already around as a register, for example if it were inserted then extracted |
348 | /// from the vector. |
349 | Value *findScalarElement(Value *V, unsigned EltNo); |
350 | |
351 | /// If all non-negative \p Mask elements are the same value, return that value. |
352 | /// If all elements are negative (undefined) or \p Mask contains different |
353 | /// non-negative values, return -1. |
354 | int getSplatIndex(ArrayRef<int> Mask); |
355 | |
356 | /// Get splat value if the input is a splat vector or return nullptr. |
357 | /// The value may be extracted from a splat constants vector or from |
358 | /// a sequence of instructions that broadcast a single value into a vector. |
359 | Value *getSplatValue(const Value *V); |
360 | |
361 | /// Return true if each element of the vector value \p V is poisoned or equal to |
362 | /// every other non-poisoned element. If an index element is specified, either |
363 | /// every element of the vector is poisoned or the element at that index is not |
364 | /// poisoned and equal to every other non-poisoned element. |
365 | /// This may be more powerful than the related getSplatValue() because it is |
366 | /// not limited by finding a scalar source value to a splatted vector. |
367 | bool isSplatValue(const Value *V, int Index = -1, unsigned Depth = 0); |
368 | |
369 | /// Replace each shuffle mask index with the scaled sequential indices for an |
370 | /// equivalent mask of narrowed elements. Mask elements that are less than 0 |
371 | /// (sentinel values) are repeated in the output mask. |
372 | /// |
373 | /// Example with Scale = 4: |
374 | /// <4 x i32> <3, 2, 0, -1> --> |
375 | /// <16 x i8> <12, 13, 14, 15, 8, 9, 10, 11, 0, 1, 2, 3, -1, -1, -1, -1> |
376 | /// |
377 | /// This is the reverse process of widening shuffle mask elements, but it always |
378 | /// succeeds because the indexes can always be multiplied (scaled up) to map to |
379 | /// narrower vector elements. |
380 | void narrowShuffleMaskElts(int Scale, ArrayRef<int> Mask, |
381 | SmallVectorImpl<int> &ScaledMask); |
382 | |
383 | /// Try to transform a shuffle mask by replacing elements with the scaled index |
384 | /// for an equivalent mask of widened elements. If all mask elements that would |
385 | /// map to a wider element of the new mask are the same negative number |
386 | /// (sentinel value), that element of the new mask is the same value. If any |
387 | /// element in a given slice is negative and some other element in that slice is |
388 | /// not the same value, return false (partial matches with sentinel values are |
389 | /// not allowed). |
390 | /// |
391 | /// Example with Scale = 4: |
392 | /// <16 x i8> <12, 13, 14, 15, 8, 9, 10, 11, 0, 1, 2, 3, -1, -1, -1, -1> --> |
393 | /// <4 x i32> <3, 2, 0, -1> |
394 | /// |
395 | /// This is the reverse process of narrowing shuffle mask elements if it |
396 | /// succeeds. This transform is not always possible because indexes may not |
397 | /// divide evenly (scale down) to map to wider vector elements. |
398 | bool widenShuffleMaskElts(int Scale, ArrayRef<int> Mask, |
399 | SmallVectorImpl<int> &ScaledMask); |
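// A sketch of the round trip between narrowShuffleMaskElts and
// widenShuffleMaskElts, using the documented example (the helper name is
// illustrative; SmallVector/ArrayRef are assumed available, as elsewhere in
// this header):
inline bool sketchMaskNarrowWidenRoundTrip() {
  SmallVector<int, 4> Original = {3, 2, 0, -1};
  SmallVector<int, 16> Narrow;
  narrowShuffleMaskElts(4, Original, Narrow);
  // Narrow == {12,13,14,15, 8,9,10,11, 0,1,2,3, -1,-1,-1,-1}
  SmallVector<int, 4> Widened;
  bool Succeeded = widenShuffleMaskElts(4, Narrow, Widened);
  // Succeeded is true and Widened == {3, 2, 0, -1} again.
  return Succeeded;
}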
400 | |
401 | /// Compute a map of integer instructions to their minimum legal type |
402 | /// size. |
403 | /// |
404 | /// C semantics force sub-int-sized values (e.g. i8, i16) to be promoted to int |
405 | /// type (e.g. i32) whenever arithmetic is performed on them. |
406 | /// |
407 | /// For targets with native i8 or i16 operations, usually InstCombine can shrink |
408 | /// the arithmetic type down again. However InstCombine refuses to create |
409 | /// illegal types, so for targets without i8 or i16 registers, the lengthening |
410 | /// and shrinking remain.
411 | /// |
412 | /// Most SIMD ISAs (e.g. NEON) however support vectors of i8 or i16 even when |
413 | /// their scalar equivalents do not, so during vectorization it is important to |
414 | /// remove these extensions and truncations when deciding the profitability of
415 | /// vectorization. |
416 | /// |
417 | /// This function analyzes the given range of instructions and determines the |
418 | /// minimum type size each can be converted to. It attempts to remove or |
419 | /// minimize type size changes across each def-use chain, so for example in the |
420 | /// following code: |
421 | /// |
422 | /// %1 = load i8, i8* |
423 | /// %2 = add i8 %1, 2 |
424 | /// %3 = load i16, i16* |
425 | /// %4 = zext i8 %2 to i32 |
426 | /// %5 = zext i16 %3 to i32 |
427 | /// %6 = add i32 %4, %5 |
428 | /// %7 = trunc i32 %6 to i16 |
429 | /// |
430 | /// Instruction %6 must be done at least in i16, so computeMinimumValueSizes |
431 | /// will return: {%1: 16, %2: 16, %3: 16, %4: 16, %5: 16, %6: 16, %7: 16}. |
432 | /// |
433 | /// If the optional TargetTransformInfo is provided, this function tries harder |
434 | /// to do less work by only looking at illegal types. |
435 | MapVector<Instruction*, uint64_t> |
436 | computeMinimumValueSizes(ArrayRef<BasicBlock*> Blocks, |
437 | DemandedBits &DB, |
438 | const TargetTransformInfo *TTI=nullptr); |
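// A typical call, sketched (the Loop and analyses come from the caller's own
// pass pipeline; TheLoop, DB and TTI are illustrative names):
//   MapVector<Instruction *, uint64_t> MinBWs =
//       computeMinimumValueSizes(TheLoop->getBlocks(), DB, &TTI);
//   // For the IR in the example above, each of %1..%7 maps to 16, i.e. the
//   // whole chain can be evaluated in i16 lanes.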
439 | |
440 | /// Compute the union of two access-group lists. |
441 | /// |
442 | /// If the list contains just one access group, it is returned directly. If the |
443 | /// list is empty, returns nullptr. |
444 | MDNode *uniteAccessGroups(MDNode *AccGroups1, MDNode *AccGroups2); |
445 | |
446 | /// Compute the access-group list of access groups that @p Inst1 and @p Inst2 |
447 | /// are both in. If either instruction does not access memory at all, it is |
448 | /// considered to be in every list. |
449 | /// |
450 | /// If the list contains just one access group, it is returned directly. If the |
451 | /// list is empty, returns nullptr. |
452 | MDNode *intersectAccessGroups(const Instruction *Inst1, |
453 | const Instruction *Inst2); |
454 | |
455 | /// Specifically, let Kinds = [MD_tbaa, MD_alias_scope, MD_noalias, MD_fpmath, |
456 | /// MD_nontemporal, MD_access_group]. |
457 | /// For K in Kinds, we get the MDNode for K from each of the |
458 | /// elements of VL, compute their "intersection" (i.e., the most generic |
459 | /// metadata value that covers all of the individual values), and set I's |
460 | /// metadata for M equal to the intersection value. |
461 | /// |
462 | /// This function always sets a (possibly null) value for each K in Kinds. |
463 | Instruction *propagateMetadata(Instruction *I, ArrayRef<Value *> VL); |
464 | |
465 | /// Create a mask that filters the members of an interleave group where there |
466 | /// are gaps. |
467 | /// |
468 | /// For example, the mask for \p Group with interleave-factor 3 |
469 | /// and \p VF 4, that has only its first member present is: |
470 | /// |
471 | /// <1,0,0,1,0,0,1,0,0,1,0,0> |
472 | /// |
473 | /// Note: The result is a mask of 0's and 1's, as opposed to the other |
474 | /// create[*]Mask() utilities which create a shuffle mask (mask that |
475 | /// consists of indices). |
476 | Constant *createBitMaskForGaps(IRBuilderBase &Builder, unsigned VF, |
477 | const InterleaveGroup<Instruction> &Group); |
478 | |
479 | /// Create a mask with replicated elements. |
480 | /// |
481 | /// This function creates a shuffle mask for replicating each of the \p VF |
482 | /// elements in a vector \p ReplicationFactor times. It can be used to |
483 | /// transform a mask of \p VF elements into a mask of |
484 | /// \p VF * \p ReplicationFactor elements used by a predicated |
485 | /// interleaved group of loads/stores whose interleave factor ==
486 | /// \p ReplicationFactor. |
487 | /// |
488 | /// For example, the mask for \p ReplicationFactor=3 and \p VF=4 is: |
489 | /// |
490 | /// <0,0,0,1,1,1,2,2,2,3,3,3> |
491 | llvm::SmallVector<int, 16> createReplicatedMask(unsigned ReplicationFactor, |
492 | unsigned VF); |
493 | |
494 | /// Create an interleave shuffle mask. |
495 | /// |
496 | /// This function creates a shuffle mask for interleaving \p NumVecs vectors of |
497 | /// vectorization factor \p VF into a single wide vector. The mask is of the |
498 | /// form: |
499 | /// |
500 | /// <0, VF, VF * 2, ..., VF * (NumVecs - 1), 1, VF + 1, VF * 2 + 1, ...> |
501 | /// |
502 | /// For example, the mask for VF = 4 and NumVecs = 2 is: |
503 | /// |
504 | /// <0, 4, 1, 5, 2, 6, 3, 7>. |
505 | llvm::SmallVector<int, 16> createInterleaveMask(unsigned VF, unsigned NumVecs); |
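// For instance, createInterleaveMask(4, 2) == {0, 4, 1, 5, 2, 6, 3, 7}; used
// as a shufflevector mask it interleaves two <4 x T> operands lane by lane:
//
//   %wide = shufflevector <4 x i32> %a, <4 x i32> %b,
//                         <8 x i32> <i32 0, i32 4, i32 1, i32 5,
//                                    i32 2, i32 6, i32 3, i32 7>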
506 | |
507 | /// Create a stride shuffle mask. |
508 | /// |
509 | /// This function creates a shuffle mask whose elements begin at \p Start and |
510 | /// are incremented by \p Stride. The mask can be used to deinterleave an |
511 | /// interleaved vector into separate vectors of vectorization factor \p VF. The |
512 | /// mask is of the form: |
513 | /// |
514 | /// <Start, Start + Stride, ..., Start + Stride * (VF - 1)> |
515 | /// |
516 | /// For example, the mask for Start = 0, Stride = 2, and VF = 4 is: |
517 | /// |
518 | /// <0, 2, 4, 6> |
519 | llvm::SmallVector<int, 16> createStrideMask(unsigned Start, unsigned Stride, |
520 | unsigned VF); |
521 | |
522 | /// Create a sequential shuffle mask. |
523 | /// |
524 | /// This function creates a shuffle mask whose elements are sequential and begin
525 | /// at \p Start. The mask contains \p NumInts integers and is padded with \p |
526 | /// NumUndefs undef values. The mask is of the form: |
527 | /// |
528 | /// <Start, Start + 1, ... Start + NumInts - 1, undef_1, ... undef_NumUndefs> |
529 | /// |
530 | /// For example, the mask for Start = 0, NumInts = 4, and NumUndefs = 4 is:
531 | /// |
532 | /// <0, 1, 2, 3, undef, undef, undef, undef> |
533 | llvm::SmallVector<int, 16> |
534 | createSequentialMask(unsigned Start, unsigned NumInts, unsigned NumUndefs); |
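// Conversely, createStrideMask(0, 2, 4) == {0, 2, 4, 6} picks the even lanes
// back out of an 8-wide value, and createSequentialMask(0, 4, 4) yields
// {0, 1, 2, 3} followed by four undef lanes (encoded as -1 in these masks):
//
//   %even = shufflevector <8 x i32> %wide, <8 x i32> undef,
//                         <4 x i32> <i32 0, i32 2, i32 4, i32 6>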
535 | |
536 | /// Concatenate a list of vectors. |
537 | /// |
538 | /// This function generates code that concatenates the vectors in \p Vecs into a
539 | /// single large vector. The number of vectors should be greater than one, and |
540 | /// their element types should be the same. The number of elements in the |
541 | /// vectors should also be the same; however, if the last vector has fewer |
542 | /// elements, it will be padded with undefs. |
543 | Value *concatenateVectors(IRBuilderBase &Builder, ArrayRef<Value *> Vecs); |
544 | |
545 | /// Given a mask vector of i1, return true if all of the elements of this
546 | /// predicate mask are known to be false or undef. That is, return true if all |
547 | /// lanes can be assumed inactive. |
548 | bool maskIsAllZeroOrUndef(Value *Mask); |
549 | |
550 | /// Given a mask vector of i1, return true if all of the elements of this
551 | /// predicate mask are known to be true or undef. That is, return true if all |
552 | /// lanes can be assumed active. |
553 | bool maskIsAllOneOrUndef(Value *Mask); |
554 | |
555 | /// Given a mask vector of the form <Y x i1>, return an APInt (of bitwidth Y) |
556 | /// for each lane which may be active. |
557 | APInt possiblyDemandedEltsInMask(Value *Mask); |
558 | |
559 | /// The group of interleaved loads/stores sharing the same stride and |
560 | /// close to each other. |
561 | /// |
562 | /// Each member in this group has an index starting from 0, and the largest |
563 | /// index should be less than the interleave factor, which is equal to the absolute
564 | /// value of the access's stride. |
565 | /// |
566 | /// E.g. An interleaved load group of factor 4: |
567 | /// for (unsigned i = 0; i < 1024; i+=4) { |
568 | /// a = A[i]; // Member of index 0 |
569 | /// b = A[i+1]; // Member of index 1 |
570 | /// d = A[i+3]; // Member of index 3 |
571 | /// ... |
572 | /// } |
573 | /// |
574 | /// An interleaved store group of factor 4: |
575 | /// for (unsigned i = 0; i < 1024; i+=4) { |
576 | /// ... |
577 | /// A[i] = a; // Member of index 0 |
578 | /// A[i+1] = b; // Member of index 1 |
579 | /// A[i+2] = c; // Member of index 2 |
580 | /// A[i+3] = d; // Member of index 3 |
581 | /// } |
582 | /// |
583 | /// Note: the interleaved load group could have gaps (missing members), but |
584 | /// the interleaved store group doesn't allow gaps. |
585 | template <typename InstTy> class InterleaveGroup { |
586 | public: |
587 | InterleaveGroup(uint32_t Factor, bool Reverse, Align Alignment) |
588 | : Factor(Factor), Reverse(Reverse), Alignment(Alignment), |
589 | InsertPos(nullptr) {} |
590 | |
591 | InterleaveGroup(InstTy *Instr, int32_t Stride, Align Alignment) |
592 | : Alignment(Alignment), InsertPos(Instr) { |
593 | Factor = std::abs(Stride); |
594 | assert(Factor > 1 && "Invalid interleave factor");
595 | |
596 | Reverse = Stride < 0; |
597 | Members[0] = Instr; |
598 | } |
599 | |
600 | bool isReverse() const { return Reverse; } |
601 | uint32_t getFactor() const { return Factor; } |
602 | Align getAlign() const { return Alignment; } |
603 | uint32_t getNumMembers() const { return Members.size(); } |
604 | |
605 | /// Try to insert a new member \p Instr with index \p Index and |
606 | /// alignment \p NewAlign. The index is relative to the current leader and may
607 | /// be negative if \p Instr becomes the new leader.
608 | /// |
609 | /// \returns false if the instruction doesn't belong to the group. |
610 | bool insertMember(InstTy *Instr, int32_t Index, Align NewAlign) { |
611 | // Make sure the key fits in an int32_t. |
612 | Optional<int32_t> MaybeKey = checkedAdd(Index, SmallestKey); |
613 | if (!MaybeKey) |
614 | return false; |
615 | int32_t Key = *MaybeKey; |
616 | |
617 | // Skip if the key is used for either the tombstone or empty special values. |
618 | if (DenseMapInfo<int32_t>::getTombstoneKey() == Key || |
619 | DenseMapInfo<int32_t>::getEmptyKey() == Key) |
620 | return false; |
621 | |
622 | // Skip if there is already a member with the same index. |
623 | if (Members.find(Key) != Members.end()) |
624 | return false; |
625 | |
626 | if (Key > LargestKey) { |
627 | // The largest index is always less than the interleave factor. |
628 | if (Index >= static_cast<int32_t>(Factor)) |
629 | return false; |
630 | |
631 | LargestKey = Key; |
632 | } else if (Key < SmallestKey) { |
633 | |
634 | // Make sure the largest index fits in an int32_t. |
635 | Optional<int32_t> MaybeLargestIndex = checkedSub(LargestKey, Key); |
636 | if (!MaybeLargestIndex) |
637 | return false; |
638 | |
639 | // The largest index is always less than the interleave factor. |
640 | if (*MaybeLargestIndex >= static_cast<int64_t>(Factor)) |
641 | return false; |
642 | |
643 | SmallestKey = Key; |
644 | } |
645 | |
646 | // It's always safe to select the minimum alignment. |
647 | Alignment = std::min(Alignment, NewAlign); |
648 | Members[Key] = Instr; |
649 | return true; |
650 | } |
651 | |
652 | /// Get the member with the given index \p Index |
653 | /// |
654 | /// \returns nullptr if the group contains no such member.
655 | InstTy *getMember(uint32_t Index) const { |
656 | int32_t Key = SmallestKey + Index; |
657 | return Members.lookup(Key); |
658 | } |
659 | |
660 | /// Get the index for the given member. Unlike the key in the member |
661 | /// map, the index starts from 0. |
662 | uint32_t getIndex(const InstTy *Instr) const { |
663 | for (auto I : Members) { |
664 | if (I.second == Instr) |
665 | return I.first - SmallestKey; |
666 | } |
667 | |
668 | llvm_unreachable("InterleaveGroup contains no such member");
669 | } |
670 | |
671 | InstTy *getInsertPos() const { return InsertPos; } |
672 | void setInsertPos(InstTy *Inst) { InsertPos = Inst; } |
673 | |
674 | /// Add metadata (e.g. alias info) from the instructions in this group to \p |
675 | /// NewInst. |
676 | /// |
677 | /// FIXME: this function currently does not add noalias metadata a la
678 | /// addNewMedata. To do that we need to compute the intersection of the |
679 | /// noalias info from all members. |
680 | void addMetadata(InstTy *NewInst) const; |
681 | |
682 | /// Returns true if this Group requires a scalar iteration to handle gaps. |
683 | bool requiresScalarEpilogue() const { |
684 | // If the last member of the Group exists, then a scalar epilog is not |
685 | // needed for this group. |
686 | if (getMember(getFactor() - 1)) |
687 | return false; |
688 | |
689 | // We have a group with gaps. It therefore cannot be a group of stores, |
690 | // and it can't be a reversed access, because such groups get invalidated. |
691 | assert(!getMember(0)->mayWriteToMemory() &&
692 | "Group should have been invalidated");
693 | assert(!isReverse() && "Group should have been invalidated");
694 | |
695 | // This is a group of loads, with gaps, and without a last member.
696 | return true; |
697 | } |
698 | |
699 | private: |
700 | uint32_t Factor; // Interleave Factor. |
701 | bool Reverse; |
702 | Align Alignment; |
703 | DenseMap<int32_t, InstTy *> Members; |
704 | int32_t SmallestKey = 0; |
705 | int32_t LargestKey = 0; |
706 | |
707 | // To avoid breaking dependences, vectorized instructions of an interleave |
708 | // group should be inserted at either the first load or the last store in |
709 | // program order. |
710 | // |
711 | // E.g. %even = load i32 // Insert Position |
712 | // %add = add i32 %even // Use of %even |
713 | // %odd = load i32 |
714 | // |
715 | // store i32 %even |
716 | // %odd = add i32 // Def of %odd |
717 | // store i32 %odd // Insert Position |
718 | InstTy *InsertPos; |
719 | }; |
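// A sketch of how a stride-4 load group with a gap is assembled (the function
// name is illustrative; real construction happens in InterleavedAccessInfo
// below). A0, A1 and A3 are assumed to be the loads of A[i], A[i+1] and
// A[i+3] from the example above.
inline void sketchBuildLoadGroup(Instruction *A0, Instruction *A1,
                                 Instruction *A3) {
  InterleaveGroup<Instruction> Group(A0, /*Stride=*/4, Align(4));
  Group.insertMember(A1, /*Index=*/1, Align(4)); // index relative to A0
  Group.insertMember(A3, /*Index=*/3, Align(4));
  // Group.getMember(2) is now nullptr: the gap at A[i+2]. Because the last
  // member (index Factor - 1 == 3) is present, requiresScalarEpilogue() is
  // false for this particular group.
}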
720 | |
721 | /// Drive the analysis of interleaved memory accesses in the loop. |
722 | /// |
723 | /// Use this class to analyze interleaved accesses only when we can vectorize |
724 | /// a loop. Otherwise it's meaningless to do analysis as the vectorization |
725 | /// on interleaved accesses is unsafe. |
726 | /// |
727 | /// The analysis collects interleave groups and records the relationships |
728 | /// between the member and the group in a map. |
729 | class InterleavedAccessInfo { |
730 | public: |
731 | InterleavedAccessInfo(PredicatedScalarEvolution &PSE, Loop *L, |
732 | DominatorTree *DT, LoopInfo *LI, |
733 | const LoopAccessInfo *LAI) |
734 | : PSE(PSE), TheLoop(L), DT(DT), LI(LI), LAI(LAI) {} |
735 | |
736 | ~InterleavedAccessInfo() { invalidateGroups(); } |
737 | |
738 | /// Analyze the interleaved accesses and collect them in interleave |
739 | /// groups. Substitute symbolic strides using \p Strides. |
740 | /// Consider also predicated loads/stores in the analysis if |
741 | /// \p EnableMaskedInterleavedGroup is true. |
742 | void analyzeInterleaving(bool EnableMaskedInterleavedGroup); |
743 | |
744 | /// Invalidate groups, e.g., in case all blocks in the loop will be predicated
745 | /// contrary to the original assumption. Although we currently prevent group
746 | /// formation for predicated accesses, we may be able to relax this limitation |
747 | /// in the future once we handle more complicated blocks. Returns true if any |
748 | /// groups were invalidated. |
749 | bool invalidateGroups() { |
750 | if (InterleaveGroups.empty()) { |
751 | assert(
752 | !RequiresScalarEpilogue &&
753 | "RequiresScalarEpilog should not be set without interleave groups");
754 | return false; |
755 | } |
756 | |
757 | InterleaveGroupMap.clear(); |
758 | for (auto *Ptr : InterleaveGroups) |
759 | delete Ptr; |
760 | InterleaveGroups.clear(); |
761 | RequiresScalarEpilogue = false; |
762 | return true; |
763 | } |
764 | |
765 | /// Check if \p Instr belongs to any interleave group. |
766 | bool isInterleaved(Instruction *Instr) const { |
767 | return InterleaveGroupMap.find(Instr) != InterleaveGroupMap.end(); |
768 | } |
769 | |
770 | /// Get the interleave group that \p Instr belongs to. |
771 | /// |
772 | /// \returns nullptr if \p Instr does not belong to any interleave group.
773 | InterleaveGroup<Instruction> * |
774 | getInterleaveGroup(const Instruction *Instr) const { |
775 | return InterleaveGroupMap.lookup(Instr); |
776 | } |
777 | |
778 | iterator_range<SmallPtrSetIterator<llvm::InterleaveGroup<Instruction> *>> |
779 | getInterleaveGroups() { |
780 | return make_range(InterleaveGroups.begin(), InterleaveGroups.end()); |
781 | } |
782 | |
783 | /// Returns true if an interleaved group that may access memory |
784 | /// out-of-bounds requires a scalar epilogue iteration for correctness. |
785 | bool requiresScalarEpilogue() const { return RequiresScalarEpilogue; } |
786 | |
787 | /// Invalidate groups that require a scalar epilogue (due to gaps). This can |
788 | /// happen when optimizing for size forbids a scalar epilogue, and the gap |
789 | /// cannot be filtered by masking the load/store. |
790 | void invalidateGroupsRequiringScalarEpilogue(); |
791 | |
792 | private: |
793 | /// A wrapper around ScalarEvolution, used to add runtime SCEV checks. |
794 | /// Simplifies SCEV expressions in the context of existing SCEV assumptions. |
795 | /// The interleaved access analysis can also add new predicates (for example |
796 | /// by versioning strides of pointers). |
797 | PredicatedScalarEvolution &PSE; |
798 | |
799 | Loop *TheLoop; |
800 | DominatorTree *DT; |
801 | LoopInfo *LI; |
802 | const LoopAccessInfo *LAI; |
803 | |
804 | /// True if the loop may contain non-reversed interleaved groups with |
805 | /// out-of-bounds accesses. We ensure we don't speculatively access memory |
806 | /// out-of-bounds by executing at least one scalar epilogue iteration. |
807 | bool RequiresScalarEpilogue = false; |
808 | |
809 | /// Holds the relationships between the members and the interleave group. |
810 | DenseMap<Instruction *, InterleaveGroup<Instruction> *> InterleaveGroupMap; |
811 | |
812 | SmallPtrSet<InterleaveGroup<Instruction> *, 4> InterleaveGroups; |
813 | |
814 | /// Holds dependences among the memory accesses in the loop. It maps a source |
815 | /// access to a set of dependent sink accesses. |
816 | DenseMap<Instruction *, SmallPtrSet<Instruction *, 2>> Dependences; |
817 | |
818 | /// The descriptor for a strided memory access. |
819 | struct StrideDescriptor { |
820 | StrideDescriptor() = default; |
821 | StrideDescriptor(int64_t Stride, const SCEV *Scev, uint64_t Size, |
822 | Align Alignment) |
823 | : Stride(Stride), Scev(Scev), Size(Size), Alignment(Alignment) {} |
824 | |
825 | // The access's stride. It is negative for a reverse access. |
826 | int64_t Stride = 0; |
827 | |
828 | // The scalar expression of this access. |
829 | const SCEV *Scev = nullptr; |
830 | |
831 | // The size of the memory object. |
832 | uint64_t Size = 0; |
833 | |
834 | // The alignment of this access. |
835 | Align Alignment; |
836 | }; |
837 | |
838 | /// A type for holding instructions and their stride descriptors. |
839 | using StrideEntry = std::pair<Instruction *, StrideDescriptor>; |
840 | |
841 | /// Create a new interleave group with the given instruction \p Instr, |
842 | /// stride \p Stride and alignment \p Align. |
843 | /// |
844 | /// \returns the newly created interleave group. |
845 | InterleaveGroup<Instruction> * |
846 | createInterleaveGroup(Instruction *Instr, int Stride, Align Alignment) { |
847 | assert(!InterleaveGroupMap.count(Instr) &&
848 | "Already in an interleaved access group");
849 | InterleaveGroupMap[Instr] = |
850 | new InterleaveGroup<Instruction>(Instr, Stride, Alignment); |
851 | InterleaveGroups.insert(InterleaveGroupMap[Instr]); |
852 | return InterleaveGroupMap[Instr]; |
853 | } |
854 | |
855 | /// Release the group and remove all the relationships. |
856 | void releaseGroup(InterleaveGroup<Instruction> *Group) { |
857 | for (unsigned i = 0; i < Group->getFactor(); i++) |
858 | if (Instruction *Member = Group->getMember(i)) |
859 | InterleaveGroupMap.erase(Member); |
860 | |
861 | InterleaveGroups.erase(Group); |
862 | delete Group; |
863 | } |
864 | |
865 | /// Collect all the accesses with a constant stride in program order. |
866 | void collectConstStrideAccesses( |
867 | MapVector<Instruction *, StrideDescriptor> &AccessStrideInfo, |
868 | const ValueToValueMap &Strides); |
869 | |
870 | /// Returns true if \p Stride is allowed in an interleaved group. |
871 | static bool isStrided(int Stride); |
872 | |
873 | /// Returns true if \p BB is a predicated block. |
874 | bool isPredicated(BasicBlock *BB) const { |
875 | return LoopAccessInfo::blockNeedsPredication(BB, TheLoop, DT); |
876 | } |
877 | |
878 | /// Returns true if LoopAccessInfo can be used for dependence queries. |
879 | bool areDependencesValid() const { |
880 | return LAI && LAI->getDepChecker().getDependences(); |
881 | } |
882 | |
883 | /// Returns true if memory accesses \p A and \p B can be reordered, if |
884 | /// necessary, when constructing interleaved groups. |
885 | /// |
886 | /// \p A must precede \p B in program order. We return false if reordering is |
887 | /// not necessary or is prevented because \p A and \p B may be dependent. |
888 | bool canReorderMemAccessesForInterleavedGroups(StrideEntry *A, |
889 | StrideEntry *B) const { |
890 | // Code motion for interleaved accesses can potentially hoist strided loads |
891 | // and sink strided stores. The code below checks the legality of the |
892 | // following two conditions: |
893 | // |
894 | // 1. Potentially moving a strided load (B) before any store (A) that |
895 | // precedes B, or |
896 | // |
897 | // 2. Potentially moving a strided store (A) after any load or store (B) |
898 | // that A precedes. |
899 | // |
900 | // It's legal to reorder A and B if we know there isn't a dependence from A |
901 | // to B. Note that this determination is conservative since some |
902 | // dependences could potentially be reordered safely. |
903 | |
904 | // A is potentially the source of a dependence. |
905 | auto *Src = A->first; |
906 | auto SrcDes = A->second; |
907 | |
908 | // B is potentially the sink of a dependence. |
909 | auto *Sink = B->first; |
910 | auto SinkDes = B->second; |
911 | |
912 | // Code motion for interleaved accesses can't violate WAR dependences. |
913 | // Thus, reordering is legal if the source isn't a write. |
914 | if (!Src->mayWriteToMemory()) |
915 | return true; |
916 | |
917 | // At least one of the accesses must be strided. |
918 | if (!isStrided(SrcDes.Stride) && !isStrided(SinkDes.Stride)) |
919 | return true; |
920 | |
921 | // If dependence information is not available from LoopAccessInfo, |
922 | // conservatively assume the instructions can't be reordered. |
923 | if (!areDependencesValid()) |
924 | return false; |
925 | |
926 | // If we know there is a dependence from source to sink, assume the |
927 | // instructions can't be reordered. Otherwise, reordering is legal. |
928 | return Dependences.find(Src) == Dependences.end() || |
929 | !Dependences.lookup(Src).count(Sink); |
930 | } |
931 | |
932 | /// Collect the dependences from LoopAccessInfo. |
933 | /// |
934 | /// We process the dependences once during the interleaved access analysis to |
935 | /// enable constant-time dependence queries. |
936 | void collectDependences() { |
937 | if (!areDependencesValid()) |
938 | return; |
939 | auto *Deps = LAI->getDepChecker().getDependences(); |
940 | for (auto Dep : *Deps) |
941 | Dependences[Dep.getSource(*LAI)].insert(Dep.getDestination(*LAI)); |
942 | } |
943 | }; |
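// A sketch of driving the analysis above (illustrative only; the loop
// vectorizers construct this with their own analysis results in hand):
inline void sketchAnalyzeInterleaving(PredicatedScalarEvolution &PSE, Loop *L,
                                      DominatorTree *DT, LoopInfo *LI,
                                      const LoopAccessInfo *LAI) {
  InterleavedAccessInfo IAI(PSE, L, DT, LI, LAI);
  IAI.analyzeInterleaving(/*EnableMaskedInterleavedGroup=*/false);
  for (auto *Group : IAI.getInterleaveGroups()) {
    // Each collected group can now be queried for its factor, members, gaps
    // and insertion point.
    (void)Group->getFactor();
  }
}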
944 | |
945 | } // llvm namespace |
946 | |
947 | #endif |
1 | //===- llvm/ADT/DenseMap.h - Dense probed hash table ------------*- C++ -*-===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | // |
9 | // This file defines the DenseMap class. |
10 | // |
11 | //===----------------------------------------------------------------------===// |
12 | |
13 | #ifndef LLVM_ADT_DENSEMAP_H |
14 | #define LLVM_ADT_DENSEMAP_H |
15 | |
16 | #include "llvm/ADT/DenseMapInfo.h" |
17 | #include "llvm/ADT/EpochTracker.h" |
18 | #include "llvm/Support/AlignOf.h" |
19 | #include "llvm/Support/Compiler.h" |
20 | #include "llvm/Support/MathExtras.h" |
21 | #include "llvm/Support/MemAlloc.h" |
22 | #include "llvm/Support/ReverseIteration.h" |
23 | #include "llvm/Support/type_traits.h" |
24 | #include <algorithm> |
25 | #include <cassert> |
26 | #include <cstddef> |
27 | #include <cstring> |
28 | #include <initializer_list> |
29 | #include <iterator> |
30 | #include <new> |
31 | #include <type_traits> |
32 | #include <utility> |
33 | |
34 | namespace llvm { |
35 | |
36 | namespace detail { |
37 | |
38 | // We extend a pair to allow users to override the bucket type with their own |
39 | // implementation without requiring two members. |
40 | template <typename KeyT, typename ValueT> |
41 | struct DenseMapPair : public std::pair<KeyT, ValueT> { |
42 | using std::pair<KeyT, ValueT>::pair; |
43 | |
44 | KeyT &getFirst() { return std::pair<KeyT, ValueT>::first; } |
45 | const KeyT &getFirst() const { return std::pair<KeyT, ValueT>::first; } |
46 | ValueT &getSecond() { return std::pair<KeyT, ValueT>::second; } |
47 | const ValueT &getSecond() const { return std::pair<KeyT, ValueT>::second; } |
48 | }; |
49 | |
50 | } // end namespace detail |
51 | |
52 | template <typename KeyT, typename ValueT, |
53 | typename KeyInfoT = DenseMapInfo<KeyT>, |
54 | typename Bucket = llvm::detail::DenseMapPair<KeyT, ValueT>, |
55 | bool IsConst = false> |
56 | class DenseMapIterator; |
57 | |
58 | template <typename DerivedT, typename KeyT, typename ValueT, typename KeyInfoT, |
59 | typename BucketT> |
60 | class DenseMapBase : public DebugEpochBase { |
61 | template <typename T> |
62 | using const_arg_type_t = typename const_pointer_or_const_ref<T>::type; |
63 | |
64 | public: |
65 | using size_type = unsigned; |
66 | using key_type = KeyT; |
67 | using mapped_type = ValueT; |
68 | using value_type = BucketT; |
69 | |
70 | using iterator = DenseMapIterator<KeyT, ValueT, KeyInfoT, BucketT>; |
71 | using const_iterator = |
72 | DenseMapIterator<KeyT, ValueT, KeyInfoT, BucketT, true>; |
73 | |
74 | inline iterator begin() { |
75 | // When the map is empty, avoid the overhead of advancing/retreating past |
76 | // empty buckets. |
77 | if (empty()) |
78 | return end(); |
79 | if (shouldReverseIterate<KeyT>()) |
80 | return makeIterator(getBucketsEnd() - 1, getBuckets(), *this); |
81 | return makeIterator(getBuckets(), getBucketsEnd(), *this); |
82 | } |
83 | inline iterator end() { |
84 | return makeIterator(getBucketsEnd(), getBucketsEnd(), *this, true); |
85 | } |
86 | inline const_iterator begin() const { |
87 | if (empty()) |
88 | return end(); |
89 | if (shouldReverseIterate<KeyT>()) |
90 | return makeConstIterator(getBucketsEnd() - 1, getBuckets(), *this); |
91 | return makeConstIterator(getBuckets(), getBucketsEnd(), *this); |
92 | } |
93 | inline const_iterator end() const { |
94 | return makeConstIterator(getBucketsEnd(), getBucketsEnd(), *this, true); |
95 | } |
96 | |
97 | LLVM_NODISCARD bool empty() const {
98 | return getNumEntries() == 0; |
99 | } |
100 | unsigned size() const { return getNumEntries(); } |
101 | |
102 | /// Grow the densemap so that it can contain at least \p NumEntries items |
103 | /// before resizing again. |
104 | void reserve(size_type NumEntries) { |
105 | auto NumBuckets = getMinBucketToReserveForEntries(NumEntries); |
106 | incrementEpoch(); |
107 | if (NumBuckets > getNumBuckets()) |
108 | grow(NumBuckets); |
109 | } |
110 | |
111 | void clear() { |
112 | incrementEpoch(); |
113 | if (getNumEntries() == 0 && getNumTombstones() == 0) return; |
114 | |
115 | // If the capacity of the array is huge, and the # elements used is small, |
116 | // shrink the array. |
117 | if (getNumEntries() * 4 < getNumBuckets() && getNumBuckets() > 64) { |
118 | shrink_and_clear(); |
119 | return; |
120 | } |
121 | |
122 | const KeyT EmptyKey = getEmptyKey(), TombstoneKey = getTombstoneKey(); |
123 | if (std::is_trivially_destructible<ValueT>::value) { |
124 | // Use a simpler loop when values don't need destruction. |
125 | for (BucketT *P = getBuckets(), *E = getBucketsEnd(); P != E; ++P) |
126 | P->getFirst() = EmptyKey; |
127 | } else { |
128 | unsigned NumEntries = getNumEntries(); |
129 | for (BucketT *P = getBuckets(), *E = getBucketsEnd(); P != E; ++P) { |
130 | if (!KeyInfoT::isEqual(P->getFirst(), EmptyKey)) { |
131 | if (!KeyInfoT::isEqual(P->getFirst(), TombstoneKey)) { |
132 | P->getSecond().~ValueT(); |
133 | --NumEntries; |
134 | } |
135 | P->getFirst() = EmptyKey; |
136 | } |
137 | } |
138 | assert(NumEntries == 0 && "Node count imbalance!");
139 | } |
140 | setNumEntries(0); |
141 | setNumTombstones(0); |
142 | } |
143 | |
144 | /// Return 1 if the specified key is in the map, 0 otherwise. |
145 | size_type count(const_arg_type_t<KeyT> Val) const { |
146 | const BucketT *TheBucket; |
147 | return LookupBucketFor(Val, TheBucket) ? 1 : 0; |
148 | } |
149 | |
150 | iterator find(const_arg_type_t<KeyT> Val) { |
151 | BucketT *TheBucket; |
152 | if (LookupBucketFor(Val, TheBucket)) |
153 | return makeIterator(TheBucket, |
154 | shouldReverseIterate<KeyT>() ? getBuckets() |
155 | : getBucketsEnd(), |
156 | *this, true); |
157 | return end(); |
158 | } |
159 | const_iterator find(const_arg_type_t<KeyT> Val) const { |
160 | const BucketT *TheBucket; |
161 | if (LookupBucketFor(Val, TheBucket)) |
162 | return makeConstIterator(TheBucket, |
163 | shouldReverseIterate<KeyT>() ? getBuckets() |
164 | : getBucketsEnd(), |
165 | *this, true); |
166 | return end(); |
167 | } |
168 | |
169 | /// Alternate version of find() which allows a different, and possibly |
170 | /// less expensive, key type. |
171 | /// The DenseMapInfo is responsible for supplying methods |
172 | /// getHashValue(LookupKeyT) and isEqual(LookupKeyT, KeyT) for each key |
173 | /// type used. |
174 | template<class LookupKeyT> |
175 | iterator find_as(const LookupKeyT &Val) { |
176 | BucketT *TheBucket; |
177 | if (LookupBucketFor(Val, TheBucket)) |
178 | return makeIterator(TheBucket, |
179 | shouldReverseIterate<KeyT>() ? getBuckets() |
180 | : getBucketsEnd(), |
181 | *this, true); |
182 | return end(); |
183 | } |
184 | template<class LookupKeyT> |
185 | const_iterator find_as(const LookupKeyT &Val) const { |
186 | const BucketT *TheBucket; |
187 | if (LookupBucketFor(Val, TheBucket)) |
188 | return makeConstIterator(TheBucket, |
189 | shouldReverseIterate<KeyT>() ? getBuckets() |
190 | : getBucketsEnd(), |
191 | *this, true); |
192 | return end(); |
193 | } |
194 | |
195 | /// lookup - Return the entry for the specified key, or a default |
196 | /// constructed value if no such entry exists. |
197 | ValueT lookup(const_arg_type_t<KeyT> Val) const { |
198 | const BucketT *TheBucket; |
199 | if (LookupBucketFor(Val, TheBucket)) |
200 | return TheBucket->getSecond(); |
201 | return ValueT(); |
202 | } |
203 | |
204 | // Inserts key,value pair into the map if the key isn't already in the map. |
205 | // If the key is already in the map, it returns false and doesn't update the |
206 | // value. |
207 | std::pair<iterator, bool> insert(const std::pair<KeyT, ValueT> &KV) { |
208 | return try_emplace(KV.first, KV.second); |
209 | } |
210 | |
211 | // Inserts key,value pair into the map if the key isn't already in the map. |
212 | // If the key is already in the map, it returns false and doesn't update the |
213 | // value. |
214 | std::pair<iterator, bool> insert(std::pair<KeyT, ValueT> &&KV) { |
215 | return try_emplace(std::move(KV.first), std::move(KV.second)); |
216 | } |
217 | |
218 | // Inserts key,value pair into the map if the key isn't already in the map. |
219 | // The value is constructed in-place if the key is not in the map, otherwise |
220 | // it is not moved. |
221 | template <typename... Ts> |
222 | std::pair<iterator, bool> try_emplace(KeyT &&Key, Ts &&... Args) { |
223 | BucketT *TheBucket; |
224 | if (LookupBucketFor(Key, TheBucket)) |
225 | return std::make_pair(makeIterator(TheBucket, |
226 | shouldReverseIterate<KeyT>() |
227 | ? getBuckets() |
228 | : getBucketsEnd(), |
229 | *this, true), |
230 | false); // Already in map. |
231 | |
232 | // Otherwise, insert the new element. |
233 | TheBucket = |
234 | InsertIntoBucket(TheBucket, std::move(Key), std::forward<Ts>(Args)...); |
235 | return std::make_pair(makeIterator(TheBucket, |
236 | shouldReverseIterate<KeyT>() |
237 | ? getBuckets() |
238 | : getBucketsEnd(), |
239 | *this, true), |
240 | true); |
241 | } |
242 | |
243 | // Inserts key,value pair into the map if the key isn't already in the map. |
244 | // The value is constructed in-place if the key is not in the map, otherwise |
245 | // it is not moved. |
246 | template <typename... Ts> |
247 | std::pair<iterator, bool> try_emplace(const KeyT &Key, Ts &&... Args) { |
248 | BucketT *TheBucket; |
249 | if (LookupBucketFor(Key, TheBucket)) |
250 | return std::make_pair(makeIterator(TheBucket, |
251 | shouldReverseIterate<KeyT>() |
252 | ? getBuckets() |
253 | : getBucketsEnd(), |
254 | *this, true), |
255 | false); // Already in map. |
256 | |
257 | // Otherwise, insert the new element. |
258 | TheBucket = InsertIntoBucket(TheBucket, Key, std::forward<Ts>(Args)...); |
259 | return std::make_pair(makeIterator(TheBucket, |
260 | shouldReverseIterate<KeyT>() |
261 | ? getBuckets() |
262 | : getBucketsEnd(), |
263 | *this, true), |
264 | true); |
265 | } |
266 | |
267 | /// Alternate version of insert() which allows a different, and possibly |
268 | /// less expensive, key type. |
269 | /// The DenseMapInfo is responsible for supplying methods |
270 | /// getHashValue(LookupKeyT) and isEqual(LookupKeyT, KeyT) for each key |
271 | /// type used. |
272 | template <typename LookupKeyT> |
273 | std::pair<iterator, bool> insert_as(std::pair<KeyT, ValueT> &&KV, |
274 | const LookupKeyT &Val) { |
275 | BucketT *TheBucket; |
276 | if (LookupBucketFor(Val, TheBucket)) |
277 | return std::make_pair(makeIterator(TheBucket, |
278 | shouldReverseIterate<KeyT>() |
279 | ? getBuckets() |
280 | : getBucketsEnd(), |
281 | *this, true), |
282 | false); // Already in map. |
283 | |
284 | // Otherwise, insert the new element. |
285 | TheBucket = InsertIntoBucketWithLookup(TheBucket, std::move(KV.first), |
286 | std::move(KV.second), Val); |
287 | return std::make_pair(makeIterator(TheBucket, |
288 | shouldReverseIterate<KeyT>() |
289 | ? getBuckets() |
290 | : getBucketsEnd(), |
291 | *this, true), |
292 | true); |
293 | } |
294 | |
295 | /// insert - Range insertion of pairs. |
296 | template<typename InputIt> |
297 | void insert(InputIt I, InputIt E) { |
298 | for (; I != E; ++I) |
299 | insert(*I); |
300 | } |
301 | |
302 | bool erase(const KeyT &Val) { |
303 | BucketT *TheBucket; |
304 | if (!LookupBucketFor(Val, TheBucket)) |
305 | return false; // not in map. |
306 | |
307 | TheBucket->getSecond().~ValueT(); |
308 | TheBucket->getFirst() = getTombstoneKey(); |
309 | decrementNumEntries(); |
310 | incrementNumTombstones(); |
311 | return true; |
312 | } |
313 | void erase(iterator I) { |
314 | BucketT *TheBucket = &*I; |
315 | TheBucket->getSecond().~ValueT(); |
316 | TheBucket->getFirst() = getTombstoneKey(); |
317 | decrementNumEntries(); |
318 | incrementNumTombstones(); |
319 | } |
320 | |
321 | value_type& FindAndConstruct(const KeyT &Key) { |
322 | BucketT *TheBucket; |
323 | if (LookupBucketFor(Key, TheBucket)) |
324 | return *TheBucket; |
325 | |
326 | return *InsertIntoBucket(TheBucket, Key); |
327 | } |
328 | |
329 | ValueT &operator[](const KeyT &Key) { |
330 | return FindAndConstruct(Key).second; |
331 | } |
332 | |
333 | value_type& FindAndConstruct(KeyT &&Key) { |
334 | BucketT *TheBucket; |
335 | if (LookupBucketFor(Key, TheBucket)) |
336 | return *TheBucket; |
337 | |
338 | return *InsertIntoBucket(TheBucket, std::move(Key)); |
339 | } |
340 | |
341 | ValueT &operator[](KeyT &&Key) { |
342 | return FindAndConstruct(std::move(Key)).second; |
343 | } |
344 | |
345 | /// isPointerIntoBucketsArray - Return true if the specified pointer points |
346 | /// somewhere into the DenseMap's array of buckets (i.e. either to a key or |
347 | /// value in the DenseMap). |
348 | bool isPointerIntoBucketsArray(const void *Ptr) const { |
349 | return Ptr >= getBuckets() && Ptr < getBucketsEnd(); |
350 | } |
351 | |
352 | /// getPointerIntoBucketsArray() - Return an opaque pointer into the buckets |
353 | /// array. In conjunction with the previous method, this can be used to |
354 | /// determine whether an insertion caused the DenseMap to reallocate. |
355 | const void *getPointerIntoBucketsArray() const { return getBuckets(); } |
356 | |
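// A usage sketch of the query/update API above (keys and values are
// illustrative; DenseMap, defined further below, derives from this class):
//
//   DenseMap<int, int> M;
//   M.insert({1, 10});      // {iterator, true}  - newly inserted
//   M.insert({1, 99});      // {iterator, false} - value stays 10
//   M.try_emplace(2, 20);   // constructs the value in place
//   M[3] = 30;              // FindAndConstruct, then assignment
//   M.lookup(4);            // 0: default-constructed ValueT, nothing inserted
//   M.count(4);             // 0, and M.find(4) == M.end()
//   M.erase(1);             // removes the entry, leaving a tombstone bucket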
357 | protected: |
358 | DenseMapBase() = default; |
359 | |
360 | void destroyAll() { |
361 | if (getNumBuckets() == 0) // Nothing to do. |
362 | return; |
363 | |
364 | const KeyT EmptyKey = getEmptyKey(), TombstoneKey = getTombstoneKey(); |
365 | for (BucketT *P = getBuckets(), *E = getBucketsEnd(); P != E; ++P) { |
366 | if (!KeyInfoT::isEqual(P->getFirst(), EmptyKey) && |
367 | !KeyInfoT::isEqual(P->getFirst(), TombstoneKey)) |
368 | P->getSecond().~ValueT(); |
369 | P->getFirst().~KeyT(); |
370 | } |
371 | } |
372 | |
373 | void initEmpty() { |
374 | setNumEntries(0); |
375 | setNumTombstones(0); |
376 | |
377 | assert((getNumBuckets() & (getNumBuckets()-1)) == 0 &&
378 | "# initial buckets must be a power of two!");
379 | const KeyT EmptyKey = getEmptyKey(); |
380 | for (BucketT *B = getBuckets(), *E = getBucketsEnd(); B != E; ++B) |
381 | ::new (&B->getFirst()) KeyT(EmptyKey); |
382 | } |
383 | |
384 | /// Returns the number of buckets to allocate to ensure that the DenseMap can |
385 | /// accommodate \p NumEntries without need to grow(). |
386 | unsigned getMinBucketToReserveForEntries(unsigned NumEntries) { |
387 | // Ensure that "NumEntries * 4 < NumBuckets * 3" |
388 | if (NumEntries == 0) |
389 | return 0; |
390 | // +1 is required because of the strict inequality: for NumEntries == 48 we need
391 | // more than 64 buckets (48 * 4 == 64 * 3), and NextPowerOf2(64 + 1) yields 128.
392 | return NextPowerOf2(NumEntries * 4 / 3 + 1); |
393 | } |
394 | |
395 | void moveFromOldBuckets(BucketT *OldBucketsBegin, BucketT *OldBucketsEnd) { |
396 | initEmpty(); |
397 | |
398 | // Insert all the old elements. |
399 | const KeyT EmptyKey = getEmptyKey(); |
400 | const KeyT TombstoneKey = getTombstoneKey(); |
401 | for (BucketT *B = OldBucketsBegin, *E = OldBucketsEnd; B != E; ++B) { |
402 | if (!KeyInfoT::isEqual(B->getFirst(), EmptyKey) && |
403 | !KeyInfoT::isEqual(B->getFirst(), TombstoneKey)) { |
404 | // Insert the key/value into the new table. |
405 | BucketT *DestBucket; |
406 | bool FoundVal = LookupBucketFor(B->getFirst(), DestBucket); |
407 | (void)FoundVal; // silence warning. |
408 | assert(!FoundVal && "Key already in new map?");
409 | DestBucket->getFirst() = std::move(B->getFirst()); |
410 | ::new (&DestBucket->getSecond()) ValueT(std::move(B->getSecond())); |
411 | incrementNumEntries(); |
412 | |
413 | // Free the value. |
414 | B->getSecond().~ValueT(); |
415 | } |
416 | B->getFirst().~KeyT(); |
417 | } |
418 | } |
419 | |
420 | template <typename OtherBaseT> |
421 | void copyFrom( |
422 | const DenseMapBase<OtherBaseT, KeyT, ValueT, KeyInfoT, BucketT> &other) { |
423 | assert(&other != this);
424 | assert(getNumBuckets() == other.getNumBuckets());
425 | |
426 | setNumEntries(other.getNumEntries()); |
427 | setNumTombstones(other.getNumTombstones()); |
428 | |
429 | if (std::is_trivially_copyable<KeyT>::value && |
430 | std::is_trivially_copyable<ValueT>::value) |
431 | memcpy(reinterpret_cast<void *>(getBuckets()), other.getBuckets(), |
432 | getNumBuckets() * sizeof(BucketT)); |
433 | else |
434 | for (size_t i = 0; i < getNumBuckets(); ++i) { |
435 | ::new (&getBuckets()[i].getFirst()) |
436 | KeyT(other.getBuckets()[i].getFirst()); |
437 | if (!KeyInfoT::isEqual(getBuckets()[i].getFirst(), getEmptyKey()) && |
438 | !KeyInfoT::isEqual(getBuckets()[i].getFirst(), getTombstoneKey())) |
439 | ::new (&getBuckets()[i].getSecond()) |
440 | ValueT(other.getBuckets()[i].getSecond()); |
441 | } |
442 | } |
443 | |
444 | static unsigned getHashValue(const KeyT &Val) { |
445 | return KeyInfoT::getHashValue(Val); |
446 | } |
447 | |
448 | template<typename LookupKeyT> |
449 | static unsigned getHashValue(const LookupKeyT &Val) { |
450 | return KeyInfoT::getHashValue(Val); |
451 | } |
452 | |
453 | static const KeyT getEmptyKey() { |
454 | static_assert(std::is_base_of<DenseMapBase, DerivedT>::value, |
455 | "Must pass the derived type to this template!"); |
456 | return KeyInfoT::getEmptyKey(); |
457 | } |
458 | |
459 | static const KeyT getTombstoneKey() { |
460 | return KeyInfoT::getTombstoneKey(); |
461 | } |
462 | |
463 | private: |
464 | iterator makeIterator(BucketT *P, BucketT *E, |
465 | DebugEpochBase &Epoch, |
466 | bool NoAdvance=false) { |
467 | if (shouldReverseIterate<KeyT>()) { |
468 | BucketT *B = P == getBucketsEnd() ? getBuckets() : P + 1; |
469 | return iterator(B, E, Epoch, NoAdvance); |
470 | } |
471 | return iterator(P, E, Epoch, NoAdvance); |
472 | } |
473 | |
474 | const_iterator makeConstIterator(const BucketT *P, const BucketT *E, |
475 | const DebugEpochBase &Epoch, |
476 | const bool NoAdvance=false) const { |
477 | if (shouldReverseIterate<KeyT>()) { |
478 | const BucketT *B = P == getBucketsEnd() ? getBuckets() : P + 1; |
479 | return const_iterator(B, E, Epoch, NoAdvance); |
480 | } |
481 | return const_iterator(P, E, Epoch, NoAdvance); |
482 | } |
483 | |
484 | unsigned getNumEntries() const { |
485 | return static_cast<const DerivedT *>(this)->getNumEntries(); |
486 | } |
487 | |
488 | void setNumEntries(unsigned Num) { |
489 | static_cast<DerivedT *>(this)->setNumEntries(Num); |
490 | } |
491 | |
492 | void incrementNumEntries() { |
493 | setNumEntries(getNumEntries() + 1); |
494 | } |
495 | |
496 | void decrementNumEntries() { |
497 | setNumEntries(getNumEntries() - 1); |
498 | } |
499 | |
500 | unsigned getNumTombstones() const { |
501 | return static_cast<const DerivedT *>(this)->getNumTombstones(); |
502 | } |
503 | |
504 | void setNumTombstones(unsigned Num) { |
505 | static_cast<DerivedT *>(this)->setNumTombstones(Num); |
506 | } |
507 | |
508 | void incrementNumTombstones() { |
509 | setNumTombstones(getNumTombstones() + 1); |
510 | } |
511 | |
512 | void decrementNumTombstones() { |
513 | setNumTombstones(getNumTombstones() - 1); |
514 | } |
515 | |
516 | const BucketT *getBuckets() const { |
517 | return static_cast<const DerivedT *>(this)->getBuckets(); |
518 | } |
519 | |
520 | BucketT *getBuckets() { |
521 | return static_cast<DerivedT *>(this)->getBuckets(); |
522 | } |
523 | |
524 | unsigned getNumBuckets() const { |
525 | return static_cast<const DerivedT *>(this)->getNumBuckets(); |
526 | } |
527 | |
528 | BucketT *getBucketsEnd() { |
529 | return getBuckets() + getNumBuckets(); |
530 | } |
531 | |
532 | const BucketT *getBucketsEnd() const { |
533 | return getBuckets() + getNumBuckets(); |
534 | } |
535 | |
536 | void grow(unsigned AtLeast) { |
537 | static_cast<DerivedT *>(this)->grow(AtLeast); |
538 | } |
539 | |
540 | void shrink_and_clear() { |
541 | static_cast<DerivedT *>(this)->shrink_and_clear(); |
542 | } |
543 | |
544 | template <typename KeyArg, typename... ValueArgs> |
545 | BucketT *InsertIntoBucket(BucketT *TheBucket, KeyArg &&Key, |
546 | ValueArgs &&... Values) { |
547 | TheBucket = InsertIntoBucketImpl(Key, Key, TheBucket); |
548 | |
549 | TheBucket->getFirst() = std::forward<KeyArg>(Key); |
550 | ::new (&TheBucket->getSecond()) ValueT(std::forward<ValueArgs>(Values)...); |
551 | return TheBucket; |
552 | } |
553 | |
554 | template <typename LookupKeyT> |
555 | BucketT *InsertIntoBucketWithLookup(BucketT *TheBucket, KeyT &&Key, |
556 | ValueT &&Value, LookupKeyT &Lookup) { |
557 | TheBucket = InsertIntoBucketImpl(Key, Lookup, TheBucket); |
558 | |
559 | TheBucket->getFirst() = std::move(Key); |
560 | ::new (&TheBucket->getSecond()) ValueT(std::move(Value)); |
561 | return TheBucket; |
562 | } |
563 | |
564 | template <typename LookupKeyT> |
565 | BucketT *InsertIntoBucketImpl(const KeyT &Key, const LookupKeyT &Lookup, |
566 | BucketT *TheBucket) { |
567 | incrementEpoch(); |
568 | |
569 | // If the load of the hash table is more than 3/4, or if fewer than 1/8 of |
570 | // the buckets are empty (meaning that many are filled with tombstones), |
571 | // grow the table. |
572 | // |
573 | // The latter case is tricky. For example, if we had one empty bucket with
574 | // tons of tombstones, failing lookups (e.g. for insertion) would have to
575 | // probe almost the entire table until it found the empty bucket. If the
576 | // table were completely filled with tombstones, no lookup would ever succeed,
577 | // causing infinite loops in lookup. |
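// Worked example of the first condition: with 64 buckets the table grows to
// 128 when the 48th entry is about to go in (48 * 4 == 192 >= 64 * 3), keeping
// the load factor below 3/4. The second condition instead calls grow() at the
// current size, rehashing into a fresh table of the same size, which clears
// out the accumulated tombstones.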
578 | unsigned NewNumEntries = getNumEntries() + 1; |
579 | unsigned NumBuckets = getNumBuckets(); |
580 | if (LLVM_UNLIKELY(NewNumEntries * 4 >= NumBuckets * 3)) {
581 | this->grow(NumBuckets * 2); |
582 | LookupBucketFor(Lookup, TheBucket); |
583 | NumBuckets = getNumBuckets(); |
584 | } else if (LLVM_UNLIKELY(NumBuckets-(NewNumEntries+getNumTombstones()) <=
585 | NumBuckets/8)) {
586 | this->grow(NumBuckets); |
587 | LookupBucketFor(Lookup, TheBucket); |
588 | } |
589 | assert(TheBucket);
590 | |
591 | // Only update the state after we've grown our bucket space appropriately |
592 | // so that when growing buckets we have self-consistent entry count. |
593 | incrementNumEntries(); |
594 | |
595 | // If we are writing over a tombstone, remember this. |
596 | const KeyT EmptyKey = getEmptyKey(); |
597 | if (!KeyInfoT::isEqual(TheBucket->getFirst(), EmptyKey)) |
598 | decrementNumTombstones(); |
599 | |
600 | return TheBucket; |
601 | } |
602 | |
603 | /// LookupBucketFor - Lookup the appropriate bucket for Val, returning it in |
604 | /// FoundBucket. If the bucket contains the key and a value, this returns |
605 | /// true, otherwise it returns a bucket with an empty marker or tombstone and |
606 | /// returns false. |
607 | template<typename LookupKeyT> |
608 | bool LookupBucketFor(const LookupKeyT &Val, |
609 | const BucketT *&FoundBucket) const { |
610 | const BucketT *BucketsPtr = getBuckets(); |
611 | const unsigned NumBuckets = getNumBuckets(); |
612 | |
613 | if (NumBuckets == 0) { |
614 | FoundBucket = nullptr; |
615 | return false; |
616 | } |
617 | |
618 | // FoundTombstone - Keep track of whether we find a tombstone while probing. |
619 | const BucketT *FoundTombstone = nullptr; |
620 | const KeyT EmptyKey = getEmptyKey(); |
621 | const KeyT TombstoneKey = getTombstoneKey(); |
622 | assert(!KeyInfoT::isEqual(Val, EmptyKey) &&
623 | !KeyInfoT::isEqual(Val, TombstoneKey) &&
624 | "Empty/Tombstone value shouldn't be inserted into map!");
625 | |
626 | unsigned BucketNo = getHashValue(Val) & (NumBuckets-1); |
627 | unsigned ProbeAmt = 1; |
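// Probing note: because ProbeAmt grows by one each iteration, the walk below
// visits H, H+1, H+3, H+6, H+10, ... (all mod NumBuckets), i.e. the i-th probe
// lands at H + i*(i+1)/2. For a power-of-two table size this triangular-number
// sequence reaches every bucket, so the loop terminates as long as at least
// one bucket is empty or holds the key.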
628 | while (true) { |
629 | const BucketT *ThisBucket = BucketsPtr + BucketNo; |
630 | // Found Val's bucket? If so, return it. |
631 | if (LLVM_LIKELY(KeyInfoT::isEqual(Val, ThisBucket->getFirst()))) {
632 | FoundBucket = ThisBucket; |
633 | return true; |
634 | } |
635 | |
636 | // If we found an empty bucket, the key doesn't exist in the map. Report the
637 | // bucket an insertion should use and return false.
638 | if (LLVM_LIKELY(KeyInfoT::isEqual(ThisBucket->getFirst(), EmptyKey))) {
639 | // If we've already seen a tombstone while probing, fill it in instead |
640 | // of the empty bucket we eventually probed to. |
641 | FoundBucket = FoundTombstone ? FoundTombstone : ThisBucket; |
642 | return false; |
643 | } |
644 | |
645 | // If this is a tombstone, remember it. If Val ends up not in the map, we |
646 | // prefer to return it rather than something that would require more probing.
647 | if (KeyInfoT::isEqual(ThisBucket->getFirst(), TombstoneKey) && |
648 | !FoundTombstone) |
649 | FoundTombstone = ThisBucket; // Remember the first tombstone found. |
650 | |
651 | // Otherwise, it's a hash collision or a tombstone, continue quadratic |
652 | // probing. |
653 | BucketNo += ProbeAmt++; |
654 | BucketNo &= (NumBuckets-1); |
655 | } |
656 | } |
657 | |
658 | template <typename LookupKeyT> |
659 | bool LookupBucketFor(const LookupKeyT &Val, BucketT *&FoundBucket) { |
660 | const BucketT *ConstFoundBucket; |
661 | bool Result = const_cast<const DenseMapBase *>(this) |
662 | ->LookupBucketFor(Val, ConstFoundBucket); |
663 | FoundBucket = const_cast<BucketT *>(ConstFoundBucket); |
664 | return Result; |
665 | } |
666 | |
667 | public: |
668 | /// Return the approximate size (in bytes) of the actual map. |
669 | /// This is just the raw memory used by DenseMap. |
670 | /// If entries are pointers to objects, the size of the referenced objects |
671 | /// are not included. |
672 | size_t getMemorySize() const { |
673 | return getNumBuckets() * sizeof(BucketT); |
674 | } |
675 | }; |
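// --- Editorial illustration (not part of this header) ----------------------
// A minimal, self-contained sketch of two policies implemented above: the
// grow-on-insert thresholds from the bucket-insertion helper, and the
// quadratic probe step used by LookupBucketFor. The enum and function names
// below are hypothetical and exist only for illustration; they mirror the
// arithmetic, nothing more.
enum class DenseMapGrowSketch { None, Double, RehashInPlace };

inline DenseMapGrowSketch
denseMapGrowDecisionSketch(unsigned NewNumEntries, unsigned NumBuckets,
                           unsigned NumTombstones) {
  // Double once the table would exceed 3/4 load.
  if (NewNumEntries * 4 >= NumBuckets * 3)
    return DenseMapGrowSketch::Double;
  // Rehash at the same size when fewer than 1/8 of the buckets are empty,
  // which reclaims slots held by tombstones.
  if (NumBuckets - (NewNumEntries + NumTombstones) <= NumBuckets / 8)
    return DenseMapGrowSketch::RehashInPlace;
  return DenseMapGrowSketch::None;
}

// Probe sequence: start at Hash & (NumBuckets - 1); each collision advances
// by an increasing step (1, 2, 3, ...) and wraps with a mask, which is why
// the bucket count must stay a power of two.
inline unsigned denseMapNextProbeSketch(unsigned BucketNo, unsigned &ProbeAmt,
                                        unsigned NumBuckets) {
  BucketNo += ProbeAmt++;
  return BucketNo & (NumBuckets - 1);
}
// ----------------------------------------------------------------------------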
676 | |
677 | /// Equality comparison for DenseMap. |
678 | /// |
679 | /// Iterates over elements of LHS confirming that each (key, value) pair in LHS |
680 | /// is also in RHS, and that no additional pairs are in RHS. |
681 | /// Equivalent to N calls to RHS.find and N value comparisons. Amortized |
682 | /// complexity is linear, worst case is O(N^2) (if every hash collides). |
683 | template <typename DerivedT, typename KeyT, typename ValueT, typename KeyInfoT, |
684 | typename BucketT> |
685 | bool operator==( |
686 | const DenseMapBase<DerivedT, KeyT, ValueT, KeyInfoT, BucketT> &LHS, |
687 | const DenseMapBase<DerivedT, KeyT, ValueT, KeyInfoT, BucketT> &RHS) { |
688 | if (LHS.size() != RHS.size()) |
689 | return false; |
690 | |
691 | for (auto &KV : LHS) { |
692 | auto I = RHS.find(KV.first); |
693 | if (I == RHS.end() || I->second != KV.second) |
694 | return false; |
695 | } |
696 | |
697 | return true; |
698 | } |
699 | |
700 | /// Inequality comparison for DenseMap. |
701 | /// |
702 | /// Equivalent to !(LHS == RHS). See operator== for performance notes. |
703 | template <typename DerivedT, typename KeyT, typename ValueT, typename KeyInfoT, |
704 | typename BucketT> |
705 | bool operator!=( |
706 | const DenseMapBase<DerivedT, KeyT, ValueT, KeyInfoT, BucketT> &LHS, |
707 | const DenseMapBase<DerivedT, KeyT, ValueT, KeyInfoT, BucketT> &RHS) { |
708 | return !(LHS == RHS); |
709 | } |
710 | |
711 | template <typename KeyT, typename ValueT, |
712 | typename KeyInfoT = DenseMapInfo<KeyT>, |
713 | typename BucketT = llvm::detail::DenseMapPair<KeyT, ValueT>> |
714 | class DenseMap : public DenseMapBase<DenseMap<KeyT, ValueT, KeyInfoT, BucketT>, |
715 | KeyT, ValueT, KeyInfoT, BucketT> { |
716 | friend class DenseMapBase<DenseMap, KeyT, ValueT, KeyInfoT, BucketT>; |
717 | |
718 | // Lift some types from the dependent base class into this class for |
719 | // simplicity of referring to them. |
720 | using BaseT = DenseMapBase<DenseMap, KeyT, ValueT, KeyInfoT, BucketT>; |
721 | |
722 | BucketT *Buckets; |
723 | unsigned NumEntries; |
724 | unsigned NumTombstones; |
725 | unsigned NumBuckets; |
726 | |
727 | public: |
728 | /// Create a DenseMap with an optional \p InitialReserve that guarantees that |
729 | /// this number of elements can be inserted in the map without calling grow(). |
730 | explicit DenseMap(unsigned InitialReserve = 0) { init(InitialReserve); } |
731 | |
732 | DenseMap(const DenseMap &other) : BaseT() { |
733 | init(0); |
734 | copyFrom(other); |
735 | } |
736 | |
737 | DenseMap(DenseMap &&other) : BaseT() { |
738 | init(0); |
739 | swap(other); |
740 | } |
741 | |
742 | template<typename InputIt> |
743 | DenseMap(const InputIt &I, const InputIt &E) { |
744 | init(std::distance(I, E)); |
745 | this->insert(I, E); |
746 | } |
747 | |
748 | DenseMap(std::initializer_list<typename BaseT::value_type> Vals) { |
749 | init(Vals.size()); |
750 | this->insert(Vals.begin(), Vals.end()); |
751 | } |
752 | |
753 | ~DenseMap() { |
754 | this->destroyAll(); |
755 | deallocate_buffer(Buckets, sizeof(BucketT) * NumBuckets, alignof(BucketT)); |
756 | } |
757 | |
758 | void swap(DenseMap& RHS) { |
759 | this->incrementEpoch(); |
760 | RHS.incrementEpoch(); |
761 | std::swap(Buckets, RHS.Buckets); |
762 | std::swap(NumEntries, RHS.NumEntries); |
763 | std::swap(NumTombstones, RHS.NumTombstones); |
764 | std::swap(NumBuckets, RHS.NumBuckets); |
765 | } |
766 | |
767 | DenseMap& operator=(const DenseMap& other) { |
768 | if (&other != this) |
769 | copyFrom(other); |
770 | return *this; |
771 | } |
772 | |
773 | DenseMap& operator=(DenseMap &&other) { |
774 | this->destroyAll(); |
775 | deallocate_buffer(Buckets, sizeof(BucketT) * NumBuckets, alignof(BucketT)); |
776 | init(0); |
777 | swap(other); |
778 | return *this; |
779 | } |
780 | |
781 | void copyFrom(const DenseMap& other) { |
782 | this->destroyAll(); |
783 | deallocate_buffer(Buckets, sizeof(BucketT) * NumBuckets, alignof(BucketT)); |
784 | if (allocateBuckets(other.NumBuckets)) { |
785 | this->BaseT::copyFrom(other); |
786 | } else { |
787 | NumEntries = 0; |
788 | NumTombstones = 0; |
789 | } |
790 | } |
791 | |
792 | void init(unsigned InitNumEntries) { |
793 | auto InitBuckets = BaseT::getMinBucketToReserveForEntries(InitNumEntries); |
794 | if (allocateBuckets(InitBuckets)) { |
795 | this->BaseT::initEmpty(); |
796 | } else { |
797 | NumEntries = 0; |
798 | NumTombstones = 0; |
799 | } |
800 | } |
801 | |
802 | void grow(unsigned AtLeast) { |
803 | unsigned OldNumBuckets = NumBuckets; |
804 | BucketT *OldBuckets = Buckets; |
805 | |
806 | allocateBuckets(std::max<unsigned>(64, static_cast<unsigned>(NextPowerOf2(AtLeast-1)))); |
807 | assert(Buckets); |
808 | if (!OldBuckets) { |
809 | this->BaseT::initEmpty(); |
810 | return; |
811 | } |
812 | |
813 | this->moveFromOldBuckets(OldBuckets, OldBuckets+OldNumBuckets); |
814 | |
815 | // Free the old table. |
816 | deallocate_buffer(OldBuckets, sizeof(BucketT) * OldNumBuckets, |
817 | alignof(BucketT)); |
818 | } |
819 | |
820 | void shrink_and_clear() { |
821 | unsigned OldNumBuckets = NumBuckets; |
822 | unsigned OldNumEntries = NumEntries; |
823 | this->destroyAll(); |
824 | |
825 | // Reduce the number of buckets. |
826 | unsigned NewNumBuckets = 0; |
827 | if (OldNumEntries) |
828 | NewNumBuckets = std::max(64, 1 << (Log2_32_Ceil(OldNumEntries) + 1)); |
829 | if (NewNumBuckets == NumBuckets) { |
830 | this->BaseT::initEmpty(); |
831 | return; |
832 | } |
833 | |
834 | deallocate_buffer(Buckets, sizeof(BucketT) * OldNumBuckets, |
835 | alignof(BucketT)); |
836 | init(NewNumBuckets); |
837 | } |
838 | |
839 | private: |
840 | unsigned getNumEntries() const { |
841 | return NumEntries; |
842 | } |
843 | |
844 | void setNumEntries(unsigned Num) { |
845 | NumEntries = Num; |
846 | } |
847 | |
848 | unsigned getNumTombstones() const { |
849 | return NumTombstones; |
850 | } |
851 | |
852 | void setNumTombstones(unsigned Num) { |
853 | NumTombstones = Num; |
854 | } |
855 | |
856 | BucketT *getBuckets() const { |
857 | return Buckets; |
858 | } |
859 | |
860 | unsigned getNumBuckets() const { |
861 | return NumBuckets; |
862 | } |
863 | |
864 | bool allocateBuckets(unsigned Num) { |
865 | NumBuckets = Num; |
866 | if (NumBuckets == 0) { |
867 | Buckets = nullptr; |
868 | return false; |
869 | } |
870 | |
871 | Buckets = static_cast<BucketT *>( |
872 | allocate_buffer(sizeof(BucketT) * NumBuckets, alignof(BucketT))); |
873 | return true; |
874 | } |
875 | }; |
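// --- Editorial illustration (not part of this header) ----------------------
// A small usage sketch for the DenseMap defined above: insert/find/lookup,
// the equality operator, and getMemorySize. The function name is
// hypothetical; the member functions it calls are the ones declared in
// DenseMapBase and DenseMap.
inline bool denseMapUsageSketch() {
  DenseMap<int, int> Squares;
  for (int I = 1; I <= 4; ++I)
    Squares.insert({I, I * I});          // insert returns {iterator, bool}

  auto It = Squares.find(3);
  bool Found = It != Squares.end() && It->second == 9;

  // lookup() returns a value-initialized ValueT (0 here) for missing keys.
  bool MissingIsZero = Squares.lookup(42) == 0;

  DenseMap<int, int> Copy(Squares);      // copy constructor uses copyFrom()
  bool Equal = (Copy == Squares);        // element-wise comparison from above

  // Raw bucket storage only; objects pointed to by values are not counted.
  size_t Bytes = Squares.getMemorySize();

  return Found && MissingIsZero && Equal && Bytes >= Squares.size();
}
// ----------------------------------------------------------------------------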
876 | |
877 | template <typename KeyT, typename ValueT, unsigned InlineBuckets = 4, |
878 | typename KeyInfoT = DenseMapInfo<KeyT>, |
879 | typename BucketT = llvm::detail::DenseMapPair<KeyT, ValueT>> |
880 | class SmallDenseMap |
881 | : public DenseMapBase< |
882 | SmallDenseMap<KeyT, ValueT, InlineBuckets, KeyInfoT, BucketT>, KeyT, |
883 | ValueT, KeyInfoT, BucketT> { |
884 | friend class DenseMapBase<SmallDenseMap, KeyT, ValueT, KeyInfoT, BucketT>; |
885 | |
886 | // Lift some types from the dependent base class into this class for |
887 | // simplicity of referring to them. |
888 | using BaseT = DenseMapBase<SmallDenseMap, KeyT, ValueT, KeyInfoT, BucketT>; |
889 | |
890 | static_assert(isPowerOf2_64(InlineBuckets), |
891 | "InlineBuckets must be a power of 2."); |
892 | |
893 | unsigned Small : 1; |
894 | unsigned NumEntries : 31; |
895 | unsigned NumTombstones; |
896 | |
897 | struct LargeRep { |
898 | BucketT *Buckets; |
899 | unsigned NumBuckets; |
900 | }; |
901 | |
902 | /// A "union" of an inline bucket array and the struct representing |
903 | /// a large bucket. This union will be discriminated by the 'Small' bit. |
904 | AlignedCharArrayUnion<BucketT[InlineBuckets], LargeRep> storage; |
905 | |
906 | public: |
907 | explicit SmallDenseMap(unsigned NumInitBuckets = 0) { |
908 | init(NumInitBuckets); |
909 | } |
910 | |
911 | SmallDenseMap(const SmallDenseMap &other) : BaseT() { |
912 | init(0); |
913 | copyFrom(other); |
914 | } |
915 | |
916 | SmallDenseMap(SmallDenseMap &&other) : BaseT() { |
917 | init(0); |
918 | swap(other); |
919 | } |
920 | |
921 | template<typename InputIt> |
922 | SmallDenseMap(const InputIt &I, const InputIt &E) { |
923 | init(NextPowerOf2(std::distance(I, E))); |
924 | this->insert(I, E); |
925 | } |
926 | |
927 | SmallDenseMap(std::initializer_list<typename BaseT::value_type> Vals) |
928 | : SmallDenseMap(Vals.begin(), Vals.end()) {} |
929 | |
930 | ~SmallDenseMap() { |
931 | this->destroyAll(); |
932 | deallocateBuckets(); |
933 | } |
934 | |
935 | void swap(SmallDenseMap& RHS) { |
936 | unsigned TmpNumEntries = RHS.NumEntries; |
937 | RHS.NumEntries = NumEntries; |
938 | NumEntries = TmpNumEntries; |
939 | std::swap(NumTombstones, RHS.NumTombstones); |
940 | |
941 | const KeyT EmptyKey = this->getEmptyKey(); |
942 | const KeyT TombstoneKey = this->getTombstoneKey(); |
943 | if (Small && RHS.Small) { |
944 | // If we're swapping inline bucket arrays, we have to cope with some of |
945 | // the tricky bits of DenseMap's storage system: the buckets are not |
946 | // fully initialized. Thus we swap every key, but we may have |
947 | // a one-directional move of the value. |
948 | for (unsigned i = 0, e = InlineBuckets; i != e; ++i) { |
949 | BucketT *LHSB = &getInlineBuckets()[i], |
950 | *RHSB = &RHS.getInlineBuckets()[i]; |
951 | bool hasLHSValue = (!KeyInfoT::isEqual(LHSB->getFirst(), EmptyKey) && |
952 | !KeyInfoT::isEqual(LHSB->getFirst(), TombstoneKey)); |
953 | bool hasRHSValue = (!KeyInfoT::isEqual(RHSB->getFirst(), EmptyKey) && |
954 | !KeyInfoT::isEqual(RHSB->getFirst(), TombstoneKey)); |
955 | if (hasLHSValue && hasRHSValue) { |
956 | // Swap together if we can... |
957 | std::swap(*LHSB, *RHSB); |
958 | continue; |
959 | } |
960 | // Swap separately and handle any asymmetry. |
961 | std::swap(LHSB->getFirst(), RHSB->getFirst()); |
962 | if (hasLHSValue) { |
963 | ::new (&RHSB->getSecond()) ValueT(std::move(LHSB->getSecond())); |
964 | LHSB->getSecond().~ValueT(); |
965 | } else if (hasRHSValue) { |
966 | ::new (&LHSB->getSecond()) ValueT(std::move(RHSB->getSecond())); |
967 | RHSB->getSecond().~ValueT(); |
968 | } |
969 | } |
970 | return; |
971 | } |
972 | if (!Small && !RHS.Small) { |
973 | std::swap(getLargeRep()->Buckets, RHS.getLargeRep()->Buckets); |
974 | std::swap(getLargeRep()->NumBuckets, RHS.getLargeRep()->NumBuckets); |
975 | return; |
976 | } |
977 | |
978 | SmallDenseMap &SmallSide = Small ? *this : RHS; |
979 | SmallDenseMap &LargeSide = Small ? RHS : *this; |
980 | |
981 | // First stash the large side's rep and move the small side across. |
982 | LargeRep TmpRep = std::move(*LargeSide.getLargeRep()); |
983 | LargeSide.getLargeRep()->~LargeRep(); |
984 | LargeSide.Small = true; |
985 | // This is similar to the standard move-from-old-buckets, but the bucket |
986 | // count hasn't actually rotated in this case. So we have to carefully |
987 | // move construct the keys and values into their new locations, but there |
988 | // is no need to re-hash things. |
989 | for (unsigned i = 0, e = InlineBuckets; i != e; ++i) { |
990 | BucketT *NewB = &LargeSide.getInlineBuckets()[i], |
991 | *OldB = &SmallSide.getInlineBuckets()[i]; |
992 | ::new (&NewB->getFirst()) KeyT(std::move(OldB->getFirst())); |
993 | OldB->getFirst().~KeyT(); |
994 | if (!KeyInfoT::isEqual(NewB->getFirst(), EmptyKey) && |
995 | !KeyInfoT::isEqual(NewB->getFirst(), TombstoneKey)) { |
996 | ::new (&NewB->getSecond()) ValueT(std::move(OldB->getSecond())); |
997 | OldB->getSecond().~ValueT(); |
998 | } |
999 | } |
1000 | |
1001 | // The hard part of moving the small buckets across is done, just move |
1002 | // the TmpRep into its new home. |
1003 | SmallSide.Small = false; |
1004 | new (SmallSide.getLargeRep()) LargeRep(std::move(TmpRep)); |
1005 | } |
1006 | |
1007 | SmallDenseMap& operator=(const SmallDenseMap& other) { |
1008 | if (&other != this) |
1009 | copyFrom(other); |
1010 | return *this; |
1011 | } |
1012 | |
1013 | SmallDenseMap& operator=(SmallDenseMap &&other) { |
1014 | this->destroyAll(); |
1015 | deallocateBuckets(); |
1016 | init(0); |
1017 | swap(other); |
1018 | return *this; |
1019 | } |
1020 | |
1021 | void copyFrom(const SmallDenseMap& other) { |
1022 | this->destroyAll(); |
1023 | deallocateBuckets(); |
1024 | Small = true; |
1025 | if (other.getNumBuckets() > InlineBuckets) { |
1026 | Small = false; |
1027 | new (getLargeRep()) LargeRep(allocateBuckets(other.getNumBuckets())); |
1028 | } |
1029 | this->BaseT::copyFrom(other); |
1030 | } |
1031 | |
1032 | void init(unsigned InitBuckets) { |
1033 | Small = true; |
1034 | if (InitBuckets > InlineBuckets) { |
1035 | Small = false; |
1036 | new (getLargeRep()) LargeRep(allocateBuckets(InitBuckets)); |
1037 | } |
1038 | this->BaseT::initEmpty(); |
1039 | } |
1040 | |
1041 | void grow(unsigned AtLeast) { |
1042 | if (AtLeast > InlineBuckets) |
1043 | AtLeast = std::max<unsigned>(64, NextPowerOf2(AtLeast-1)); |
1044 | |
1045 | if (Small) { |
1046 | // First move the inline buckets into a temporary storage. |
1047 | AlignedCharArrayUnion<BucketT[InlineBuckets]> TmpStorage; |
1048 | BucketT *TmpBegin = reinterpret_cast<BucketT *>(&TmpStorage); |
1049 | BucketT *TmpEnd = TmpBegin; |
1050 | |
1051 | // Loop over the buckets, moving non-empty, non-tombstones into the |
1052 | // temporary storage. Have the loop move the TmpEnd forward as it goes. |
1053 | const KeyT EmptyKey = this->getEmptyKey(); |
1054 | const KeyT TombstoneKey = this->getTombstoneKey(); |
1055 | for (BucketT *P = getBuckets(), *E = P + InlineBuckets; P != E; ++P) { |
1056 | if (!KeyInfoT::isEqual(P->getFirst(), EmptyKey) && |
1057 | !KeyInfoT::isEqual(P->getFirst(), TombstoneKey)) { |
1058 |         assert(size_t(TmpEnd - TmpBegin) < InlineBuckets && |
1059 |                "Too many inline buckets!"); |
1060 | ::new (&TmpEnd->getFirst()) KeyT(std::move(P->getFirst())); |
1061 | ::new (&TmpEnd->getSecond()) ValueT(std::move(P->getSecond())); |
1062 | ++TmpEnd; |
1063 | P->getSecond().~ValueT(); |
1064 | } |
1065 | P->getFirst().~KeyT(); |
1066 | } |
1067 | |
1068 | // AtLeast == InlineBuckets can happen if there are many tombstones, |
1069 | // and grow() is used to remove them. Usually we switch to the |
1070 | // large rep here. |
1071 | if (AtLeast > InlineBuckets) { |
1072 | Small = false; |
1073 | new (getLargeRep()) LargeRep(allocateBuckets(AtLeast)); |
1074 | } |
1075 | this->moveFromOldBuckets(TmpBegin, TmpEnd); |
1076 | return; |
1077 | } |
1078 | |
1079 | LargeRep OldRep = std::move(*getLargeRep()); |
1080 | getLargeRep()->~LargeRep(); |
1081 | if (AtLeast <= InlineBuckets) { |
1082 | Small = true; |
1083 | } else { |
1084 | new (getLargeRep()) LargeRep(allocateBuckets(AtLeast)); |
1085 | } |
1086 | |
1087 | this->moveFromOldBuckets(OldRep.Buckets, OldRep.Buckets+OldRep.NumBuckets); |
1088 | |
1089 | // Free the old table. |
1090 | deallocate_buffer(OldRep.Buckets, sizeof(BucketT) * OldRep.NumBuckets, |
1091 | alignof(BucketT)); |
1092 | } |
1093 | |
1094 | void shrink_and_clear() { |
1095 | unsigned OldSize = this->size(); |
1096 | this->destroyAll(); |
1097 | |
1098 | // Reduce the number of buckets. |
1099 | unsigned NewNumBuckets = 0; |
1100 | if (OldSize) { |
1101 | NewNumBuckets = 1 << (Log2_32_Ceil(OldSize) + 1); |
1102 | if (NewNumBuckets > InlineBuckets && NewNumBuckets < 64u) |
1103 | NewNumBuckets = 64; |
1104 | } |
1105 | if ((Small && NewNumBuckets <= InlineBuckets) || |
1106 | (!Small && NewNumBuckets == getLargeRep()->NumBuckets)) { |
1107 | this->BaseT::initEmpty(); |
1108 | return; |
1109 | } |
1110 | |
1111 | deallocateBuckets(); |
1112 | init(NewNumBuckets); |
1113 | } |
1114 | |
1115 | private: |
1116 | unsigned getNumEntries() const { |
1117 | return NumEntries; |
1118 | } |
1119 | |
1120 | void setNumEntries(unsigned Num) { |
1121 | // NumEntries is hardcoded to be 31 bits wide. |
1122 | assert(Num < (1U << 31) && "Cannot support more than 1<<31 entries"); |
1123 | NumEntries = Num; |
1124 | } |
1125 | |
1126 | unsigned getNumTombstones() const { |
1127 | return NumTombstones; |
1128 | } |
1129 | |
1130 | void setNumTombstones(unsigned Num) { |
1131 | NumTombstones = Num; |
1132 | } |
1133 | |
1134 | const BucketT *getInlineBuckets() const { |
1135 | assert(Small); |
1136 | // Note that this cast does not violate aliasing rules as we assert that |
1137 | // the memory's dynamic type is the small, inline bucket buffer, and the |
1138 | // 'storage' is a POD containing a char buffer. |
1139 | return reinterpret_cast<const BucketT *>(&storage); |
1140 | } |
1141 | |
1142 | BucketT *getInlineBuckets() { |
1143 | return const_cast<BucketT *>( |
1144 | const_cast<const SmallDenseMap *>(this)->getInlineBuckets()); |
1145 | } |
1146 | |
1147 | const LargeRep *getLargeRep() const { |
1148 | assert(!Small); |
1149 | // Note, same rule about aliasing as with getInlineBuckets. |
1150 | return reinterpret_cast<const LargeRep *>(&storage); |
1151 | } |
1152 | |
1153 | LargeRep *getLargeRep() { |
1154 | return const_cast<LargeRep *>( |
1155 | const_cast<const SmallDenseMap *>(this)->getLargeRep()); |
1156 | } |
1157 | |
1158 | const BucketT *getBuckets() const { |
1159 | return Small ? getInlineBuckets() : getLargeRep()->Buckets; |
1160 | } |
1161 | |
1162 | BucketT *getBuckets() { |
1163 | return const_cast<BucketT *>( |
1164 | const_cast<const SmallDenseMap *>(this)->getBuckets()); |
1165 | } |
1166 | |
1167 | unsigned getNumBuckets() const { |
1168 | return Small ? InlineBuckets : getLargeRep()->NumBuckets; |
1169 | } |
1170 | |
1171 | void deallocateBuckets() { |
1172 | if (Small) |
1173 | return; |
1174 | |
1175 | deallocate_buffer(getLargeRep()->Buckets, |
1176 | sizeof(BucketT) * getLargeRep()->NumBuckets, |
1177 | alignof(BucketT)); |
1178 | getLargeRep()->~LargeRep(); |
1179 | } |
1180 | |
1181 | LargeRep allocateBuckets(unsigned Num) { |
1182 | assert(Num > InlineBuckets && "Must allocate more buckets than are inline"); |
1183 | LargeRep Rep = {static_cast<BucketT *>(allocate_buffer( |
1184 | sizeof(BucketT) * Num, alignof(BucketT))), |
1185 | Num}; |
1186 | return Rep; |
1187 | } |
1188 | }; |
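// --- Editorial illustration (not part of this header) ----------------------
// A usage sketch for SmallDenseMap: with 4 inline buckets the first entries
// live in the in-object storage, and inserting past the load-factor
// threshold transparently moves the table to a heap-allocated large rep.
// The function name is hypothetical.
inline unsigned smallDenseMapUsageSketch() {
  SmallDenseMap<unsigned, unsigned, 4> M; // 4 buckets stored inline
  for (unsigned I = 0; I < 16; ++I)       // forces a switch to the large rep
    M[I] = I * 2;                         // operator[] default-constructs slots

  unsigned Hits = 0;
  for (unsigned I = 0; I < 16; ++I)
    Hits += M.count(I);                   // count() is 0 or 1 per key
  return Hits;                            // expected to be 16
}
// ----------------------------------------------------------------------------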
1189 | |
1190 | template <typename KeyT, typename ValueT, typename KeyInfoT, typename Bucket, |
1191 | bool IsConst> |
1192 | class DenseMapIterator : DebugEpochBase::HandleBase { |
1193 | friend class DenseMapIterator<KeyT, ValueT, KeyInfoT, Bucket, true>; |
1194 | friend class DenseMapIterator<KeyT, ValueT, KeyInfoT, Bucket, false>; |
1195 | |
1196 | public: |
1197 | using difference_type = ptrdiff_t; |
1198 | using value_type = |
1199 | typename std::conditional<IsConst, const Bucket, Bucket>::type; |
1200 | using pointer = value_type *; |
1201 | using reference = value_type &; |
1202 | using iterator_category = std::forward_iterator_tag; |
1203 | |
1204 | private: |
1205 | pointer Ptr = nullptr; |
1206 | pointer End = nullptr; |
1207 | |
1208 | public: |
1209 | DenseMapIterator() = default; |
1210 | |
1211 | DenseMapIterator(pointer Pos, pointer E, const DebugEpochBase &Epoch, |
1212 | bool NoAdvance = false) |
1213 | : DebugEpochBase::HandleBase(&Epoch), Ptr(Pos), End(E) { |
1214 | assert(isHandleInSync() && "invalid construction!")((void)0); |
1215 | |
1216 | if (NoAdvance) return; |
1217 | if (shouldReverseIterate<KeyT>()) { |
1218 | RetreatPastEmptyBuckets(); |
1219 | return; |
1220 | } |
1221 | AdvancePastEmptyBuckets(); |
1222 | } |
1223 | |
1224 | // Converting ctor from non-const iterators to const iterators. SFINAE'd out |
1225 | // for const iterator destinations so it doesn't end up as a user defined copy |
1226 | // constructor. |
1227 | template <bool IsConstSrc, |
1228 | typename = std::enable_if_t<!IsConstSrc && IsConst>> |
1229 | DenseMapIterator( |
1230 | const DenseMapIterator<KeyT, ValueT, KeyInfoT, Bucket, IsConstSrc> &I) |
1231 | : DebugEpochBase::HandleBase(I), Ptr(I.Ptr), End(I.End) {} |
1232 | |
1233 | reference operator*() const { |
1234 | assert(isHandleInSync() && "invalid iterator access!"); |
1235 | assert(Ptr != End && "dereferencing end() iterator"); |
1236 | if (shouldReverseIterate<KeyT>()) |
1237 | return Ptr[-1]; |
1238 | return *Ptr; |
1239 | } |
1240 | pointer operator->() const { |
1241 | assert(isHandleInSync() && "invalid iterator access!"); |
1242 | assert(Ptr != End && "dereferencing end() iterator"); |
1243 | if (shouldReverseIterate<KeyT>()) |
1244 | return &(Ptr[-1]); |
1245 | return Ptr; |
1246 | } |
1247 | |
1248 | friend bool operator==(const DenseMapIterator &LHS, |
1249 | const DenseMapIterator &RHS) { |
1250 | assert((!LHS.Ptr || LHS.isHandleInSync()) && "handle not in sync!"); |
1251 | assert((!RHS.Ptr || RHS.isHandleInSync()) && "handle not in sync!"); |
1252 | assert(LHS.getEpochAddress() == RHS.getEpochAddress() && |
1253 |        "comparing incomparable iterators!"); |
1254 | return LHS.Ptr == RHS.Ptr; |
1255 | } |
1256 | |
1257 | friend bool operator!=(const DenseMapIterator &LHS, |
1258 | const DenseMapIterator &RHS) { |
1259 | return !(LHS == RHS); |
1260 | } |
1261 | |
1262 | inline DenseMapIterator& operator++() { // Preincrement |
1263 | assert(isHandleInSync() && "invalid iterator access!"); |
1264 | assert(Ptr != End && "incrementing end() iterator"); |
1265 | if (shouldReverseIterate<KeyT>()) { |
1266 | --Ptr; |
1267 | RetreatPastEmptyBuckets(); |
1268 | return *this; |
1269 | } |
1270 | ++Ptr; |
1271 | AdvancePastEmptyBuckets(); |
1272 | return *this; |
1273 | } |
1274 | DenseMapIterator operator++(int) { // Postincrement |
1275 | assert(isHandleInSync() && "invalid iterator access!"); |
1276 | DenseMapIterator tmp = *this; ++*this; return tmp; |
1277 | } |
1278 | |
1279 | private: |
1280 | void AdvancePastEmptyBuckets() { |
1281 | assert(Ptr <= End); |
1282 | const KeyT Empty = KeyInfoT::getEmptyKey(); |
1283 | const KeyT Tombstone = KeyInfoT::getTombstoneKey(); |
1284 | |
1285 | while (Ptr != End && (KeyInfoT::isEqual(Ptr->getFirst(), Empty) || |
1286 | KeyInfoT::isEqual(Ptr->getFirst(), Tombstone))) |
1287 | ++Ptr; |
1288 | } |
1289 | |
1290 | void RetreatPastEmptyBuckets() { |
1291 | assert(Ptr >= End); |
1292 | const KeyT Empty = KeyInfoT::getEmptyKey(); |
1293 | const KeyT Tombstone = KeyInfoT::getTombstoneKey(); |
1294 | |
1295 | while (Ptr != End && (KeyInfoT::isEqual(Ptr[-1].getFirst(), Empty) || |
1296 | KeyInfoT::isEqual(Ptr[-1].getFirst(), Tombstone))) |
1297 | --Ptr; |
1298 | } |
1299 | }; |
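// --- Editorial illustration (not part of this header) ----------------------
// DenseMapIterator walks the raw bucket array and skips empty and tombstone
// buckets, so iteration order is unspecified and unrelated to insertion
// order. A hedged sketch of summing values with a range-for (the function
// name is hypothetical; begin()/end() come from DenseMapBase):
inline int denseMapIterationSketch(const DenseMap<int, int> &M) {
  int Sum = 0;
  for (const auto &KV : M)   // const_iterator advances past empty/tombstone
    Sum += KV.second;        // only occupied buckets are visited
  return Sum;
}
// ----------------------------------------------------------------------------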
1300 | |
1301 | template <typename KeyT, typename ValueT, typename KeyInfoT> |
1302 | inline size_t capacity_in_bytes(const DenseMap<KeyT, ValueT, KeyInfoT> &X) { |
1303 | return X.getMemorySize(); |
1304 | } |
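// --- Editorial illustration (not part of this header) ----------------------
// capacity_in_bytes simply forwards to getMemorySize(), i.e. the bucket
// array only (number of buckets * sizeof(BucketT)); heap memory owned by the
// keys or values themselves is not included. The function name below is
// hypothetical.
inline size_t denseMapFootprintSketch(const DenseMap<int, int> &M) {
  return capacity_in_bytes(M); // raw bucket storage of the map
}
// ----------------------------------------------------------------------------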
1305 | |
1306 | } // end namespace llvm |
1307 | |
1308 | #endif // LLVM_ADT_DENSEMAP_H |