doxygen/HexagonTargetTransformInfo_8cpp_source.html

//===- HexagonTargetTransformInfo.cpp - Hexagon specific TTI pass ---------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

/// \file

/// This file implements a TargetTransformInfo analysis pass specific to the

/// Hexagon target machine. It uses the target's detailed information to provide

/// more precise answers to certain TTI queries, while letting the target

/// independent and default TTI implementations handle the rest.

///

//===----------------------------------------------------------------------===//


#include "HexagonTargetTransformInfo.h"

#include "HexagonSubtarget.h"

#include "llvm/Analysis/TargetTransformInfo.h"

#include "llvm/CodeGen/ValueTypes.h"

#include "llvm/IR/InstrTypes.h"

#include "llvm/IR/Instructions.h"

#include "llvm/IR/User.h"

#include "llvm/Support/Casting.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Transforms/Utils/LoopPeel.h"

#include "llvm/Transforms/Utils/UnrollLoop.h"


using namespace llvm;


#define DEBUG_TYPE "hexagontti"


// Hidden command-line switch, off by default. useHVX() requires it to be set
// in addition to the subtarget reporting HVX ops.
static cl::opt<bool>
    HexagonAutoHVX("hexagon-autohvx",
                   cl::desc("Enable loop vectorizer for HVX"), cl::Hidden,
                   cl::init(false));


// Hidden command-line switch, off by default. isLegalMaskedGather() and
// isLegalMaskedScatter() report "not legal" unless it is set. Deliberately
// not 'static', so the symbol keeps external linkage.
cl::opt<bool> HexagonAllowScatterGatherHVX(
    "hexagon-allow-scatter-gather-hvx",
    cl::desc("Allow auto-generation of HVX scatter-gather"), cl::Hidden,
    cl::init(false));


// Hidden command-line switch. isHVXVectorType() consults it to decide whether
// floating point vectors count as HVX types when only the V68 HVX ops are
// available.
static cl::opt<bool> EnableV68FloatAutoHVX(
    "force-hvx-float", cl::Hidden,
    cl::desc("Enable auto-vectorization of floating point types on v68."));


// Hidden command-line switch, on by default. Its value is returned verbatim
// by shouldBuildLookupTables().
static cl::opt<bool> EmitLookupTables(
    "hexagon-emit-lookup-tables",
    cl::desc("Control lookup table emission on Hexagon target"), cl::Hidden,
    cl::init(true));


// Hidden command-line switch, on by default. isLegalMaskedLoad() and
// isLegalMaskedStore() report "not legal" when it is cleared.
static cl::opt<bool>
    HexagonMaskedVMem("hexagon-masked-vmem",
                      cl::desc("Enable masked loads/stores for HVX"),
                      cl::Hidden, cl::init(true));


// Fixed multiplier that makes floating point operations look more expensive
// to the vectorization cost model. It is a crude stand-in; ideally the cost
// would be expressed in cycles instead.
static constexpr unsigned FloatFactor = 4;


// Reports whether HVX should be used by the queries in this file: the
// subtarget must report HVX ops and the -hexagon-autohvx option must be set.
bool HexagonTTIImpl::useHVX() const {
  if (!ST.useHVXOps())
    return false;
  return HexagonAutoHVX;
}


// Decides whether Ty should be treated as an HVX vector type.
//
// Ty must be a vector type that the subtarget accepts for HVX. Vectors with a
// non-floating-point element type, and any accepted vector when the V69 HVX
// ops are available, qualify immediately. Floating point vectors otherwise
// qualify only with the V68 HVX ops and the -force-hvx-float option.
bool HexagonTTIImpl::isHVXVectorType(Type *Ty) const {
  auto *Vec = dyn_cast<VectorType>(Ty);
  if (Vec == nullptr)
    return false;
  if (!ST.isTypeForHVX(Vec))
    return false;

  if (ST.useHVXV69Ops())
    return true;
  if (!Vec->getElementType()->isFloatingPointTy())
    return true;

  // Floating point elements without V69: require V68 plus the explicit flag.
  if (!ST.useHVXV68Ops())
    return false;
  return EnableV68FloatAutoHVX;
}


// Returns the element count of a fixed-width vector type, or 1 for anything
// else. Non-vector inputs are asserted to be integer or floating point
// scalars.
unsigned HexagonTTIImpl::getTypeNumElements(Type *Ty) const {
  auto *FixedVec = dyn_cast<FixedVectorType>(Ty);
  if (!FixedVec) {
    assert((Ty->isIntegerTy() || Ty->isFloatingPointTy()) &&
           "Expecting scalar type");
    return 1;
  }
  return FixedVec->getNumElements();
}


// Population count is always reported as fast hardware, independent of the
// requested width: every input narrower than 64 bits will be promoted to
// 64 bits.
TargetTransformInfo::PopcntSupportKind
HexagonTTIImpl::getPopcntSupport(unsigned IntTyWidthInBit) const {
  const TargetTransformInfo::PopcntSupportKind Support =
      TargetTransformInfo::PSK_FastHardware;
  return Support;
}


// Hexagon is able to unroll loops whose trip count is only known at run time,
// so both partial and runtime unrolling are switched on. No other field of UP
// is touched, and L, SE and ORE are not consulted.
void HexagonTTIImpl::getUnrollingPreferences(
    Loop *L, ScalarEvolution &SE, TTI::UnrollingPreferences &UP,
    OptimizationRemarkEmitter *ORE) const {
  UP.Partial = true;
  UP.Runtime = true;
}


// Starts from the base-class peeling preferences, then requests a peel count
// of 2 for innermost, peelable loops whose exact trip count is not a known
// small constant (reported as 0) but whose maximum trip count is known to lie
// in the range 1..5.
void HexagonTTIImpl::getPeelingPreferences(Loop *L, ScalarEvolution &SE,
                                           TTI::PeelingPreferences &PP) const {
  BaseT::getPeelingPreferences(L, SE, PP);

  // Only try to peel innermost loops with small runtime trip counts.
  if (!L || !L->isInnermost() || !canPeel(L))
    return;
  if (SE.getSmallConstantTripCount(L) != 0)
    return;

  const unsigned MaxTripCount = SE.getSmallConstantMaxTripCount(L);
  if (MaxTripCount > 0 && MaxTripCount <= 5)
    PP.PeelCount = 2;
}


// Always asks for post-indexed addressing; neither the loop nor the scalar
// evolution analysis is inspected.
TTI::AddressingModeKind
HexagonTTIImpl::getPreferredAddressingMode(const Loop *L,
                                           ScalarEvolution *SE) const {
  const TTI::AddressingModeKind Preferred = TTI::AMK_PostIndexed;
  return Preferred;
}


// --- Vector TTI begin ---


// Returns the number of registers in the given register class. Class ID 1 is
// treated as the vector class: 32 registers when HVX is in use, none
// otherwise. Every other class ID reports 32 registers.
unsigned HexagonTTIImpl::getNumberOfRegisters(unsigned ClassID) const {
  if (ClassID != 1)
    return 32;
  if (useHVX())
    return 32;
  return 0;
}


// Maximum interleave factor: 2 when HVX is in use, 1 otherwise. The
// vectorization factor VF is not taken into account.
unsigned HexagonTTIImpl::getMaxInterleaveFactor(ElementCount VF) const {
  if (useHVX())
    return 2;
  return 1;
}


// Returns the register width in bits for the requested register kind:
//  - scalar registers are a fixed 32 bits,
//  - fixed-width vector registers use getMinVectorRegisterBitWidth(),
//  - scalable vector registers are reported with a scalable size of 0.
TypeSize
HexagonTTIImpl::getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const {
  if (K == TargetTransformInfo::RGK_Scalar)
    return TypeSize::getFixed(32);
  if (K == TargetTransformInfo::RGK_FixedWidthVector)
    return TypeSize::getFixed(getMinVectorRegisterBitWidth());
  if (K == TargetTransformInfo::RGK_ScalableVector)
    return TypeSize::getScalable(0);

  llvm_unreachable("Unsupported register kind");
}


// Minimum vector register width in bits: eight times the subtarget's vector
// length when HVX is in use, otherwise 32.
unsigned HexagonTTIImpl::getMinVectorRegisterBitWidth() const {
  if (!useHVX())
    return 32;
  return ST.getVectorLength() * 8;
}


// Minimum vectorization factor for elements of ElemWidth bits: the number of
// such elements that fit in 8 * ST.getVectorLength() bits. Scalable VFs are
// rejected by assertion.
ElementCount HexagonTTIImpl::getMinimumVF(unsigned ElemWidth,
                                          bool IsScalable) const {
  assert(!IsScalable && "Scalable VFs are not supported for Hexagon");
  const auto VectorBits = 8 * ST.getVectorLength();
  return ElementCount::getFixed(VectorBits / ElemWidth);
}


// Cost of a call instruction. No Hexagon-specific adjustment is made; the
// query is forwarded unchanged to the base implementation.
InstructionCost
HexagonTTIImpl::getCallInstrCost(Function *F, Type *RetTy, ArrayRef<Type *> Tys,
                                 TTI::TargetCostKind CostKind) const {
  InstructionCost BaseCost = BaseT::getCallInstrCost(F, RetTy, Tys, CostKind);
  return BaseCost;
}


// Cost of an intrinsic call. Only bswap is special-cased: its cost is the
// legalization cost of the return type plus 2. Every other intrinsic is
// handled by the base implementation.
InstructionCost
HexagonTTIImpl::getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA,
                                      TTI::TargetCostKind CostKind) const {
  if (ICA.getID() != Intrinsic::bswap)
    return BaseT::getIntrinsicInstrCost(ICA, CostKind);

  std::pair<InstructionCost, MVT> Legalized =
      getTypeLegalizationCost(ICA.getReturnType());
  return Legalized.first + 2;
}


// Address computation is always reported as free (cost 0); none of the
// arguments are inspected.
InstructionCost
HexagonTTIImpl::getAddressComputationCost(Type *PtrTy, ScalarEvolution *SE,
                                          const SCEV *S,
                                          TTI::TargetCostKind CostKind) const {
  const InstructionCost Free = 0;
  return Free;
}


// Cost of a load or store of type Src with the given alignment.
//
//  - Any cost kind other than reciprocal throughput yields 1.
//  - Stores and non-vector loads are delegated to the base implementation.
//  - HVX vector loads cost one unit per vector register when the type is a
//    whole multiple of the register width; otherwise the vector is assumed
//    to be built from alignment-sized loads, at 3 units per load.
//  - Non-HVX vector loads are split into loads no wider than 8 bytes.
//    Floating point element types are scaled by FloatFactor, and loads
//    narrower than 4 bytes are penalized for the inserts needed to compose
//    the vector.
//
// Opcode must be Instruction::Load or Instruction::Store (asserted).
InstructionCost HexagonTTIImpl::getMemoryOpCost(unsigned Opcode, Type *Src,
                                                Align Alignment,
                                                unsigned AddressSpace,
                                                TTI::TargetCostKind CostKind,
                                                TTI::OperandValueInfo OpInfo,
                                                const Instruction *I) const {
  assert(Opcode == Instruction::Load || Opcode == Instruction::Store);
  // TODO: Handle other cost kinds.
  if (CostKind != TTI::TCK_RecipThroughput)
    return 1;

  if (Opcode == Instruction::Store)
    return BaseT::getMemoryOpCost(Opcode, Src, Alignment, AddressSpace,
                                  CostKind, OpInfo, I);

  if (Src->isVectorTy()) {
    VectorType *VecTy = cast<VectorType>(Src);
    unsigned VecWidth = VecTy->getPrimitiveSizeInBits().getFixedValue();
    if (isHVXVectorType(VecTy)) {
      unsigned RegWidth =
          getRegisterBitWidth(TargetTransformInfo::RGK_FixedWidthVector)
              .getFixedValue();
      assert(RegWidth && "Non-zero vector register width expected");
      // Cost of HVX loads.
      if (VecWidth % RegWidth == 0)
        return VecWidth / RegWidth;
      // Cost of constructing HVX vector from scalar loads. Alignment beyond
      // the register size gives no further benefit, so clamp it.
      const Align RegAlign(RegWidth / 8);
      if (Alignment > RegAlign)
        Alignment = RegAlign;
      unsigned AlignWidth = 8 * Alignment.value();
      unsigned NumLoads = alignTo(VecWidth, AlignWidth) / AlignWidth;
      return 3 * NumLoads;
    }

    // Non-HVX vectors.
    // Add extra cost for floating point types.
    unsigned Cost =
        VecTy->getElementType()->isFloatingPointTy() ? FloatFactor : 1;

    // At this point unspecified alignment is considered as Align(1).
    // Individual loads are at most 8 bytes wide, so cap the alignment there.
    const Align BoundAlignment = std::min(Alignment, Align(8));
    unsigned AlignWidth = 8 * BoundAlignment.value();
    unsigned NumLoads = alignTo(VecWidth, AlignWidth) / AlignWidth;
    // Test the clamped alignment, not the raw one: with the raw value an
    // alignment of 16 or more would skip this return and fall through to the
    // formula below with LogA == 3, producing a cost of 0.
    if (BoundAlignment >= Align(4))
      return Cost * NumLoads;
    // Loads of less than 32 bits will need extra inserts to compose a vector.
    assert(BoundAlignment <= Align(8));
    unsigned LogA = Log2(BoundAlignment);
    return (3 - LogA) * Cost * NumLoads;
  }

  return BaseT::getMemoryOpCost(Opcode, Src, Alignment, AddressSpace, CostKind,
                                OpInfo, I);
}


// Cost of a masked load or store. No Hexagon-specific adjustment is made;
// the query is forwarded unchanged to the base implementation.
InstructionCost
HexagonTTIImpl::getMaskedMemoryOpCost(unsigned Opcode, Type *Src,
                                      Align Alignment, unsigned AddressSpace,
                                      TTI::TargetCostKind CostKind) const {
  InstructionCost BaseCost = BaseT::getMaskedMemoryOpCost(
      Opcode, Src, Alignment, AddressSpace, CostKind);
  return BaseCost;
}


// Every shuffle is given a flat cost of 1, regardless of kind, types, mask
// or context.
InstructionCost
HexagonTTIImpl::getShuffleCost(TTI::ShuffleKind Kind, VectorType *DstTy,
                               VectorType *SrcTy, ArrayRef<int> Mask,
                               TTI::TargetCostKind CostKind, int Index,
                               VectorType *SubTp, ArrayRef<const Value *> Args,
                               const Instruction *CxtI) const {
  const InstructionCost FlatCost = 1;
  return FlatCost;
}


// Cost of a gather or scatter. No Hexagon-specific adjustment is made; the
// query is forwarded unchanged to the base implementation.
InstructionCost HexagonTTIImpl::getGatherScatterOpCost(
    unsigned Opcode, Type *DataTy, const Value *Ptr, bool VariableMask,
    Align Alignment, TTI::TargetCostKind CostKind, const Instruction *I) const {
  InstructionCost BaseCost = BaseT::getGatherScatterOpCost(
      Opcode, DataTy, Ptr, VariableMask, Alignment, CostKind, I);
  return BaseCost;
}


// Cost of an interleaved memory access. When every member of the group is
// used (Indices.size() == Factor) and no masking is requested, the access is
// costed as a plain memory operation on VecTy. All other cases go to the
// base implementation.
InstructionCost HexagonTTIImpl::getInterleavedMemoryOpCost(
    unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef<unsigned> Indices,
    Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind,
    bool UseMaskForCond, bool UseMaskForGaps) const {
  const bool AllMembersUsed = Indices.size() == Factor;
  const bool NeedsMask = UseMaskForCond || UseMaskForGaps;

  if (AllMembersUsed && !NeedsMask)
    return getMemoryOpCost(Opcode, VecTy, Alignment, AddressSpace, CostKind);

  return BaseT::getInterleavedMemoryOpCost(Opcode, VecTy, Factor, Indices,
                                           Alignment, AddressSpace, CostKind,
                                           UseMaskForCond, UseMaskForGaps);
}


// Cost of a compare or select.
//
// Only vector types under the reciprocal-throughput cost kind are handled
// here: floating point vectors that are not HVX types get the maximum cost,
// and vector FCmp costs the type legalization cost plus FloatFactor per
// element. Everything else is delegated to the base implementation.
InstructionCost HexagonTTIImpl::getCmpSelInstrCost(
    unsigned Opcode, Type *ValTy, Type *CondTy, CmpInst::Predicate VecPred,
    TTI::TargetCostKind CostKind, TTI::OperandValueInfo Op1Info,
    TTI::OperandValueInfo Op2Info, const Instruction *I) const {
  const bool IsVectorThroughput =
      ValTy->isVectorTy() && CostKind == TTI::TCK_RecipThroughput;

  if (IsVectorThroughput) {
    const bool IsNonHVXFloat =
        !isHVXVectorType(ValTy) && ValTy->isFPOrFPVectorTy();
    if (IsNonHVXFloat)
      return InstructionCost::getMax();

    std::pair<InstructionCost, MVT> Legalized = getTypeLegalizationCost(ValTy);
    if (Opcode == Instruction::FCmp) {
      const unsigned NumElts = getTypeNumElements(ValTy);
      return Legalized.first + FloatFactor * NumElts;
    }
  }

  return BaseT::getCmpSelInstrCost(Opcode, ValTy, CondTy, VecPred, CostKind,
                                   Op1Info, Op2Info, I);
}


// Cost of an arithmetic instruction.
//
// Under the reciprocal-throughput cost kind, floating point vectors that are
// not HVX types get the maximum cost, and vectors whose legalized type is
// floating point cost the legalization cost plus FloatFactor per element.
// All remaining cases, including every other cost kind, are delegated to the
// base implementation.
InstructionCost HexagonTTIImpl::getArithmeticInstrCost(
    unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind,
    TTI::OperandValueInfo Op1Info, TTI::OperandValueInfo Op2Info,
    ArrayRef<const Value *> Args, const Instruction *CxtI) const {
  // TODO: Handle more cost kinds.
  const bool IsThroughput = CostKind == TTI::TCK_RecipThroughput;

  if (IsThroughput && Ty->isVectorTy()) {
    const bool IsNonHVXFloat = !isHVXVectorType(Ty) && Ty->isFPOrFPVectorTy();
    if (IsNonHVXFloat)
      return InstructionCost::getMax();

    std::pair<InstructionCost, MVT> Legalized = getTypeLegalizationCost(Ty);
    if (Legalized.second.isFloatingPoint()) {
      const unsigned NumElts = getTypeNumElements(Ty);
      return Legalized.first + FloatFactor * NumElts;
    }
  }

  return BaseT::getArithmeticInstrCost(Opcode, Ty, CostKind, Op1Info, Op2Info,
                                       Args, CxtI);
}


// Cost of a cast from SrcTy to DstTy.
//
//  - If either side is a floating point vector that is not an HVX type, the
//    maximum cost is returned.
//  - If neither side involves floating point, the cost is 1.
//  - Otherwise the cost is the larger of the two legalization costs plus
//    FloatFactor for each floating point element on either side. For cost
//    kinds other than reciprocal throughput this collapses to 0 or 1.
InstructionCost HexagonTTIImpl::getCastInstrCost(unsigned Opcode, Type *DstTy,
                                                 Type *SrcTy,
                                                 TTI::CastContextHint CCH,
                                                 TTI::TargetCostKind CostKind,
                                                 const Instruction *I) const {
  auto IsFloatVectorOutsideHVX = [this](Type *T) {
    return T->isVectorTy() && !isHVXVectorType(T) && T->isFPOrFPVectorTy();
  };
  if (IsFloatVectorOutsideHVX(SrcTy) || IsFloatVectorOutsideHVX(DstTy))
    return InstructionCost::getMax();

  if (!SrcTy->isFPOrFPVectorTy() && !DstTy->isFPOrFPVectorTy())
    return 1;

  // Count only the floating point elements on each side of the cast.
  unsigned SrcFloatElts = 0;
  if (SrcTy->isFPOrFPVectorTy())
    SrcFloatElts = getTypeNumElements(SrcTy);
  unsigned DstFloatElts = 0;
  if (DstTy->isFPOrFPVectorTy())
    DstFloatElts = getTypeNumElements(DstTy);

  std::pair<InstructionCost, MVT> SrcLegal = getTypeLegalizationCost(SrcTy);
  std::pair<InstructionCost, MVT> DstLegal = getTypeLegalizationCost(DstTy);
  InstructionCost Total = std::max(SrcLegal.first, DstLegal.first) +
                          FloatFactor * (SrcFloatElts + DstFloatElts);

  // TODO: Allow non-throughput costs that aren't binary.
  if (CostKind == TTI::TCK_RecipThroughput)
    return Total;
  if (Total == 0)
    return 0;
  return 1;
}


// Cost of inserting into or extracting from a vector.
//
//  - ExtractElement costs 2.
//  - InsertElement costs 2 for a non-zero index (two rotations) and 0 for
//    index zero; unless the element type is i32, the cost of an
//    ExtractElement is added on top.
//  - Any other opcode costs 1.
InstructionCost HexagonTTIImpl::getVectorInstrCost(unsigned Opcode, Type *Val,
                                                   TTI::TargetCostKind CostKind,
                                                   unsigned Index,
                                                   const Value *Op0,
                                                   const Value *Op1) const {
  if (Opcode == Instruction::ExtractElement)
    return 2;

  if (Opcode != Instruction::InsertElement)
    return 1;

  Type *ScalarTy = Val;
  if (Val->isVectorTy())
    ScalarTy = cast<VectorType>(Val)->getElementType();

  // Need two rotations for non-zero index.
  unsigned RotateCost = 0;
  if (Index != 0)
    RotateCost = 2;

  if (ScalarTy->isIntegerTy(32))
    return RotateCost;

  // If it's not a 32-bit value, there will need to be an extract.
  return RotateCost + getVectorInstrCost(Instruction::ExtractElement, Val,
                                         CostKind, Index, Op0, Op1);
}


// A masked store is legal when -hexagon-masked-vmem is enabled and the
// subtarget accepts DataType for HVX. Alignment and address space are
// ignored.
bool HexagonTTIImpl::isLegalMaskedStore(Type *DataType, Align /*Alignment*/,
                                        unsigned /*AddressSpace*/) const {
  // This function is called from scalarize-masked-mem-intrin, which runs
  // in pre-isel. Use ST directly instead of calling isHVXVectorType.
  if (!HexagonMaskedVMem)
    return false;
  return ST.isTypeForHVX(DataType);
}


// A masked load is legal when -hexagon-masked-vmem is enabled and the
// subtarget accepts DataType for HVX. Alignment and address space are
// ignored.
bool HexagonTTIImpl::isLegalMaskedLoad(Type *DataType, Align /*Alignment*/,
                                       unsigned /*AddressSpace*/) const {
  // This function is called from scalarize-masked-mem-intrin, which runs
  // in pre-isel. Use ST directly instead of calling isHVXVectorType.
  if (!HexagonMaskedVMem)
    return false;
  return ST.isTypeForHVX(DataType);
}


// Reports whether a masked gather of type Ty with the given alignment is
// legal. Ty must be a vector type accepted for HVX and the
// -hexagon-allow-scatter-gather-hvx option must be set. Accepted shapes:
//  - 8-bit elements:  128 elements, any alignment;
//  - 16-bit elements: 64 or 32 elements, alignment of at least 2;
//  - 32-bit elements: 32 elements, alignment of at least 4.
bool HexagonTTIImpl::isLegalMaskedGather(Type *Ty, Align Alignment) const {
  // For now assume we can not deal with all HVX datatypes.
  if (!Ty->isVectorTy())
    return false;
  if (!ST.isTypeForHVX(Ty))
    return false;
  if (!HexagonAllowScatterGatherHVX)
    return false;

  // This must be in sync with HexagonVectorCombine pass.
  const unsigned ElemBits = Ty->getScalarSizeInBits();
  if (ElemBits == 8)
    return getTypeNumElements(Ty) == 128;

  if (ElemBits == 16) {
    const bool ShapeOk =
        getTypeNumElements(Ty) == 64 || getTypeNumElements(Ty) == 32;
    return ShapeOk && (Alignment >= 2);
  }

  if (ElemBits == 32)
    return getTypeNumElements(Ty) == 32 && (Alignment >= 4);

  return false;
}


// Reports whether a masked scatter of type Ty with the given alignment is
// legal. Ty must be a vector type accepted for HVX and the
// -hexagon-allow-scatter-gather-hvx option must be set. Accepted shapes:
//  - 8-bit elements:  128 elements, any alignment;
//  - 16-bit elements: 64 elements, alignment of at least 2;
//  - 32-bit elements: 32 elements, alignment of at least 4.
bool HexagonTTIImpl::isLegalMaskedScatter(Type *Ty, Align Alignment) const {
  if (!Ty->isVectorTy())
    return false;
  if (!ST.isTypeForHVX(Ty))
    return false;
  if (!HexagonAllowScatterGatherHVX)
    return false;

  // This must be in sync with HexagonVectorCombine pass.
  const unsigned ElemBits = Ty->getScalarSizeInBits();
  if (ElemBits == 8)
    return getTypeNumElements(Ty) == 128;

  if (ElemBits == 16)
    return getTypeNumElements(Ty) == 64 && (Alignment >= 2);

  if (ElemBits == 32)
    return getTypeNumElements(Ty) == 32 && (Alignment >= 4);

  return false;
}


// A masked gather must be scalarized exactly when isLegalMaskedGather()
// rejects the type/alignment combination.
bool HexagonTTIImpl::forceScalarizeMaskedGather(VectorType *VTy,
                                                Align Alignment) const {
  const bool IsLegal = isLegalMaskedGather(VTy, Alignment);
  return !IsLegal;
}


// A masked scatter must be scalarized exactly when isLegalMaskedScatter()
// rejects the type/alignment combination.
bool HexagonTTIImpl::forceScalarizeMaskedScatter(VectorType *VTy,
                                                 Align Alignment) const {
  const bool IsLegal = isLegalMaskedScatter(VTy, Alignment);
  return !IsLegal;
}


// --- Vector TTI end ---


// Prefetch distance, taken directly from the subtarget's L1 prefetch
// distance.
unsigned HexagonTTIImpl::getPrefetchDistance() const {
  const unsigned Distance = ST.getL1PrefetchDistance();
  return Distance;
}


// Cache line size, taken directly from the subtarget's L1 cache line size.
unsigned HexagonTTIImpl::getCacheLineSize() const {
  const unsigned LineSize = ST.getL1CacheLineSize();
  return LineSize;
}


// Cost of an arbitrary user. An integer cast that widens a narrower value to
// 32 bits, and whose operand is a load with a single use, is reported as
// free because the extension can be folded into the load. Everything else is
// delegated to the base implementation.
InstructionCost
HexagonTTIImpl::getInstructionCost(const User *U,
                                   ArrayRef<const Value *> Operands,
                                   TTI::TargetCostKind CostKind) const {
  auto FoldsIntoLoad = [this](const CastInst *Cast) -> bool {
    if (!Cast->isIntegerCast())
      return false;

    // Only extensions from an integer type shorter than 32-bit to i32
    // can be folded into the load.
    const DataLayout &Layout = getDataLayout();
    unsigned SrcBits = Layout.getTypeSizeInBits(Cast->getSrcTy());
    unsigned DstBits = Layout.getTypeSizeInBits(Cast->getDestTy());
    if (DstBits != 32)
      return false;
    if (SrcBits >= DstBits)
      return false;

    // Technically, this code could allow multiple uses of the load, and
    // check if all the uses are the same extension operation, but this
    // should be sufficient for most cases.
    const LoadInst *Load = dyn_cast<const LoadInst>(Cast->getOperand(0));
    if (!Load)
      return false;
    return Load->hasOneUse();
  };

  const CastInst *Cast = dyn_cast<const CastInst>(U);
  if (Cast && FoldsIntoLoad(Cast))
    return TargetTransformInfo::TCC_Free;

  return BaseT::getInstructionCost(U, Operands, CostKind);
}


// Lookup table emission is governed solely by the
// -hexagon-emit-lookup-tables option.
bool HexagonTTIImpl::shouldBuildLookupTables() const {
  const bool Enabled = EmitLookupTables;
  return Enabled;
}


assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

Casting.h

CommandLine.h

CostKind
static cl::opt< OutputCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(OutputCostKind::RecipThroughput), cl::values(clEnumValN(OutputCostKind::RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(OutputCostKind::Latency, "latency", "Instruction latency"), clEnumValN(OutputCostKind::CodeSize, "code-size", "Code size"), clEnumValN(OutputCostKind::SizeAndLatency, "size-latency", "Code size and latency"), clEnumValN(OutputCostKind::All, "all", "Print all cost kinds")))

HexagonSubtarget.h

FloatFactor
static const unsigned FloatFactor
Definition HexagonTargetTransformInfo.cpp:52

EnableV68FloatAutoHVX
static cl::opt< bool > EnableV68FloatAutoHVX("force-hvx-float", cl::Hidden, cl::desc("Enable auto-vectorization of floatint point types on v68."))

HexagonAllowScatterGatherHVX
cl::opt< bool > HexagonAllowScatterGatherHVX("hexagon-allow-scatter-gather-hvx", cl::init(false), cl::Hidden, cl::desc("Allow auto-generation of HVX scatter-gather"))

EmitLookupTables
static cl::opt< bool > EmitLookupTables("hexagon-emit-lookup-tables", cl::init(true), cl::Hidden, cl::desc("Control lookup table emission on Hexagon target"))

HexagonMaskedVMem
static cl::opt< bool > HexagonMaskedVMem("hexagon-masked-vmem", cl::init(true), cl::Hidden, cl::desc("Enable masked loads/stores for HVX"))

HexagonAutoHVX
static cl::opt< bool > HexagonAutoHVX("hexagon-autohvx", cl::init(false), cl::Hidden, cl::desc("Enable loop vectorizer for HVX"))

HexagonTargetTransformInfo.h
This file implements a TargetTransformInfo analysis pass specific to the Hexagon target machine.

User.h

InstrTypes.h

Instructions.h

LoopPeel.h

F
#define F(x, y, z)
Definition MD5.cpp:55

I
#define I(x, y, z)
Definition MD5.cpp:58

Ptr
@ Ptr
Definition TargetLibraryInfo.cpp:77

TargetTransformInfo.h
This pass exposes codegen information to IR-level passes.

UnrollLoop.h

ValueTypes.h

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:41

llvm::ArrayRef::size
size_t size() const
size - Get the array size.
Definition ArrayRef.h:143

llvm::BasicTTIImplBase< HexagonTTIImpl >::getInterleavedMemoryOpCost
InstructionCost getInterleavedMemoryOpCost(unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef< unsigned > Indices, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, bool UseMaskForCond=false, bool UseMaskForGaps=false) const override
Definition BasicTTIImpl.h:1615

llvm::BasicTTIImplBase< HexagonTTIImpl >::getArithmeticInstrCost
InstructionCost getArithmeticInstrCost(unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Opd1Info={TTI::OK_AnyValue, TTI::OP_None}, TTI::OperandValueInfo Opd2Info={TTI::OK_AnyValue, TTI::OP_None}, ArrayRef< const Value * > Args={}, const Instruction *CxtI=nullptr) const override
Definition BasicTTIImpl.h:1059

llvm::BasicTTIImplBase< HexagonTTIImpl >::getCmpSelInstrCost
InstructionCost getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy, CmpInst::Predicate VecPred, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Op1Info={TTI::OK_AnyValue, TTI::OP_None}, TTI::OperandValueInfo Op2Info={TTI::OK_AnyValue, TTI::OP_None}, const Instruction *I=nullptr) const override
Definition BasicTTIImpl.h:1397

llvm::BasicTTIImplBase< HexagonTTIImpl >::getCallInstrCost
InstructionCost getCallInstrCost(Function *F, Type *RetTy, ArrayRef< Type * > Tys, TTI::TargetCostKind CostKind) const override
Definition BasicTTIImpl.h:3041

llvm::BasicTTIImplBase< HexagonTTIImpl >::getPeelingPreferences
void getPeelingPreferences(Loop *L, ScalarEvolution &SE, TTI::PeelingPreferences &PP) const override
Definition BasicTTIImpl.h:800

llvm::BasicTTIImplBase< HexagonTTIImpl >::getTypeLegalizationCost
std::pair< InstructionCost, MVT > getTypeLegalizationCost(Type *Ty) const
Definition BasicTTIImpl.h:1023

llvm::BasicTTIImplBase< HexagonTTIImpl >::getIntrinsicInstrCost
InstructionCost getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA, TTI::TargetCostKind CostKind) const override
Definition BasicTTIImpl.h:1760

llvm::BasicTTIImplBase< HexagonTTIImpl >::getGatherScatterOpCost
InstructionCost getGatherScatterOpCost(unsigned Opcode, Type *DataTy, const Value *Ptr, bool VariableMask, Align Alignment, TTI::TargetCostKind CostKind, const Instruction *I=nullptr) const override
Definition BasicTTIImpl.h:1584

llvm::BasicTTIImplBase< HexagonTTIImpl >::DL
const DataLayout & DL

llvm::BasicTTIImplBase< HexagonTTIImpl >::getMemoryOpCost
InstructionCost getMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, TTI::OperandValueInfo OpInfo={TTI::OK_AnyValue, TTI::OP_None}, const Instruction *I=nullptr) const override
Definition BasicTTIImpl.h:1529

llvm::BasicTTIImplBase< HexagonTTIImpl >::getMaskedMemoryOpCost
InstructionCost getMaskedMemoryOpCost(unsigned Opcode, Type *DataTy, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind) const override
Definition BasicTTIImpl.h:1575

llvm::CastInst
This is the base class for all instructions that perform data casts.
Definition InstrTypes.h:448

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:676

llvm::DataLayout
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:63

llvm::ElementCount
Definition TypeSize.h:299

llvm::ElementCount::getFixed
static constexpr ElementCount getFixed(ScalarTy MinVal)
Definition TypeSize.h:310

llvm::Function
Definition Function.h:64

llvm::HexagonSubtarget::useHVXOps
bool useHVXOps() const
Definition HexagonSubtarget.h:256

llvm::HexagonTTIImpl::isLegalMaskedStore
bool isLegalMaskedStore(Type *DataType, Align Alignment, unsigned AddressSpace) const override
Definition HexagonTargetTransformInfo.cpp:347

llvm::HexagonTTIImpl::getMemoryOpCost
InstructionCost getMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, TTI::OperandValueInfo OpInfo={TTI::OK_AnyValue, TTI::OP_None}, const Instruction *I=nullptr) const override
Definition HexagonTargetTransformInfo.cpp:170

llvm::HexagonTTIImpl::forceScalarizeMaskedScatter
bool forceScalarizeMaskedScatter(VectorType *VTy, Align Alignment) const override
Definition HexagonTargetTransformInfo.cpp:411

llvm::HexagonTTIImpl::getMinimumVF
ElementCount getMinimumVF(unsigned ElemWidth, bool IsScalable) const override
Definition HexagonTargetTransformInfo.cpp:140

llvm::HexagonTTIImpl::isLegalMaskedLoad
bool isLegalMaskedLoad(Type *DataType, Align Alignment, unsigned AddressSpace) const override
Definition HexagonTargetTransformInfo.cpp:354

llvm::HexagonTTIImpl::getCastInstrCost
InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src, TTI::CastContextHint CCH, TTI::TargetCostKind CostKind, const Instruction *I=nullptr) const override
Definition HexagonTargetTransformInfo.cpp:297

llvm::HexagonTTIImpl::forceScalarizeMaskedGather
bool forceScalarizeMaskedGather(VectorType *VTy, Align Alignment) const override
Definition HexagonTargetTransformInfo.cpp:406

llvm::HexagonTTIImpl::getInterleavedMemoryOpCost
InstructionCost getInterleavedMemoryOpCost(unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef< unsigned > Indices, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, bool UseMaskForCond=false, bool UseMaskForGaps=false) const override
Definition HexagonTargetTransformInfo.cpp:250

llvm::HexagonTTIImpl::getNumberOfRegisters
unsigned getNumberOfRegisters(unsigned ClassID) const override
— Vector TTI begin —
Definition HexagonTargetTransformInfo.cpp:111

llvm::HexagonTTIImpl::getAddressComputationCost
InstructionCost getAddressComputationCost(Type *PtrTy, ScalarEvolution *SE, const SCEV *S, TTI::TargetCostKind CostKind) const override
Definition HexagonTargetTransformInfo.cpp:164

llvm::HexagonTTIImpl::getArithmeticInstrCost
InstructionCost getArithmeticInstrCost(unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Op1Info={TTI::OK_AnyValue, TTI::OP_None}, TTI::OperandValueInfo Op2Info={TTI::OK_AnyValue, TTI::OP_None}, ArrayRef< const Value * > Args={}, const Instruction *CxtI=nullptr) const override
Definition HexagonTargetTransformInfo.cpp:277

llvm::HexagonTTIImpl::getPopcntSupport
TTI::PopcntSupportKind getPopcntSupport(unsigned IntTyWidthInBit) const override
Definition HexagonTargetTransformInfo.cpp:78

llvm::HexagonTTIImpl::getMinVectorRegisterBitWidth
unsigned getMinVectorRegisterBitWidth() const override
Definition HexagonTargetTransformInfo.cpp:136

llvm::HexagonTTIImpl::isLegalMaskedGather
bool isLegalMaskedGather(Type *Ty, Align Alignment) const override
Definition HexagonTargetTransformInfo.cpp:361

llvm::HexagonTTIImpl::getRegisterBitWidth
TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const override
Definition HexagonTargetTransformInfo.cpp:123

llvm::HexagonTTIImpl::getGatherScatterOpCost
InstructionCost getGatherScatterOpCost(unsigned Opcode, Type *DataTy, const Value *Ptr, bool VariableMask, Align Alignment, TTI::TargetCostKind CostKind, const Instruction *I) const override
Definition HexagonTargetTransformInfo.cpp:243

llvm::HexagonTTIImpl::getCallInstrCost
InstructionCost getCallInstrCost(Function *F, Type *RetTy, ArrayRef< Type * > Tys, TTI::TargetCostKind CostKind) const override
Compute a cost of the given call instruction.
Definition HexagonTargetTransformInfo.cpp:147

llvm::HexagonTTIImpl::getPeelingPreferences
void getPeelingPreferences(Loop *L, ScalarEvolution &SE, TTI::PeelingPreferences &PP) const override
Definition HexagonTargetTransformInfo.cpp:91

llvm::HexagonTTIImpl::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, const Value *Op0, const Value *Op1) const override
Definition HexagonTargetTransformInfo.cpp:324

llvm::HexagonTTIImpl::getIntrinsicInstrCost
InstructionCost getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA, TTI::TargetCostKind CostKind) const override
Get intrinsic cost based on arguments.
Definition HexagonTargetTransformInfo.cpp:153

llvm::HexagonTTIImpl::getShuffleCost
InstructionCost getShuffleCost(TTI::ShuffleKind Kind, VectorType *DstTy, VectorType *SrcTy, ArrayRef< int > Mask, TTI::TargetCostKind CostKind, int Index, VectorType *SubTp, ArrayRef< const Value * > Args={}, const Instruction *CxtI=nullptr) const override
Definition HexagonTargetTransformInfo.cpp:235

llvm::HexagonTTIImpl::getPreferredAddressingMode
TTI::AddressingModeKind getPreferredAddressingMode(const Loop *L, ScalarEvolution *SE) const override
Bias LSR towards creating post-increment opportunities.
Definition HexagonTargetTransformInfo.cpp:104

llvm::HexagonTTIImpl::shouldBuildLookupTables
bool shouldBuildLookupTables() const override
Definition HexagonTargetTransformInfo.cpp:454

llvm::HexagonTTIImpl::getMaskedMemoryOpCost
InstructionCost getMaskedMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind) const override
Definition HexagonTargetTransformInfo.cpp:227

llvm::HexagonTTIImpl::getMaxInterleaveFactor
unsigned getMaxInterleaveFactor(ElementCount VF) const override
Definition HexagonTargetTransformInfo.cpp:118

llvm::HexagonTTIImpl::isLegalMaskedScatter
bool isLegalMaskedScatter(Type *Ty, Align Alignment) const override
Definition HexagonTargetTransformInfo.cpp:384

llvm::HexagonTTIImpl::getCmpSelInstrCost
InstructionCost getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy, CmpInst::Predicate VecPred, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Op1Info={TTI::OK_AnyValue, TTI::OP_None}, TTI::OperandValueInfo Op2Info={TTI::OK_AnyValue, TTI::OP_None}, const Instruction *I=nullptr) const override
Definition HexagonTargetTransformInfo.cpp:262

llvm::HexagonTTIImpl::getInstructionCost
InstructionCost getInstructionCost(const User *U, ArrayRef< const Value * > Operands, TTI::TargetCostKind CostKind) const override
Definition HexagonTargetTransformInfo.cpp:427

llvm::HexagonTTIImpl::getUnrollingPreferences
void getUnrollingPreferences(Loop *L, ScalarEvolution &SE, TTI::UnrollingPreferences &UP, OptimizationRemarkEmitter *ORE) const override
Definition HexagonTargetTransformInfo.cpp:85

llvm::HexagonTTIImpl::getCacheLineSize
unsigned getCacheLineSize() const override
Definition HexagonTargetTransformInfo.cpp:422

llvm::HexagonTTIImpl::getPrefetchDistance
unsigned getPrefetchDistance() const override
— Vector TTI end —
Definition HexagonTargetTransformInfo.cpp:418

llvm::InstructionCost
Definition InstructionCost.h:30

llvm::InstructionCost::getMax
static InstructionCost getMax()
Definition InstructionCost.h:72

llvm::Instruction
Definition Instruction.h:69

llvm::IntrinsicCostAttributes
Definition TargetTransformInfo.h:126

llvm::IntrinsicCostAttributes::getReturnType
Type * getReturnType() const
Definition TargetTransformInfo.h:161

llvm::IntrinsicCostAttributes::getID
Intrinsic::ID getID() const
Definition TargetTransformInfo.h:159

llvm::LoadInst
An instruction for reading from memory.
Definition Instructions.h:181

llvm::Loop
Represents a single loop in the control flow graph.
Definition LoopInfo.h:40

llvm::OptimizationRemarkEmitter
The optimization diagnostic interface.
Definition OptimizationRemarkEmitter.h:33

llvm::SCEV
This class represents an analyzed expression in the program.
Definition ScalarEvolution.h:72

llvm::ScalarEvolution
The main scalar evolution driver.
Definition ScalarEvolution.h:448

llvm::ScalarEvolution::getSmallConstantMaxTripCount
LLVM_ABI unsigned getSmallConstantMaxTripCount(const Loop *L, SmallVectorImpl< const SCEVPredicate * > *Predicates=nullptr)
Returns the upper bound of the loop trip count as a normal unsigned value.
Definition ScalarEvolution.cpp:8298

llvm::ScalarEvolution::getSmallConstantTripCount
LLVM_ABI unsigned getSmallConstantTripCount(const Loop *L)
Returns the exact trip count of the loop if we can compute it, and the result is a small constant.
Definition ScalarEvolution.cpp:8282

llvm::TargetTransformInfoImplBase::getDataLayout
virtual const DataLayout & getDataLayout() const
Definition TargetTransformInfoImpl.h:50

llvm::TargetTransformInfoImplBase::getInstructionCost
virtual InstructionCost getInstructionCost(const User *U, ArrayRef< const Value * > Operands, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:85

llvm::TargetTransformInfo::TargetCostKind
TargetCostKind
The kind of cost model.
Definition TargetTransformInfo.h:278

llvm::TargetTransformInfo::TCK_RecipThroughput
@ TCK_RecipThroughput
Reciprocal throughput.
Definition TargetTransformInfo.h:279

llvm::TargetTransformInfo::RegisterKind
RegisterKind
Definition TargetTransformInfo.h:1218

llvm::TargetTransformInfo::RGK_FixedWidthVector
@ RGK_FixedWidthVector
Definition TargetTransformInfo.h:1218

llvm::TargetTransformInfo::RGK_ScalableVector
@ RGK_ScalableVector
Definition TargetTransformInfo.h:1218

llvm::TargetTransformInfo::RGK_Scalar
@ RGK_Scalar
Definition TargetTransformInfo.h:1218

llvm::TargetTransformInfo::PopcntSupportKind
PopcntSupportKind
Flags indicating the kind of support for population count.
Definition TargetTransformInfo.h:744

llvm::TargetTransformInfo::PSK_FastHardware
@ PSK_FastHardware
Definition TargetTransformInfo.h:744

llvm::TargetTransformInfo::TCC_Free
@ TCC_Free
Expected to fold away in lowering.
Definition TargetTransformInfo.h:304

llvm::TargetTransformInfo::AddressingModeKind
AddressingModeKind
Which addressing mode Loop Strength Reduction will try to generate.
Definition TargetTransformInfo.h:807

llvm::TargetTransformInfo::AMK_PostIndexed
@ AMK_PostIndexed
Prefer post-indexed addressing mode.
Definition TargetTransformInfo.h:810

llvm::TargetTransformInfo::ShuffleKind
ShuffleKind
The various kinds of shuffle patterns for vector queries.
Definition TargetTransformInfo.h:1135

llvm::TargetTransformInfo::CastContextHint
CastContextHint
Represents a hint about the context in which a cast is used.
Definition TargetTransformInfo.h:1440

llvm::TypeSize
Definition TypeSize.h:333

llvm::TypeSize::getFixed
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition TypeSize.h:344

llvm::TypeSize::getScalable
static constexpr TypeSize getScalable(ScalarTy MinimumSize)
Definition TypeSize.h:347

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45

llvm::Type::isVectorTy
bool isVectorTy() const
True if this is an instance of VectorType.
Definition Type.h:273

llvm::Type::getPrimitiveSizeInBits
LLVM_ABI TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
Definition Type.cpp:198

llvm::Type::isFloatingPointTy
bool isFloatingPointTy() const
Return true if this is one of the floating-point types.
Definition Type.h:184

llvm::Type::isIntegerTy
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition Type.h:240

llvm::Type::isFPOrFPVectorTy
bool isFPOrFPVectorTy() const
Return true if this is a FP type or a vector of FP.
Definition Type.h:225

llvm::User
Definition User.h:44

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::Value::hasOneUse
bool hasOneUse() const
Return true if there is exactly one use of this value.
Definition Value.h:439

llvm::VectorType
Base class of all SIMD vector types.
Definition DerivedTypes.h:430

llvm::VectorType::getElementType
Type * getElementType() const
Definition DerivedTypes.h:463

llvm::cl::opt
Definition CommandLine.h:1455

llvm::details::FixedOrScalableQuantity::getFixedValue
constexpr ScalarTy getFixedValue() const
Definition TypeSize.h:201

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition ErrorHandling.h:164

llvm::NVPTXAS::AddressSpace
AddressSpace
Definition NVPTXAddrSpace.h:21

llvm::cl::Hidden
@ Hidden
Definition CommandLine.h:139

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition CommandLine.h:445

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition AddressRanges.h:18

llvm::Cost
InstructionCost Cost
Definition FunctionSpecialization.h:103

llvm::dyn_cast
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643

llvm::canPeel
bool canPeel(const Loop *L)
Definition LoopPeel.cpp:91

llvm::alignTo
uint64_t alignTo(uint64_t Size, Align A)
Returns a multiple of A needed to store Size bytes.
Definition Alignment.h:144

llvm::cast
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559

llvm::Log2
unsigned Log2(Align A)
Returns the log2 of the alignment.
Definition Alignment.h:197

llvm::VFParamKind::Vector
@ Vector
Definition VFABIDemangler.h:27

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39

llvm::Align::value
constexpr uint64_t value() const
This is a hole in the type system and should not be abused.
Definition Alignment.h:77

llvm::TargetTransformInfo::OperandValueInfo
Definition TargetTransformInfo.h:1172

llvm::TargetTransformInfo::PeelingPreferences
Definition TargetTransformInfo.h:684

llvm::TargetTransformInfo::PeelingPreferences::PeelCount
unsigned PeelCount
A forced peeling factor (the number of bodies of the original loop that should be peeled off before t...
Definition TargetTransformInfo.h:688

llvm::TargetTransformInfo::UnrollingPreferences
Parameters that control the generic loop unrolling transformation.
Definition TargetTransformInfo.h:554

llvm::TargetTransformInfo::UnrollingPreferences::Runtime
bool Runtime
Allow runtime unrolling (unrolling of loops to expand the size of the loop body even when the number ...
Definition TargetTransformInfo.h:615

llvm::TargetTransformInfo::UnrollingPreferences::Partial
bool Partial
Allow partial unrolling (unrolling of loops to expand the size of the loop body, not only to eliminat...
Definition TargetTransformInfo.h:611

llvm::cl::desc
Definition CommandLine.h:411