#ifndef LLVM_LIB_TARGET_ARM_ARMTARGETTRANSFORMINFO_H
#define LLVM_LIB_TARGET_ARM_ARMTARGETTRANSFORMINFO_H
      ARM::FeatureVFP2, ARM::FeatureVFP3, ARM::FeatureNEON, ARM::FeatureThumb2,
      ARM::FeatureFP16, ARM::FeatureVFP4, ARM::FeatureFPARMv8,
      ARM::FeatureFullFP16, ARM::FeatureFP16FML, ARM::FeatureHWDivThumb,
      ARM::FeatureHWDivARM, ARM::FeatureDB, ARM::FeatureV7Clrex,
      ARM::FeatureAcquireRelease, ARM::FeatureSlowFPBrcc,
      ARM::FeaturePerfMon, ARM::FeatureTrustZone, ARM::Feature8MSecExt,
      ARM::FeatureCrypto, ARM::FeatureCRC, ARM::FeatureRAS,
      ARM::FeatureFPAO, ARM::FeatureFuseAES, ARM::FeatureZCZeroing,
      ARM::FeatureProfUnpredicate, ARM::FeatureSlowVGETLNi32,
      ARM::FeatureSlowVDUP32, ARM::FeaturePreferVMOVSR,
      ARM::FeaturePrefISHSTBarrier, ARM::FeatureMuxedUnits,
      ARM::FeatureSlowOddRegister, ARM::FeatureSlowLoadDSubreg,
      ARM::FeatureDontWidenVMOVS, ARM::FeatureExpandMLx,
      ARM::FeatureHasVMLxHazards, ARM::FeatureNEONForFPMovs,
      ARM::FeatureNEONForFP, ARM::FeatureCheckVLDnAlign,
      ARM::FeatureHasSlowFPVMLx, ARM::FeatureHasSlowFPVFMx,
      ARM::FeatureVMLxForwarding, ARM::FeaturePref32BitThumb,
      ARM::FeatureAvoidPartialCPSR, ARM::FeatureCheapPredicableCPSR,
      ARM::FeatureAvoidMOVsShOp, ARM::FeatureHasRetAddrStack,
      ARM::FeatureHasNoBranchPredictor, ARM::FeatureDSP, ARM::FeatureMP,
      ARM::FeatureVirtualization, ARM::FeatureMClass, ARM::FeatureRClass,
      ARM::FeatureAClass, ARM::FeatureStrictAlign, ARM::FeatureLongCalls,
      ARM::FeatureExecuteOnly, ARM::FeatureReserveR9, ARM::FeatureNoMovt,
      ARM::FeatureNoNegativeImmediates
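  // Presumably the per-feature inlining allowlist consulted by
  // areInlineCompatible() below: a callee that only differs from its caller in
  // features named here can still be considered for inlining.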
  explicit ARMTTIImpl(const ARMBaseTargetMachine *TM, const Function &F)
      : BaseT(TM, F.getDataLayout()), ST(TM->getSubtargetImpl(F)),
        TLI(ST->getTargetLowering()) {}
  bool areInlineCompatible(const Function *Caller,
                           const Function *Callee) const override;
  /// Floating-point computation using ARMv8 AArch32 Advanced SIMD
  /// instructions remains unchanged from ARMv7.
  bool isFPVectorizationPotentiallyUnsafe() const override {
    return !ST->isTargetDarwin() && !ST->hasMVEFloatOps();
  }
  std::optional<Instruction *>
  instCombineIntrinsic(InstCombiner &IC, IntrinsicInst &II) const override;
  std::optional<Value *> simplifyDemandedVectorEltsIntrinsic(
      InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts,
      APInt &UndefElts2, APInt &UndefElts3,
      std::function<void(Instruction *, unsigned, APInt, APInt &)>
          SimplifyAndSetOp) const override;
  InstructionCost getIntImmCodeSizeCost(unsigned Opcode, unsigned Idx,
                                        const APInt &Imm,
                                        Type *Ty) const override;
    bool Vector = (ClassID == 1);
      if (ST->hasMVEIntegerOps())
    if (ST->isThumb1Only())
      if (ST->hasMVEIntegerOps())
  unsigned getMaxInterleaveFactor(ElementCount VF) const override {
    return ST->getMaxInterleaveFactor();
  }
  bool forceScalarizeMaskedGather(VectorType *VTy,
                                  Align Alignment) const override {
    return true;
  }
  bool forceScalarizeMaskedScatter(VectorType *VTy,
                                   Align Alignment) const override {
    return forceScalarizeMaskedGather(VTy, Alignment);
  }
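  // For MVE, a dedicated gather/scatter lowering pass is expected to have
  // already legalised any gathers it can turn into MVE intrinsics before the
  // generic masked-intrinsic lowering runs, so the remaining ones are
  // presumably best scalarized (hence the unconditional "force" above).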
  uint64_t getMaxMemIntrinsicInlineSizeThreshold() const override {
    return ST->getMaxInlineSizeThreshold();
  }
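  // The threshold above presumably caps the memcpy/memset size (in bytes) that
  // will be expanded inline; anything larger is left as a library call. The
  // value itself is delegated to the subtarget.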
  InstructionCost getShuffleCost(TTI::ShuffleKind Kind, VectorType *DstTy,
                                 VectorType *SrcTy, ArrayRef<int> Mask,
                                 TTI::TargetCostKind CostKind, int Index,
                                 VectorType *SubTp,
                                 ArrayRef<const Value *> Args = {},
                                 const Instruction *CxtI = nullptr) const override;
  InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val,
                                     TTI::TargetCostKind CostKind,
                                     unsigned Index, const Value *Op0,
                                     const Value *Op1) const override;
  InstructionCost getInterleavedMemoryOpCost(
      unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef<unsigned> Indices,
      Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind,
      bool UseMaskForCond = false, bool UseMaskForGaps = false) const override;
  InstructionCost getGatherScatterOpCost(unsigned Opcode, Type *DataTy,
                                         const Value *Ptr, bool VariableMask,
                                         Align Alignment,
                                         TTI::TargetCostKind CostKind,
                                         const Instruction *I = nullptr) const override;
  InstructionCost
  getArithmeticReductionCost(unsigned Opcode, VectorType *ValTy,
                             std::optional<FastMathFlags> FMF,
                             TTI::TargetCostKind CostKind) const override;
  InstructionCost getExtendedReductionCost(
      unsigned Opcode, bool IsUnsigned, Type *ResTy, VectorType *ValTy,
      std::optional<FastMathFlags> FMF, TTI::TargetCostKind CostKind) const override;
  /// getScalingFactorCost - Return the cost of the scaling used in
  /// addressing mode represented by AM.
  InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV,
                                       StackOffset BaseOffset, bool HasBaseReg,
                                       int64_t Scale,
                                       unsigned AddrSpace) const override;
  bool isHardwareLoopProfitable(Loop *L, ScalarEvolution &SE,
                                AssumptionCache &AC, TargetLibraryInfo *LibInfo,
                                HardwareLoopInfo &HWLoopInfo) const override;
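  // "Hardware loops" on this target are the Armv8.1-M low-overhead loops
  // (DLS/LE, or DLSTP/LETP when tail-predicated with MVE); the hook above
  // decides whether converting a given loop into that form is likely to pay
  // off.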
  void getUnrollingPreferences(Loop *L, ScalarEvolution &SE,
                               TTI::UnrollingPreferences &UP,
                               OptimizationRemarkEmitter *ORE) const override;
  bool shouldBuildLookupTablesForConstant(Constant *C) const override {
    if (ST->isROPI() || ST->isRWPI())
      return !C->needsDynamicRelocation();
    return true;
  }
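  // Under the ROPI/RWPI relocation models, constant data cannot hold pointers
  // to globals or functions, so the check above presumably exists to block
  // switch-to-lookup-table conversion whenever one of the constants would need
  // a dynamic relocation.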
364 "Only possible block sizes for VREV are: 16, 32, 64");
367 if (EltSz != 8 && EltSz != 16 && EltSz != 32)
370 unsigned BlockElts = M[0] + 1;
378 for (
unsigned i = 0, e = M.size(); i < e; ++i) {
381 if ((
unsigned)M[i] != (i - i % BlockElts) + (BlockElts - 1 - i % BlockElts))
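// Illustration (hypothetical values, not part of the original header): for an
// 8 x i8 shuffle, the mask <7,6,5,4,3,2,1,0> reverses one whole 64-bit block,
// while <3,2,1,0,7,6,5,4> reverses each 32-bit block, so under the definition
// above one would expect:
//
//   SmallVector<int, 8> Rev64 = {7, 6, 5, 4, 3, 2, 1, 0}; // VREV64.8 pattern
//   SmallVector<int, 8> Rev32 = {3, 2, 1, 0, 7, 6, 5, 4}; // VREV32.8 pattern
//   isVREVMask(Rev64, MVT::v8i8, 64); // true:  BlockElts = 8, 8 * 8 == 64
//   isVREVMask(Rev32, MVT::v8i8, 32); // true:  BlockElts = 4, 4 * 8 == 32
//   isVREVMask(Rev64, MVT::v8i8, 32); // false: BlockElts * EltSz != BlockSize

#endif // LLVM_LIB_TARGET_ARM_ARMTARGETTRANSFORMINFO_H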