CbC/CbC_llvm: lib/Target/X86/X86TargetTransformInfo.h comparison

comparison lib/Target/X86/X86TargetTransformInfo.h @ 148:63bd29f05246

merged

author	Shinji KONO <kono@ie.u-ryukyu.ac.jp>
date	Wed, 14 Aug 2019 19:46:37 +0900
parents	c2174574ed3a
children

comparison

equal deleted inserted replaced

-:3fc4d5c3e21e
+:63bd29f05246
 //===-- X86TargetTransformInfo.h - X86 specific TTI -------------*- C++ -*-===//
 //
-//                     The LLVM Compiler Infrastructure
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
-//
+// See https://llvm.org/LICENSE.txt for license information.
-// This file is distributed under the University of Illinois Open Source
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
-// License. See LICENSE.TXT for details.
 //
 //===----------------------------------------------------------------------===//
 /// \file
 /// This file defines a TargetTransformInfo::Concept conforming object specific to the
 /// X86 target machine. It uses the target's detailed information to
 const X86Subtarget *ST;
 const X86TargetLowering *TLI;
 const X86Subtarget *getST() const { return ST; }
 const X86TargetLowering *getTLI() const { return TLI; }
+const FeatureBitset InlineFeatureIgnoreList = {
+// This indicates that the CPU is 64-bit capable, not that we are in 64-bit
+// mode.
+X86::Feature64Bit,
+// These features don't have any intrinsics or ABI effect.
+X86::FeatureNOPL,
+X86::FeatureCMPXCHG16B,
+X86::FeatureLAHFSAHF,
+// Codegen control options.
+X86::FeatureFast11ByteNOP,
+X86::FeatureFast15ByteNOP,
+X86::FeatureFastBEXTR,
+X86::FeatureFastHorizontalOps,
+X86::FeatureFastLZCNT,
+X86::FeatureFastPartialYMMorZMMWrite,
+X86::FeatureFastScalarFSQRT,
+X86::FeatureFastSHLDRotate,
+X86::FeatureFastScalarShiftMasks,
+X86::FeatureFastVectorShiftMasks,
+X86::FeatureFastVariableShuffle,
+X86::FeatureFastVectorFSQRT,
+X86::FeatureLEAForSP,
+X86::FeatureLEAUsesAG,
+X86::FeatureLZCNTFalseDeps,
+X86::FeatureBranchFusion,
+X86::FeatureMacroFusion,
+X86::FeatureMergeToThreeWayBranch,
+X86::FeaturePadShortFunctions,
+X86::FeaturePOPCNTFalseDeps,
+X86::FeatureSSEUnalignedMem,
+X86::FeatureSlow3OpsLEA,
+X86::FeatureSlowDivide32,
+X86::FeatureSlowDivide64,
+X86::FeatureSlowIncDec,
+X86::FeatureSlowLEA,
+X86::FeatureSlowPMADDWD,
+X86::FeatureSlowPMULLD,
+X86::FeatureSlowSHLD,
+X86::FeatureSlowTwoMemOps,
+X86::FeatureSlowUAMem16,
+// Perf-tuning flags.
+X86::FeatureHasFastGather,
+X86::FeatureSlowUAMem32,
+// Based on whether the user set the -mprefer-vector-width command-line option.
+X86::FeaturePrefer256Bit,
+// CPU name enums. These just follow the CPU string.
+X86::ProcIntelAtom,
+X86::ProcIntelGLM,
+X86::ProcIntelGLP,
+X86::ProcIntelSLM,
+X86::ProcIntelTRM,
+};
 public:
 explicit X86TTIImpl(const X86TargetMachine *TM, const Function &F)
 : BaseT(TM, F.getParent()->getDataLayout()), ST(TM->getSubtargetImpl(F)),
 TLI(ST->getTargetLowering()) {}
 int getMinMaxReductionCost(Type *Ty, Type *CondTy, bool IsPairwiseForm,
 bool IsUnsigned);
 int getInterleavedMemoryOpCost(unsigned Opcode, Type *VecTy,
 unsigned Factor, ArrayRef<unsigned> Indices,
-unsigned Alignment, unsigned AddressSpace);
+unsigned Alignment, unsigned AddressSpace,
+bool UseMaskForCond = false,
+bool UseMaskForGaps = false);
 int getInterleavedMemoryOpCostAVX512(unsigned Opcode, Type *VecTy,
 unsigned Factor, ArrayRef<unsigned> Indices,
-unsigned Alignment, unsigned AddressSpace);
+unsigned Alignment, unsigned AddressSpace,
+bool UseMaskForCond = false,
+bool UseMaskForGaps = false);
 int getInterleavedMemoryOpCostAVX2(unsigned Opcode, Type *VecTy,
 unsigned Factor, ArrayRef<unsigned> Indices,
-unsigned Alignment, unsigned AddressSpace);
+unsigned Alignment, unsigned AddressSpace,
+bool UseMaskForCond = false,
+bool UseMaskForGaps = false);
 int getIntImmCost(int64_t);
 int getIntImmCost(const APInt &Imm, Type *Ty);
 bool isLSRCostLess(TargetTransformInfo::LSRCost &C1,
 TargetTransformInfo::LSRCost &C2);
 bool canMacroFuseCmp();
 bool isLegalMaskedLoad(Type *DataType);
 bool isLegalMaskedStore(Type *DataType);
+bool isLegalNTLoad(Type *DataType, unsigned Alignment);
+bool isLegalNTStore(Type *DataType, unsigned Alignment);
 bool isLegalMaskedGather(Type *DataType);
 bool isLegalMaskedScatter(Type *DataType);
+bool isLegalMaskedExpandLoad(Type *DataType);
+bool isLegalMaskedCompressStore(Type *DataType);
 bool hasDivRemOp(Type *DataType, bool IsSigned);
 bool isFCmpOrdCheaperThanFCmpZero(Type *Ty);
 bool areInlineCompatible(const Function *Caller,
 const Function *Callee) const;
-const TTI::MemCmpExpansionOptions *enableMemCmpExpansion(
+bool areFunctionArgsABICompatible(const Function *Caller,
-bool IsZeroCmp) const;
+const Function *Callee,
+SmallPtrSetImpl<Argument *> &Args) const;
+TTI::MemCmpExpansionOptions enableMemCmpExpansion(bool OptSize,
+bool IsZeroCmp) const;
 bool enableInterleavedAccessVectorization();
 private:
 int getGSScalarCost(unsigned Opcode, Type *DataTy, bool VariableMask,
 unsigned Alignment, unsigned AddressSpace);
 int getGSVectorCost(unsigned Opcode, Type *DataTy, Value *Ptr,

Mercurial > hg > CbC > CbC_llvm

comparison lib/Target/X86/X86TargetTransformInfo.h @ 148:63bd29f05246