//===- llvm/Analysis/TargetTransformInfo.cpp ------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

#include "llvm/Analysis/TargetTransformInfo.h"
#include "llvm/Analysis/CFG.h"
#include "llvm/Analysis/LoopIterator.h"
#include "llvm/Analysis/TargetTransformInfoImpl.h"
#include "llvm/IR/CFG.h"
#include "llvm/IR/DataLayout.h"
#include "llvm/IR/Instruction.h"
#include "llvm/IR/Instructions.h"
#include "llvm/IR/IntrinsicInst.h"
#include "llvm/IR/Module.h"
#include "llvm/IR/Operator.h"
#include "llvm/IR/PatternMatch.h"
#include "llvm/InitializePasses.h"
#include "llvm/Support/CommandLine.h"
#include "llvm/Support/ErrorHandling.h"
#include <utility>

using namespace llvm;
using namespace PatternMatch;

#define DEBUG_TYPE "tti"

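// Hidden, off-by-default flag: the reduction matchers further down in this
// file only run when it is set (e.g. by passing -costmodel-reduxcost on the
// opt command line).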
static cl::opt<bool> EnableReduxCost("costmodel-reduxcost", cl::init(false),
                                     cl::Hidden,
                                     cl::desc("Recognize reduction patterns."));

namespace {
/// No-op implementation of the TTI interface using the utility base
/// classes.
///
/// This is used when no target specific information is available.
struct NoTTIImpl : TargetTransformInfoImplCRTPBase<NoTTIImpl> {
  explicit NoTTIImpl(const DataLayout &DL)
      : TargetTransformInfoImplCRTPBase<NoTTIImpl>(DL) {}
};
} // namespace

bool HardwareLoopInfo::canAnalyze(LoopInfo &LI) {
  // If the loop has irreducible control flow, it cannot be converted to a
  // hardware loop.
  LoopBlocksRPO RPOT(L);
  RPOT.perform(&LI);
  if (containsIrreducibleCFG<const BasicBlock *>(RPOT, LI))
    return false;
  return true;
}

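// The IntrinsicCostAttributes constructors below capture everything the cost
// model needs to know about an intrinsic call -- return and parameter types,
// arguments, fast-math flags, and optionally a vectorization factor and
// scalarization cost -- so cost queries can be made with or without an
// actual call instruction in hand.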
IntrinsicCostAttributes::IntrinsicCostAttributes(const IntrinsicInst &I) :
    II(&I), RetTy(I.getType()), IID(I.getIntrinsicID()) {

  FunctionType *FTy = I.getCalledFunction()->getFunctionType();
  ParamTys.insert(ParamTys.begin(), FTy->param_begin(), FTy->param_end());
  Arguments.insert(Arguments.begin(), I.arg_begin(), I.arg_end());
  if (auto *FPMO = dyn_cast<FPMathOperator>(&I))
    FMF = FPMO->getFastMathFlags();
}

IntrinsicCostAttributes::IntrinsicCostAttributes(Intrinsic::ID Id, CallInst &CI,
                                                 unsigned Factor) :
    RetTy(CI.getType()), IID(Id), VF(Factor) {

  if (auto *FPMO = dyn_cast<FPMathOperator>(&CI))
    FMF = FPMO->getFastMathFlags();

  Arguments.insert(Arguments.begin(), CI.arg_begin(), CI.arg_end());
  FunctionType *FTy =
      CI.getCalledFunction()->getFunctionType();
  ParamTys.insert(ParamTys.begin(), FTy->param_begin(), FTy->param_end());
}

IntrinsicCostAttributes::IntrinsicCostAttributes(Intrinsic::ID Id, CallInst &CI,
                                                 unsigned Factor,
                                                 unsigned ScalarCost) :
    RetTy(CI.getType()), IID(Id), VF(Factor), ScalarizationCost(ScalarCost) {

  if (auto *FPMO = dyn_cast<FPMathOperator>(&CI))
    FMF = FPMO->getFastMathFlags();

  Arguments.insert(Arguments.begin(), CI.arg_begin(), CI.arg_end());
  FunctionType *FTy =
      CI.getCalledFunction()->getFunctionType();
  ParamTys.insert(ParamTys.begin(), FTy->param_begin(), FTy->param_end());
}

IntrinsicCostAttributes::IntrinsicCostAttributes(Intrinsic::ID Id, Type *RTy,
                                                 ArrayRef<Type *> Tys,
                                                 FastMathFlags Flags) :
    RetTy(RTy), IID(Id), FMF(Flags) {
  ParamTys.insert(ParamTys.begin(), Tys.begin(), Tys.end());
}

IntrinsicCostAttributes::IntrinsicCostAttributes(Intrinsic::ID Id, Type *RTy,
                                                 ArrayRef<Type *> Tys,
                                                 FastMathFlags Flags,
                                                 unsigned ScalarCost) :
    RetTy(RTy), IID(Id), FMF(Flags), ScalarizationCost(ScalarCost) {
  ParamTys.insert(ParamTys.begin(), Tys.begin(), Tys.end());
}

IntrinsicCostAttributes::IntrinsicCostAttributes(Intrinsic::ID Id, Type *RTy,
                                                 ArrayRef<Type *> Tys,
                                                 FastMathFlags Flags,
                                                 unsigned ScalarCost,
                                                 const IntrinsicInst *I) :
    II(I), RetTy(RTy), IID(Id), FMF(Flags), ScalarizationCost(ScalarCost) {
  ParamTys.insert(ParamTys.begin(), Tys.begin(), Tys.end());
}

IntrinsicCostAttributes::IntrinsicCostAttributes(Intrinsic::ID Id, Type *RTy,
                                                 ArrayRef<Type *> Tys) :
    RetTy(RTy), IID(Id) {
  ParamTys.insert(ParamTys.begin(), Tys.begin(), Tys.end());
}

IntrinsicCostAttributes::IntrinsicCostAttributes(Intrinsic::ID Id, Type *Ty,
                                                 ArrayRef<Value *> Args) :
    RetTy(Ty), IID(Id) {

  Arguments.insert(Arguments.begin(), Args.begin(), Args.end());
  ParamTys.reserve(Arguments.size());
  for (unsigned Idx = 0, Size = Arguments.size(); Idx != Size; ++Idx)
    ParamTys.push_back(Arguments[Idx]->getType());
}

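// A hardware-loop candidate needs an exiting block whose exit count is
// loop-invariant, known non-zero, and narrow enough to fit in CountType,
// that runs on every loop iteration, and that ends in a conditional branch;
// the loop below records the first such block it finds.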
bool HardwareLoopInfo::isHardwareLoopCandidate(ScalarEvolution &SE,
                                               LoopInfo &LI, DominatorTree &DT,
                                               bool ForceNestedLoop,
                                               bool ForceHardwareLoopPHI) {
  SmallVector<BasicBlock *, 4> ExitingBlocks;
  L->getExitingBlocks(ExitingBlocks);

  for (BasicBlock *BB : ExitingBlocks) {
    // If we pass the updated counter back through a phi, we need to know
    // which latch the updated value will be coming from.
    if (!L->isLoopLatch(BB)) {
      if (ForceHardwareLoopPHI || CounterInReg)
        continue;
    }

    const SCEV *EC = SE.getExitCount(L, BB);
    if (isa<SCEVCouldNotCompute>(EC))
      continue;
    if (const SCEVConstant *ConstEC = dyn_cast<SCEVConstant>(EC)) {
      if (ConstEC->getValue()->isZero())
        continue;
    } else if (!SE.isLoopInvariant(EC, L))
      continue;

    if (SE.getTypeSizeInBits(EC->getType()) > CountType->getBitWidth())
      continue;

    // If this exiting block is contained in a nested loop, it is not eligible
    // for insertion of the branch-and-decrement since the inner loop would
    // end up messing up the value in the CTR.
    if (!IsNestingLegal && LI.getLoopFor(BB) != L && !ForceNestedLoop)
      continue;

    // We now have a loop-invariant count of loop iterations (which is not the
    // constant zero) for which we know that this loop will not exit via this
    // exiting block.

    // We need to make sure that this block will run on every loop iteration.
    // For this to be true, we must dominate all blocks with backedges. Such
    // blocks are in-loop predecessors to the header block.
    bool NotAlways = false;
    for (BasicBlock *Pred : predecessors(L->getHeader())) {
      if (!L->contains(Pred))
        continue;

      if (!DT.dominates(BB, Pred)) {
        NotAlways = true;
        break;
      }
    }

    if (NotAlways)
      continue;

    // Make sure this block ends with a conditional branch.
    Instruction *TI = BB->getTerminator();
    if (!TI)
      continue;

    if (BranchInst *BI = dyn_cast<BranchInst>(TI)) {
      if (!BI->isConditional())
        continue;

      ExitBranch = BI;
    } else
      continue;

    // Note that this block may not be the loop latch block, even if the loop
    // has a latch block.
    ExitBlock = BB;
    ExitCount = EC;
    break;
  }

  if (!ExitBlock)
    return false;
  return true;
}

TargetTransformInfo::TargetTransformInfo(const DataLayout &DL)
    : TTIImpl(new Model<NoTTIImpl>(NoTTIImpl(DL))) {}

TargetTransformInfo::~TargetTransformInfo() {}

TargetTransformInfo::TargetTransformInfo(TargetTransformInfo &&Arg)
    : TTIImpl(std::move(Arg.TTIImpl)) {}

TargetTransformInfo &TargetTransformInfo::operator=(TargetTransformInfo &&RHS) {
  TTIImpl = std::move(RHS.TTIImpl);
  return *this;
}

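// The member functions below mostly just forward to the TTIImpl model. Cost
// queries additionally assert a non-negative result: in this model a cost of
// 0 (TCC_Free) already means "free", so negative costs have no meaning.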
unsigned TargetTransformInfo::getInliningThresholdMultiplier() const {
  return TTIImpl->getInliningThresholdMultiplier();
}

int TargetTransformInfo::getInlinerVectorBonusPercent() const {
  return TTIImpl->getInlinerVectorBonusPercent();
}

int TargetTransformInfo::getGEPCost(Type *PointeeType, const Value *Ptr,
                                    ArrayRef<const Value *> Operands,
                                    TTI::TargetCostKind CostKind) const {
  return TTIImpl->getGEPCost(PointeeType, Ptr, Operands, CostKind);
}

int TargetTransformInfo::getIntrinsicCost(Intrinsic::ID IID, Type *RetTy,
                                          ArrayRef<const Value *> Arguments,
                                          const User *U,
                                          TTI::TargetCostKind CostKind) const {
  int Cost = TTIImpl->getIntrinsicCost(IID, RetTy, Arguments, U, CostKind);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

unsigned TargetTransformInfo::getEstimatedNumberOfCaseClusters(
    const SwitchInst &SI, unsigned &JTSize, ProfileSummaryInfo *PSI,
    BlockFrequencyInfo *BFI) const {
  return TTIImpl->getEstimatedNumberOfCaseClusters(SI, JTSize, PSI, BFI);
}

int TargetTransformInfo::getUserCost(const User *U,
                                     ArrayRef<const Value *> Operands,
                                     enum TargetCostKind CostKind) const {
  int Cost = TTIImpl->getUserCost(U, Operands, CostKind);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

bool TargetTransformInfo::hasBranchDivergence() const {
  return TTIImpl->hasBranchDivergence();
}

bool TargetTransformInfo::useGPUDivergenceAnalysis() const {
  return TTIImpl->useGPUDivergenceAnalysis();
}

bool TargetTransformInfo::isSourceOfDivergence(const Value *V) const {
  return TTIImpl->isSourceOfDivergence(V);
}

bool llvm::TargetTransformInfo::isAlwaysUniform(const Value *V) const {
  return TTIImpl->isAlwaysUniform(V);
}

unsigned TargetTransformInfo::getFlatAddressSpace() const {
  return TTIImpl->getFlatAddressSpace();
}

bool TargetTransformInfo::collectFlatAddressOperands(
    SmallVectorImpl<int> &OpIndexes, Intrinsic::ID IID) const {
  return TTIImpl->collectFlatAddressOperands(OpIndexes, IID);
}

bool TargetTransformInfo::rewriteIntrinsicWithAddressSpace(IntrinsicInst *II,
                                                           Value *OldV,
                                                           Value *NewV) const {
  return TTIImpl->rewriteIntrinsicWithAddressSpace(II, OldV, NewV);
}

bool TargetTransformInfo::isLoweredToCall(const Function *F) const {
  return TTIImpl->isLoweredToCall(F);
}

bool TargetTransformInfo::isHardwareLoopProfitable(
    Loop *L, ScalarEvolution &SE, AssumptionCache &AC,
    TargetLibraryInfo *LibInfo, HardwareLoopInfo &HWLoopInfo) const {
  return TTIImpl->isHardwareLoopProfitable(L, SE, AC, LibInfo, HWLoopInfo);
}

bool TargetTransformInfo::preferPredicateOverEpilogue(
    Loop *L, LoopInfo *LI, ScalarEvolution &SE, AssumptionCache &AC,
    TargetLibraryInfo *TLI, DominatorTree *DT,
    const LoopAccessInfo *LAI) const {
  return TTIImpl->preferPredicateOverEpilogue(L, LI, SE, AC, TLI, DT, LAI);
}

void TargetTransformInfo::getUnrollingPreferences(
    Loop *L, ScalarEvolution &SE, UnrollingPreferences &UP) const {
  return TTIImpl->getUnrollingPreferences(L, SE, UP);
}

bool TargetTransformInfo::isLegalAddImmediate(int64_t Imm) const {
  return TTIImpl->isLegalAddImmediate(Imm);
}

bool TargetTransformInfo::isLegalICmpImmediate(int64_t Imm) const {
  return TTIImpl->isLegalICmpImmediate(Imm);
}

bool TargetTransformInfo::isLegalAddressingMode(Type *Ty, GlobalValue *BaseGV,
                                                int64_t BaseOffset,
                                                bool HasBaseReg, int64_t Scale,
                                                unsigned AddrSpace,
                                                Instruction *I) const {
  return TTIImpl->isLegalAddressingMode(Ty, BaseGV, BaseOffset, HasBaseReg,
                                        Scale, AddrSpace, I);
}

bool TargetTransformInfo::isLSRCostLess(LSRCost &C1, LSRCost &C2) const {
  return TTIImpl->isLSRCostLess(C1, C2);
}

bool TargetTransformInfo::isProfitableLSRChainElement(Instruction *I) const {
  return TTIImpl->isProfitableLSRChainElement(I);
}

bool TargetTransformInfo::canMacroFuseCmp() const {
  return TTIImpl->canMacroFuseCmp();
}

bool TargetTransformInfo::canSaveCmp(Loop *L, BranchInst **BI,
                                     ScalarEvolution *SE, LoopInfo *LI,
                                     DominatorTree *DT, AssumptionCache *AC,
                                     TargetLibraryInfo *LibInfo) const {
  return TTIImpl->canSaveCmp(L, BI, SE, LI, DT, AC, LibInfo);
}

bool TargetTransformInfo::shouldFavorPostInc() const {
  return TTIImpl->shouldFavorPostInc();
}

bool TargetTransformInfo::shouldFavorBackedgeIndex(const Loop *L) const {
  return TTIImpl->shouldFavorBackedgeIndex(L);
}

bool TargetTransformInfo::isLegalMaskedStore(Type *DataType,
                                             Align Alignment) const {
  return TTIImpl->isLegalMaskedStore(DataType, Alignment);
}

bool TargetTransformInfo::isLegalMaskedLoad(Type *DataType,
                                            Align Alignment) const {
  return TTIImpl->isLegalMaskedLoad(DataType, Alignment);
}

bool TargetTransformInfo::isLegalNTStore(Type *DataType,
                                         Align Alignment) const {
  return TTIImpl->isLegalNTStore(DataType, Alignment);
}

bool TargetTransformInfo::isLegalNTLoad(Type *DataType, Align Alignment) const {
  return TTIImpl->isLegalNTLoad(DataType, Alignment);
}

bool TargetTransformInfo::isLegalMaskedGather(Type *DataType,
                                              Align Alignment) const {
  return TTIImpl->isLegalMaskedGather(DataType, Alignment);
}

bool TargetTransformInfo::isLegalMaskedScatter(Type *DataType,
                                               Align Alignment) const {
  return TTIImpl->isLegalMaskedScatter(DataType, Alignment);
}

bool TargetTransformInfo::isLegalMaskedCompressStore(Type *DataType) const {
  return TTIImpl->isLegalMaskedCompressStore(DataType);
}

bool TargetTransformInfo::isLegalMaskedExpandLoad(Type *DataType) const {
  return TTIImpl->isLegalMaskedExpandLoad(DataType);
}

bool TargetTransformInfo::hasDivRemOp(Type *DataType, bool IsSigned) const {
  return TTIImpl->hasDivRemOp(DataType, IsSigned);
}

bool TargetTransformInfo::hasVolatileVariant(Instruction *I,
                                             unsigned AddrSpace) const {
  return TTIImpl->hasVolatileVariant(I, AddrSpace);
}

bool TargetTransformInfo::prefersVectorizedAddressing() const {
  return TTIImpl->prefersVectorizedAddressing();
}

int TargetTransformInfo::getScalingFactorCost(Type *Ty, GlobalValue *BaseGV,
                                              int64_t BaseOffset,
                                              bool HasBaseReg, int64_t Scale,
                                              unsigned AddrSpace) const {
  int Cost = TTIImpl->getScalingFactorCost(Ty, BaseGV, BaseOffset, HasBaseReg,
                                           Scale, AddrSpace);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

bool TargetTransformInfo::LSRWithInstrQueries() const {
  return TTIImpl->LSRWithInstrQueries();
}

bool TargetTransformInfo::isTruncateFree(Type *Ty1, Type *Ty2) const {
  return TTIImpl->isTruncateFree(Ty1, Ty2);
}

bool TargetTransformInfo::isProfitableToHoist(Instruction *I) const {
  return TTIImpl->isProfitableToHoist(I);
}

bool TargetTransformInfo::useAA() const { return TTIImpl->useAA(); }

bool TargetTransformInfo::isTypeLegal(Type *Ty) const {
  return TTIImpl->isTypeLegal(Ty);
}

bool TargetTransformInfo::shouldBuildLookupTables() const {
  return TTIImpl->shouldBuildLookupTables();
}
bool TargetTransformInfo::shouldBuildLookupTablesForConstant(
    Constant *C) const {
  return TTIImpl->shouldBuildLookupTablesForConstant(C);
}

bool TargetTransformInfo::useColdCCForColdCall(Function &F) const {
  return TTIImpl->useColdCCForColdCall(F);
}

unsigned
TargetTransformInfo::getScalarizationOverhead(VectorType *Ty,
                                              const APInt &DemandedElts,
                                              bool Insert, bool Extract) const {
  return TTIImpl->getScalarizationOverhead(Ty, DemandedElts, Insert, Extract);
}

unsigned TargetTransformInfo::getOperandsScalarizationOverhead(
    ArrayRef<const Value *> Args, unsigned VF) const {
  return TTIImpl->getOperandsScalarizationOverhead(Args, VF);
}

bool TargetTransformInfo::supportsEfficientVectorElementLoadStore() const {
  return TTIImpl->supportsEfficientVectorElementLoadStore();
}

bool TargetTransformInfo::enableAggressiveInterleaving(
    bool LoopHasReductions) const {
  return TTIImpl->enableAggressiveInterleaving(LoopHasReductions);
}

TargetTransformInfo::MemCmpExpansionOptions
TargetTransformInfo::enableMemCmpExpansion(bool OptSize, bool IsZeroCmp) const {
  return TTIImpl->enableMemCmpExpansion(OptSize, IsZeroCmp);
}

bool TargetTransformInfo::enableInterleavedAccessVectorization() const {
  return TTIImpl->enableInterleavedAccessVectorization();
}

bool TargetTransformInfo::enableMaskedInterleavedAccessVectorization() const {
  return TTIImpl->enableMaskedInterleavedAccessVectorization();
}

bool TargetTransformInfo::isFPVectorizationPotentiallyUnsafe() const {
  return TTIImpl->isFPVectorizationPotentiallyUnsafe();
}

bool TargetTransformInfo::allowsMisalignedMemoryAccesses(LLVMContext &Context,
                                                         unsigned BitWidth,
                                                         unsigned AddressSpace,
                                                         unsigned Alignment,
                                                         bool *Fast) const {
  return TTIImpl->allowsMisalignedMemoryAccesses(Context, BitWidth,
                                                 AddressSpace, Alignment, Fast);
}

TargetTransformInfo::PopcntSupportKind
TargetTransformInfo::getPopcntSupport(unsigned IntTyWidthInBit) const {
  return TTIImpl->getPopcntSupport(IntTyWidthInBit);
}

bool TargetTransformInfo::haveFastSqrt(Type *Ty) const {
  return TTIImpl->haveFastSqrt(Ty);
}

bool TargetTransformInfo::isFCmpOrdCheaperThanFCmpZero(Type *Ty) const {
  return TTIImpl->isFCmpOrdCheaperThanFCmpZero(Ty);
}

int TargetTransformInfo::getFPOpCost(Type *Ty) const {
  int Cost = TTIImpl->getFPOpCost(Ty);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getIntImmCodeSizeCost(unsigned Opcode, unsigned Idx,
                                               const APInt &Imm,
                                               Type *Ty) const {
  int Cost = TTIImpl->getIntImmCodeSizeCost(Opcode, Idx, Imm, Ty);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getIntImmCost(const APInt &Imm, Type *Ty,
                                       TTI::TargetCostKind CostKind) const {
  int Cost = TTIImpl->getIntImmCost(Imm, Ty, CostKind);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int
TargetTransformInfo::getIntImmCostInst(unsigned Opcode, unsigned Idx,
                                       const APInt &Imm, Type *Ty,
                                       TTI::TargetCostKind CostKind) const {
  int Cost = TTIImpl->getIntImmCostInst(Opcode, Idx, Imm, Ty, CostKind);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int
TargetTransformInfo::getIntImmCostIntrin(Intrinsic::ID IID, unsigned Idx,
                                         const APInt &Imm, Type *Ty,
                                         TTI::TargetCostKind CostKind) const {
  int Cost = TTIImpl->getIntImmCostIntrin(IID, Idx, Imm, Ty, CostKind);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

unsigned TargetTransformInfo::getNumberOfRegisters(unsigned ClassID) const {
  return TTIImpl->getNumberOfRegisters(ClassID);
}

unsigned TargetTransformInfo::getRegisterClassForType(bool Vector,
                                                      Type *Ty) const {
  return TTIImpl->getRegisterClassForType(Vector, Ty);
}

const char *TargetTransformInfo::getRegisterClassName(unsigned ClassID) const {
  return TTIImpl->getRegisterClassName(ClassID);
}

unsigned TargetTransformInfo::getRegisterBitWidth(bool Vector) const {
  return TTIImpl->getRegisterBitWidth(Vector);
}

unsigned TargetTransformInfo::getMinVectorRegisterBitWidth() const {
  return TTIImpl->getMinVectorRegisterBitWidth();
}

bool TargetTransformInfo::shouldMaximizeVectorBandwidth(bool OptSize) const {
  return TTIImpl->shouldMaximizeVectorBandwidth(OptSize);
}

unsigned TargetTransformInfo::getMinimumVF(unsigned ElemWidth) const {
  return TTIImpl->getMinimumVF(ElemWidth);
}

bool TargetTransformInfo::shouldConsiderAddressTypePromotion(
    const Instruction &I, bool &AllowPromotionWithoutCommonHeader) const {
  return TTIImpl->shouldConsiderAddressTypePromotion(
      I, AllowPromotionWithoutCommonHeader);
}

unsigned TargetTransformInfo::getCacheLineSize() const {
  return TTIImpl->getCacheLineSize();
}

llvm::Optional<unsigned>
TargetTransformInfo::getCacheSize(CacheLevel Level) const {
  return TTIImpl->getCacheSize(Level);
}

llvm::Optional<unsigned>
TargetTransformInfo::getCacheAssociativity(CacheLevel Level) const {
  return TTIImpl->getCacheAssociativity(Level);
}

unsigned TargetTransformInfo::getPrefetchDistance() const {
  return TTIImpl->getPrefetchDistance();
}

unsigned TargetTransformInfo::getMinPrefetchStride(
    unsigned NumMemAccesses, unsigned NumStridedMemAccesses,
    unsigned NumPrefetches, bool HasCall) const {
  return TTIImpl->getMinPrefetchStride(NumMemAccesses, NumStridedMemAccesses,
                                       NumPrefetches, HasCall);
}

unsigned TargetTransformInfo::getMaxPrefetchIterationsAhead() const {
  return TTIImpl->getMaxPrefetchIterationsAhead();
}

bool TargetTransformInfo::enableWritePrefetching() const {
  return TTIImpl->enableWritePrefetching();
}

unsigned TargetTransformInfo::getMaxInterleaveFactor(unsigned VF) const {
  return TTIImpl->getMaxInterleaveFactor(VF);
}

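// For example, a splat constant operand such as
//   <4 x i32> <i32 8, i32 8, i32 8, i32 8>
// is classified as OK_UniformConstantValue with OP_PowerOf2, while a vector
// of mixed constants is classified as OK_NonUniformConstantValue.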
TargetTransformInfo::OperandValueKind
TargetTransformInfo::getOperandInfo(Value *V, OperandValueProperties &OpProps) {
  OperandValueKind OpInfo = OK_AnyValue;
  OpProps = OP_None;

  if (auto *CI = dyn_cast<ConstantInt>(V)) {
    if (CI->getValue().isPowerOf2())
      OpProps = OP_PowerOf2;
    return OK_UniformConstantValue;
  }

  // A broadcast shuffle creates a uniform value.
  // TODO: Add support for non-zero index broadcasts.
  // TODO: Add support for different source vector width.
  if (auto *ShuffleInst = dyn_cast<ShuffleVectorInst>(V))
    if (ShuffleInst->isZeroEltSplat())
      OpInfo = OK_UniformValue;

  const Value *Splat = getSplatValue(V);

  // Check for a splat of a constant or for a non-uniform vector of constants,
  // and check if the constant(s) are all powers of two.
  if (isa<ConstantVector>(V) || isa<ConstantDataVector>(V)) {
    OpInfo = OK_NonUniformConstantValue;
    if (Splat) {
      OpInfo = OK_UniformConstantValue;
      if (auto *CI = dyn_cast<ConstantInt>(Splat))
        if (CI->getValue().isPowerOf2())
          OpProps = OP_PowerOf2;
    } else if (auto *CDS = dyn_cast<ConstantDataSequential>(V)) {
      OpProps = OP_PowerOf2;
      for (unsigned I = 0, E = CDS->getNumElements(); I != E; ++I) {
        if (auto *CI = dyn_cast<ConstantInt>(CDS->getElementAsConstant(I)))
          if (CI->getValue().isPowerOf2())
            continue;
        OpProps = OP_None;
        break;
      }
    }
  }

  // Check for a splat of a uniform value. This is not loop aware, so return
  // true only for the obviously uniform cases (argument, globalvalue).
  if (Splat && (isa<Argument>(Splat) || isa<GlobalValue>(Splat)))
    OpInfo = OK_UniformValue;

  return OpInfo;
}

int TargetTransformInfo::getArithmeticInstrCost(
    unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind,
    OperandValueKind Opd1Info,
    OperandValueKind Opd2Info, OperandValueProperties Opd1PropInfo,
    OperandValueProperties Opd2PropInfo, ArrayRef<const Value *> Args,
    const Instruction *CxtI) const {
  int Cost = TTIImpl->getArithmeticInstrCost(
      Opcode, Ty, CostKind, Opd1Info, Opd2Info, Opd1PropInfo, Opd2PropInfo,
      Args, CxtI);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getShuffleCost(ShuffleKind Kind, VectorType *Ty,
                                        int Index, VectorType *SubTp) const {
  int Cost = TTIImpl->getShuffleCost(Kind, Ty, Index, SubTp);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src,
                                          TTI::TargetCostKind CostKind,
                                          const Instruction *I) const {
  assert((I == nullptr || I->getOpcode() == Opcode) &&
         "Opcode should reflect passed instruction.");
  int Cost = TTIImpl->getCastInstrCost(Opcode, Dst, Src, CostKind, I);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getExtractWithExtendCost(unsigned Opcode, Type *Dst,
                                                  VectorType *VecTy,
                                                  unsigned Index) const {
  int Cost = TTIImpl->getExtractWithExtendCost(Opcode, Dst, VecTy, Index);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getCFInstrCost(unsigned Opcode,
                                        TTI::TargetCostKind CostKind) const {
  int Cost = TTIImpl->getCFInstrCost(Opcode, CostKind);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getCmpSelInstrCost(unsigned Opcode, Type *ValTy,
                                            Type *CondTy,
                                            TTI::TargetCostKind CostKind,
                                            const Instruction *I) const {
  assert((I == nullptr || I->getOpcode() == Opcode) &&
         "Opcode should reflect passed instruction.");
  int Cost = TTIImpl->getCmpSelInstrCost(Opcode, ValTy, CondTy, CostKind, I);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getVectorInstrCost(unsigned Opcode, Type *Val,
                                            unsigned Index) const {
  int Cost = TTIImpl->getVectorInstrCost(Opcode, Val, Index);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getMemoryOpCost(unsigned Opcode, Type *Src,
                                         Align Alignment, unsigned AddressSpace,
                                         TTI::TargetCostKind CostKind,
                                         const Instruction *I) const {
  assert((I == nullptr || I->getOpcode() == Opcode) &&
         "Opcode should reflect passed instruction.");
  int Cost = TTIImpl->getMemoryOpCost(Opcode, Src, Alignment, AddressSpace,
                                      CostKind, I);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getMaskedMemoryOpCost(unsigned Opcode, Type *Src,
                                               unsigned Alignment,
                                               unsigned AddressSpace,
                                               TTI::TargetCostKind CostKind) const {
  int Cost =
      TTIImpl->getMaskedMemoryOpCost(Opcode, Src, Alignment, AddressSpace,
                                     CostKind);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getGatherScatterOpCost(
    unsigned Opcode, Type *DataTy, Value *Ptr, bool VariableMask,
    unsigned Alignment, TTI::TargetCostKind CostKind,
    const Instruction *I) const {
  int Cost = TTIImpl->getGatherScatterOpCost(Opcode, DataTy, Ptr, VariableMask,
                                             Alignment, CostKind, I);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getInterleavedMemoryOpCost(
    unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef<unsigned> Indices,
    unsigned Alignment, unsigned AddressSpace,
    TTI::TargetCostKind CostKind,
    bool UseMaskForCond, bool UseMaskForGaps) const {
  int Cost = TTIImpl->getInterleavedMemoryOpCost(
      Opcode, VecTy, Factor, Indices, Alignment, AddressSpace, CostKind,
      UseMaskForCond, UseMaskForGaps);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int
TargetTransformInfo::getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA,
                                           TTI::TargetCostKind CostKind) const {
  int Cost = TTIImpl->getIntrinsicInstrCost(ICA, CostKind);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getCallInstrCost(Function *F, Type *RetTy,
                                          ArrayRef<Type *> Tys,
                                          TTI::TargetCostKind CostKind) const {
  int Cost = TTIImpl->getCallInstrCost(F, RetTy, Tys, CostKind);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

unsigned TargetTransformInfo::getNumberOfParts(Type *Tp) const {
  return TTIImpl->getNumberOfParts(Tp);
}

int TargetTransformInfo::getAddressComputationCost(Type *Tp,
                                                   ScalarEvolution *SE,
                                                   const SCEV *Ptr) const {
  int Cost = TTIImpl->getAddressComputationCost(Tp, SE, Ptr);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getMemcpyCost(const Instruction *I) const {
  int Cost = TTIImpl->getMemcpyCost(I);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getArithmeticReductionCost(unsigned Opcode,
                                                    VectorType *Ty,
                                                    bool IsPairwiseForm,
                                                    TTI::TargetCostKind CostKind) const {
  int Cost = TTIImpl->getArithmeticReductionCost(Opcode, Ty, IsPairwiseForm,
                                                 CostKind);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

int TargetTransformInfo::getMinMaxReductionCost(
    VectorType *Ty, VectorType *CondTy, bool IsPairwiseForm, bool IsUnsigned,
    TTI::TargetCostKind CostKind) const {
  int Cost =
      TTIImpl->getMinMaxReductionCost(Ty, CondTy, IsPairwiseForm, IsUnsigned,
                                      CostKind);
  assert(Cost >= 0 && "TTI should not produce negative costs!");
  return Cost;
}

unsigned
TargetTransformInfo::getCostOfKeepingLiveOverCall(ArrayRef<Type *> Tys) const {
  return TTIImpl->getCostOfKeepingLiveOverCall(Tys);
}

bool TargetTransformInfo::getTgtMemIntrinsic(IntrinsicInst *Inst,
                                             MemIntrinsicInfo &Info) const {
  return TTIImpl->getTgtMemIntrinsic(Inst, Info);
}

unsigned TargetTransformInfo::getAtomicMemIntrinsicMaxElementSize() const {
  return TTIImpl->getAtomicMemIntrinsicMaxElementSize();
}

Value *TargetTransformInfo::getOrCreateResultFromMemIntrinsic(
    IntrinsicInst *Inst, Type *ExpectedType) const {
  return TTIImpl->getOrCreateResultFromMemIntrinsic(Inst, ExpectedType);
}

Type *TargetTransformInfo::getMemcpyLoopLoweringType(
    LLVMContext &Context, Value *Length, unsigned SrcAddrSpace,
    unsigned DestAddrSpace, unsigned SrcAlign, unsigned DestAlign) const {
  return TTIImpl->getMemcpyLoopLoweringType(Context, Length, SrcAddrSpace,
                                            DestAddrSpace, SrcAlign, DestAlign);
}

void TargetTransformInfo::getMemcpyLoopResidualLoweringType(
    SmallVectorImpl<Type *> &OpsOut, LLVMContext &Context,
    unsigned RemainingBytes, unsigned SrcAddrSpace, unsigned DestAddrSpace,
    unsigned SrcAlign, unsigned DestAlign) const {
  TTIImpl->getMemcpyLoopResidualLoweringType(OpsOut, Context, RemainingBytes,
                                             SrcAddrSpace, DestAddrSpace,
                                             SrcAlign, DestAlign);
}

bool TargetTransformInfo::areInlineCompatible(const Function *Caller,
                                              const Function *Callee) const {
  return TTIImpl->areInlineCompatible(Caller, Callee);
}

bool TargetTransformInfo::areFunctionArgsABICompatible(
    const Function *Caller, const Function *Callee,
    SmallPtrSetImpl<Argument *> &Args) const {
  return TTIImpl->areFunctionArgsABICompatible(Caller, Callee, Args);
}

bool TargetTransformInfo::isIndexedLoadLegal(MemIndexedMode Mode,
                                             Type *Ty) const {
  return TTIImpl->isIndexedLoadLegal(Mode, Ty);
}

bool TargetTransformInfo::isIndexedStoreLegal(MemIndexedMode Mode,
                                              Type *Ty) const {
  return TTIImpl->isIndexedStoreLegal(Mode, Ty);
}

unsigned TargetTransformInfo::getLoadStoreVecRegBitWidth(unsigned AS) const {
  return TTIImpl->getLoadStoreVecRegBitWidth(AS);
}

bool TargetTransformInfo::isLegalToVectorizeLoad(LoadInst *LI) const {
  return TTIImpl->isLegalToVectorizeLoad(LI);
}

bool TargetTransformInfo::isLegalToVectorizeStore(StoreInst *SI) const {
  return TTIImpl->isLegalToVectorizeStore(SI);
}

bool TargetTransformInfo::isLegalToVectorizeLoadChain(
    unsigned ChainSizeInBytes, unsigned Alignment, unsigned AddrSpace) const {
  return TTIImpl->isLegalToVectorizeLoadChain(ChainSizeInBytes, Alignment,
                                              AddrSpace);
}

bool TargetTransformInfo::isLegalToVectorizeStoreChain(
    unsigned ChainSizeInBytes, unsigned Alignment, unsigned AddrSpace) const {
  return TTIImpl->isLegalToVectorizeStoreChain(ChainSizeInBytes, Alignment,
                                               AddrSpace);
}

unsigned TargetTransformInfo::getLoadVectorFactor(unsigned VF,
                                                  unsigned LoadSize,
                                                  unsigned ChainSizeInBytes,
                                                  VectorType *VecTy) const {
  return TTIImpl->getLoadVectorFactor(VF, LoadSize, ChainSizeInBytes, VecTy);
}

unsigned TargetTransformInfo::getStoreVectorFactor(unsigned VF,
                                                   unsigned StoreSize,
                                                   unsigned ChainSizeInBytes,
                                                   VectorType *VecTy) const {
  return TTIImpl->getStoreVectorFactor(VF, StoreSize, ChainSizeInBytes, VecTy);
}

bool TargetTransformInfo::useReductionIntrinsic(unsigned Opcode, Type *Ty,
                                                ReductionFlags Flags) const {
  return TTIImpl->useReductionIntrinsic(Opcode, Ty, Flags);
}

bool TargetTransformInfo::shouldExpandReduction(const IntrinsicInst *II) const {
  return TTIImpl->shouldExpandReduction(II);
}

unsigned TargetTransformInfo::getGISelRematGlobalCost() const {
  return TTIImpl->getGISelRematGlobalCost();
}

int TargetTransformInfo::getInstructionLatency(const Instruction *I) const {
  return TTIImpl->getInstructionLatency(I);
}

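// For example, at Level 1 the expected left-hand mask is <0, 2, undef, ...>
// and the right-hand mask is <1, 3, undef, ...>; each level doubles the
// number of significant mask lanes (1 << Level).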
static bool matchPairwiseShuffleMask(ShuffleVectorInst *SI, bool IsLeft,
                                     unsigned Level) {
  // We don't need a shuffle if we just want to have element 0 in position 0 of
  // the vector.
  if (!SI && Level == 0 && IsLeft)
    return true;
  else if (!SI)
    return false;

  SmallVector<int, 32> Mask(SI->getType()->getNumElements(), -1);

  // Build a mask of 0, 2, ... (left) or 1, 3, ... (right) depending on whether
  // we look at the left or right side.
  for (unsigned i = 0, e = (1 << Level), val = !IsLeft; i != e; ++i, val += 2)
    Mask[i] = val;

  ArrayRef<int> ActualMask = SI->getShuffleMask();
  return Mask == ActualMask;
}

namespace {
/// Kind of the reduction data.
enum ReductionKind {
  RK_None,           /// Not a reduction.
  RK_Arithmetic,     /// Binary reduction data.
  RK_MinMax,         /// Min/max reduction data.
  RK_UnsignedMinMax, /// Unsigned min/max reduction data.
};
/// Contains opcode + LHS/RHS parts of the reduction operations.
struct ReductionData {
  ReductionData() = delete;
  ReductionData(ReductionKind Kind, unsigned Opcode, Value *LHS, Value *RHS)
      : Opcode(Opcode), LHS(LHS), RHS(RHS), Kind(Kind) {
    assert(Kind != RK_None && "expected binary or min/max reduction only.");
  }
  unsigned Opcode = 0;
  Value *LHS = nullptr;
  Value *RHS = nullptr;
  ReductionKind Kind = RK_None;
  bool hasSameData(ReductionData &RD) const {
    return Kind == RD.Kind && Opcode == RD.Opcode;
  }
};
} // namespace

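// Matches a single reduction step: any binary operator, or a select whose
// condition is a min/max compare. For example
//   %c = icmp slt i32 %a, %b
//   %m = select i1 %c, i32 %a, i32 %b
// yields RK_MinMax with the compare's opcode recorded as Opcode.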
static Optional<ReductionData> getReductionData(Instruction *I) {
  Value *L, *R;
  if (m_BinOp(m_Value(L), m_Value(R)).match(I))
    return ReductionData(RK_Arithmetic, I->getOpcode(), L, R);
  if (auto *SI = dyn_cast<SelectInst>(I)) {
    if (m_SMin(m_Value(L), m_Value(R)).match(SI) ||
        m_SMax(m_Value(L), m_Value(R)).match(SI) ||
        m_OrdFMin(m_Value(L), m_Value(R)).match(SI) ||
        m_OrdFMax(m_Value(L), m_Value(R)).match(SI) ||
        m_UnordFMin(m_Value(L), m_Value(R)).match(SI) ||
        m_UnordFMax(m_Value(L), m_Value(R)).match(SI)) {
      auto *CI = cast<CmpInst>(SI->getCondition());
      return ReductionData(RK_MinMax, CI->getOpcode(), L, R);
    }
    if (m_UMin(m_Value(L), m_Value(R)).match(SI) ||
        m_UMax(m_Value(L), m_Value(R)).match(SI)) {
      auto *CI = cast<CmpInst>(SI->getCondition());
      return ReductionData(RK_UnsignedMinMax, CI->getOpcode(), L, R);
    }
  }
  return llvm::None;
}

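// Walks the reduction tree one level per call; the top-level caller passes
// NumLevels = Log2_32(#elements), so e.g. a <4 x float> reduction is checked
// across two levels.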
static ReductionKind matchPairwiseReductionAtLevel(Instruction *I,
                                                   unsigned Level,
                                                   unsigned NumLevels) {
  // Match one level of pairwise operations.
  // %rdx.shuf.0.0 = shufflevector <4 x float> %rdx, <4 x float> undef,
  //       <4 x i32> <i32 0, i32 2, i32 undef, i32 undef>
  // %rdx.shuf.0.1 = shufflevector <4 x float> %rdx, <4 x float> undef,
  //       <4 x i32> <i32 1, i32 3, i32 undef, i32 undef>
  // %bin.rdx.0 = fadd <4 x float> %rdx.shuf.0.0, %rdx.shuf.0.1
  if (!I)
    return RK_None;

  assert(I->getType()->isVectorTy() && "Expecting a vector type");

  Optional<ReductionData> RD = getReductionData(I);
  if (!RD)
    return RK_None;

  ShuffleVectorInst *LS = dyn_cast<ShuffleVectorInst>(RD->LHS);
  if (!LS && Level)
    return RK_None;
  ShuffleVectorInst *RS = dyn_cast<ShuffleVectorInst>(RD->RHS);
  if (!RS && Level)
    return RK_None;

  // On level 0 we can omit one shufflevector instruction.
  if (!Level && !RS && !LS)
    return RK_None;

  // Shuffle inputs must match.
  Value *NextLevelOpL = LS ? LS->getOperand(0) : nullptr;
  Value *NextLevelOpR = RS ? RS->getOperand(0) : nullptr;
  Value *NextLevelOp = nullptr;
  if (NextLevelOpR && NextLevelOpL) {
    // If we have two shuffles their operands must match.
    if (NextLevelOpL != NextLevelOpR)
      return RK_None;

    NextLevelOp = NextLevelOpL;
  } else if (Level == 0 && (NextLevelOpR || NextLevelOpL)) {
    // On the first level we can omit the shufflevector <0, undef,...>. So the
    // input to the other shufflevector <1, undef> must match one of the
    // inputs to the current binary operation.
    // Example:
    //  %NextLevelOpL = shufflevector %R, <1, undef ...>
    //  %BinOp        = fadd          %NextLevelOpL, %R
    if (NextLevelOpL && NextLevelOpL != RD->RHS)
      return RK_None;
    else if (NextLevelOpR && NextLevelOpR != RD->LHS)
      return RK_None;

    NextLevelOp = NextLevelOpL ? RD->RHS : RD->LHS;
  } else
    return RK_None;

  // Check that the next level's binary operation exists and matches with the
  // current one.
  if (Level + 1 != NumLevels) {
    Optional<ReductionData> NextLevelRD =
        getReductionData(cast<Instruction>(NextLevelOp));
    if (!NextLevelRD || !RD->hasSameData(*NextLevelRD))
      return RK_None;
  }

  // Shuffle mask for pairwise operation must match.
  if (matchPairwiseShuffleMask(LS, /*IsLeft=*/true, Level)) {
    if (!matchPairwiseShuffleMask(RS, /*IsLeft=*/false, Level))
      return RK_None;
  } else if (matchPairwiseShuffleMask(RS, /*IsLeft=*/true, Level)) {
    if (!matchPairwiseShuffleMask(LS, /*IsLeft=*/false, Level))
      return RK_None;
  } else {
    return RK_None;
  }

  if (++Level == NumLevels)
    return RD->Kind;

  // Match next level.
  return matchPairwiseReductionAtLevel(cast<Instruction>(NextLevelOp), Level,
                                       NumLevels);
}

static ReductionKind matchPairwiseReduction(const ExtractElementInst *ReduxRoot,
                                            unsigned &Opcode,
                                            VectorType *&Ty) {
  if (!EnableReduxCost)
    return RK_None;

  // Need to extract the first element.
  ConstantInt *CI = dyn_cast<ConstantInt>(ReduxRoot->getOperand(1));
  unsigned Idx = ~0u;
  if (CI)
    Idx = CI->getZExtValue();
  if (Idx != 0)
    return RK_None;

  auto *RdxStart = dyn_cast<Instruction>(ReduxRoot->getOperand(0));
  if (!RdxStart)
    return RK_None;
  Optional<ReductionData> RD = getReductionData(RdxStart);
  if (!RD)
    return RK_None;

  auto *VecTy = cast<VectorType>(RdxStart->getType());
  unsigned NumVecElems = VecTy->getNumElements();
  if (!isPowerOf2_32(NumVecElems))
    return RK_None;

  // We look for a sequence of shuffle, shuffle, add triples like the following
  // that builds a pairwise reduction tree.
  //
  //  (X0, X1, X2, X3)
  //   (X0 + X1, X2 + X3, undef, undef)
  //    ((X0 + X1) + (X2 + X3), undef, undef, undef)
  //
  // %rdx.shuf.0.0 = shufflevector <4 x float> %rdx, <4 x float> undef,
  //       <4 x i32> <i32 0, i32 2, i32 undef, i32 undef>
  // %rdx.shuf.0.1 = shufflevector <4 x float> %rdx, <4 x float> undef,
  //       <4 x i32> <i32 1, i32 3, i32 undef, i32 undef>
  // %bin.rdx.0 = fadd <4 x float> %rdx.shuf.0.0, %rdx.shuf.0.1
  // %rdx.shuf.1.0 = shufflevector <4 x float> %bin.rdx.0, <4 x float> undef,
  //       <4 x i32> <i32 0, i32 undef, i32 undef, i32 undef>
  // %rdx.shuf.1.1 = shufflevector <4 x float> %bin.rdx.0, <4 x float> undef,
  //       <4 x i32> <i32 1, i32 undef, i32 undef, i32 undef>
  // %bin.rdx8 = fadd <4 x float> %rdx.shuf.1.0, %rdx.shuf.1.1
  // %r = extractelement <4 x float> %bin.rdx8, i32 0
  if (matchPairwiseReductionAtLevel(RdxStart, 0, Log2_32(NumVecElems)) ==
      RK_None)
    return RK_None;

  Opcode = RD->Opcode;
  Ty = VecTy;

  return RD->Kind;
}

static std::pair<Value *, ShuffleVectorInst *>
getShuffleAndOtherOprd(Value *L, Value *R) {
  ShuffleVectorInst *S = nullptr;

  if ((S = dyn_cast<ShuffleVectorInst>(L)))
    return std::make_pair(R, S);

  S = dyn_cast<ShuffleVectorInst>(R);
  return std::make_pair(L, S);
}

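// The walk below starts at the final fadd (whose shuffle operand has mask
// <1, undef, ...>) and works outward, doubling MaskStart each level
// (<2, 3, undef, ...>, and so on) until one element remains.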
static ReductionKind
matchVectorSplittingReduction(const ExtractElementInst *ReduxRoot,
                              unsigned &Opcode, VectorType *&Ty) {
  if (!EnableReduxCost)
    return RK_None;

  // Need to extract the first element.
  ConstantInt *CI = dyn_cast<ConstantInt>(ReduxRoot->getOperand(1));
  unsigned Idx = ~0u;
  if (CI)
    Idx = CI->getZExtValue();
  if (Idx != 0)
    return RK_None;

  auto *RdxStart = dyn_cast<Instruction>(ReduxRoot->getOperand(0));
  if (!RdxStart)
    return RK_None;
  Optional<ReductionData> RD = getReductionData(RdxStart);
  if (!RD)
    return RK_None;

  auto *VecTy = cast<VectorType>(ReduxRoot->getOperand(0)->getType());
  unsigned NumVecElems = VecTy->getNumElements();
  if (!isPowerOf2_32(NumVecElems))
    return RK_None;

  // We look for a sequence of shuffles and adds like the following, matching
  // one fadd/shufflevector pair at a time.
  //
  // %rdx.shuf = shufflevector <4 x float> %rdx, <4 x float> undef,
  //       <4 x i32> <i32 2, i32 3, i32 undef, i32 undef>
  // %bin.rdx = fadd <4 x float> %rdx, %rdx.shuf
  // %rdx.shuf7 = shufflevector <4 x float> %bin.rdx, <4 x float> undef,
  //       <4 x i32> <i32 1, i32 undef, i32 undef, i32 undef>
  // %bin.rdx8 = fadd <4 x float> %bin.rdx, %rdx.shuf7
  // %r = extractelement <4 x float> %bin.rdx8, i32 0

  unsigned MaskStart = 1;
  Instruction *RdxOp = RdxStart;
  SmallVector<int, 32> ShuffleMask(NumVecElems, 0);
  unsigned NumVecElemsRemain = NumVecElems;
  while (NumVecElemsRemain - 1) {
    // Check for the right reduction operation.
    if (!RdxOp)
      return RK_None;
    Optional<ReductionData> RDLevel = getReductionData(RdxOp);
    if (!RDLevel || !RDLevel->hasSameData(*RD))
      return RK_None;

    Value *NextRdxOp;
    ShuffleVectorInst *Shuffle;
    std::tie(NextRdxOp, Shuffle) =
        getShuffleAndOtherOprd(RDLevel->LHS, RDLevel->RHS);

    // Check that the current reduction operation and the shuffle use the same
    // value.
    if (Shuffle == nullptr)
      return RK_None;
    if (Shuffle->getOperand(0) != NextRdxOp)
      return RK_None;

    // Check that the shuffle mask matches.
    for (unsigned j = 0; j != MaskStart; ++j)
      ShuffleMask[j] = MaskStart + j;
    // Fill the rest of the mask with -1 for undef.
    std::fill(&ShuffleMask[MaskStart], ShuffleMask.end(), -1);

    ArrayRef<int> Mask = Shuffle->getShuffleMask();
    if (ShuffleMask != Mask)
      return RK_None;

    RdxOp = dyn_cast<Instruction>(NextRdxOp);
    NumVecElemsRemain /= 2;
    MaskStart *= 2;
  }

  Opcode = RD->Opcode;
  Ty = VecTy;
  return RD->Kind;
}

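// Dispatches on the instruction's opcode and forwards to the matching cost
// hook, using TCK_RecipThroughput throughout; opcodes with no model here
// return -1.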
int TargetTransformInfo::getInstructionThroughput(const Instruction *I) const {
  TTI::TargetCostKind CostKind = TTI::TCK_RecipThroughput;

  switch (I->getOpcode()) {
  case Instruction::GetElementPtr:
    return getUserCost(I, CostKind);

  case Instruction::Ret:
  case Instruction::PHI:
  case Instruction::Br: {
    return getCFInstrCost(I->getOpcode(), CostKind);
  }
  case Instruction::Add:
  case Instruction::FAdd:
  case Instruction::Sub:
  case Instruction::FSub:
  case Instruction::Mul:
  case Instruction::FMul:
  case Instruction::UDiv:
  case Instruction::SDiv:
  case Instruction::FDiv:
  case Instruction::URem:
  case Instruction::SRem:
  case Instruction::FRem:
  case Instruction::Shl:
  case Instruction::LShr:
  case Instruction::AShr:
  case Instruction::And:
  case Instruction::Or:
  case Instruction::Xor: {
    TargetTransformInfo::OperandValueKind Op1VK, Op2VK;
    TargetTransformInfo::OperandValueProperties Op1VP, Op2VP;
    Op1VK = getOperandInfo(I->getOperand(0), Op1VP);
    Op2VK = getOperandInfo(I->getOperand(1), Op2VP);
    SmallVector<const Value *, 2> Operands(I->operand_values());
    return getArithmeticInstrCost(I->getOpcode(), I->getType(), CostKind,
                                  Op1VK, Op2VK,
                                  Op1VP, Op2VP, Operands, I);
  }
  case Instruction::FNeg: {
    TargetTransformInfo::OperandValueKind Op1VK, Op2VK;
    TargetTransformInfo::OperandValueProperties Op1VP, Op2VP;
    Op1VK = getOperandInfo(I->getOperand(0), Op1VP);
    Op2VK = OK_AnyValue;
    Op2VP = OP_None;
    SmallVector<const Value *, 2> Operands(I->operand_values());
    return getArithmeticInstrCost(I->getOpcode(), I->getType(), CostKind,
                                  Op1VK, Op2VK,
                                  Op1VP, Op2VP, Operands, I);
  }
  case Instruction::Select: {
    const SelectInst *SI = cast<SelectInst>(I);
    Type *CondTy = SI->getCondition()->getType();
    return getCmpSelInstrCost(I->getOpcode(), I->getType(), CondTy,
                              CostKind, I);
  }
  case Instruction::ICmp:
  case Instruction::FCmp: {
    Type *ValTy = I->getOperand(0)->getType();
    return getCmpSelInstrCost(I->getOpcode(), ValTy, I->getType(),
                              CostKind, I);
  }
  case Instruction::Store: {
    const StoreInst *SI = cast<StoreInst>(I);
    Type *ValTy = SI->getValueOperand()->getType();
    return getMemoryOpCost(I->getOpcode(), ValTy, SI->getAlign(),
                           SI->getPointerAddressSpace(), CostKind, I);
  }
  case Instruction::Load: {
    const LoadInst *LI = cast<LoadInst>(I);
    return getMemoryOpCost(I->getOpcode(), I->getType(), LI->getAlign(),
                           LI->getPointerAddressSpace(), CostKind, I);
  }
  case Instruction::ZExt:
  case Instruction::SExt:
  case Instruction::FPToUI:
  case Instruction::FPToSI:
  case Instruction::FPExt:
  case Instruction::PtrToInt:
  case Instruction::IntToPtr:
  case Instruction::SIToFP:
  case Instruction::UIToFP:
  case Instruction::Trunc:
  case Instruction::FPTrunc:
  case Instruction::BitCast:
  case Instruction::AddrSpaceCast: {
    Type *SrcTy = I->getOperand(0)->getType();
    return getCastInstrCost(I->getOpcode(), I->getType(), SrcTy, CostKind, I);
  }
  case Instruction::ExtractElement: {
    const ExtractElementInst *EEI = cast<ExtractElementInst>(I);
    ConstantInt *CI = dyn_cast<ConstantInt>(I->getOperand(1));
    unsigned Idx = -1;
    if (CI)
      Idx = CI->getZExtValue();

    // Try to match a reduction sequence (series of shufflevector and vector
    // adds followed by an extractelement).
    unsigned ReduxOpCode;
    VectorType *ReduxType;

    switch (matchVectorSplittingReduction(EEI, ReduxOpCode, ReduxType)) {
    case RK_Arithmetic:
      return getArithmeticReductionCost(ReduxOpCode, ReduxType,
                                        /*IsPairwiseForm=*/false,
                                        CostKind);
    case RK_MinMax:
      return getMinMaxReductionCost(
          ReduxType, cast<VectorType>(CmpInst::makeCmpResultType(ReduxType)),
          /*IsPairwiseForm=*/false, /*IsUnsigned=*/false);
    case RK_UnsignedMinMax:
      return getMinMaxReductionCost(
          ReduxType, cast<VectorType>(CmpInst::makeCmpResultType(ReduxType)),
          /*IsPairwiseForm=*/false, /*IsUnsigned=*/true);
    case RK_None:
      break;
    }

    switch (matchPairwiseReduction(EEI, ReduxOpCode, ReduxType)) {
    case RK_Arithmetic:
      return getArithmeticReductionCost(ReduxOpCode, ReduxType,
                                        /*IsPairwiseForm=*/true, CostKind);
    case RK_MinMax:
      return getMinMaxReductionCost(
          ReduxType, cast<VectorType>(CmpInst::makeCmpResultType(ReduxType)),
          /*IsPairwiseForm=*/true, /*IsUnsigned=*/false);
    case RK_UnsignedMinMax:
      return getMinMaxReductionCost(
          ReduxType, cast<VectorType>(CmpInst::makeCmpResultType(ReduxType)),
          /*IsPairwiseForm=*/true, /*IsUnsigned=*/true);
    case RK_None:
      break;
    }

    return getVectorInstrCost(I->getOpcode(), EEI->getOperand(0)->getType(),
                              Idx);
  }
  case Instruction::InsertElement: {
    const InsertElementInst *IE = cast<InsertElementInst>(I);
    ConstantInt *CI = dyn_cast<ConstantInt>(IE->getOperand(2));
    unsigned Idx = -1;
    if (CI)
      Idx = CI->getZExtValue();
    return getVectorInstrCost(I->getOpcode(), IE->getType(), Idx);
  }
  case Instruction::ExtractValue:
    return 0; // Model all ExtractValue nodes as free.
  case Instruction::ShuffleVector: {
    const ShuffleVectorInst *Shuffle = cast<ShuffleVectorInst>(I);
    auto *Ty = cast<VectorType>(Shuffle->getType());
    auto *SrcTy = cast<VectorType>(Shuffle->getOperand(0)->getType());

    // TODO: Identify and add costs for insert subvector, etc.
    int SubIndex;
    if (Shuffle->isExtractSubvectorMask(SubIndex))
      return TTIImpl->getShuffleCost(SK_ExtractSubvector, SrcTy, SubIndex, Ty);

    if (Shuffle->changesLength())
      return -1;

    if (Shuffle->isIdentity())
      return 0;

    if (Shuffle->isReverse())
      return TTIImpl->getShuffleCost(SK_Reverse, Ty, 0, nullptr);

    if (Shuffle->isSelect())
      return TTIImpl->getShuffleCost(SK_Select, Ty, 0, nullptr);

    if (Shuffle->isTranspose())
      return TTIImpl->getShuffleCost(SK_Transpose, Ty, 0, nullptr);

    if (Shuffle->isZeroEltSplat())
      return TTIImpl->getShuffleCost(SK_Broadcast, Ty, 0, nullptr);

    if (Shuffle->isSingleSource())
      return TTIImpl->getShuffleCost(SK_PermuteSingleSrc, Ty, 0, nullptr);

    return TTIImpl->getShuffleCost(SK_PermuteTwoSrc, Ty, 0, nullptr);
  }
  case Instruction::Call:
    if (const IntrinsicInst *II = dyn_cast<IntrinsicInst>(I)) {
      IntrinsicCostAttributes CostAttrs(*II);
      return getIntrinsicInstrCost(CostAttrs, CostKind);
    }
    return -1;
  default:
    // We don't have any information on this instruction.
    return -1;
  }
}

TargetTransformInfo::Concept::~Concept() {}

TargetIRAnalysis::TargetIRAnalysis() : TTICallback(&getDefaultTTI) {}

TargetIRAnalysis::TargetIRAnalysis(
    std::function<Result(const Function &)> TTICallback)
    : TTICallback(std::move(TTICallback)) {}

TargetIRAnalysis::Result TargetIRAnalysis::run(const Function &F,
                                               FunctionAnalysisManager &) {
  return TTICallback(F);
}

AnalysisKey TargetIRAnalysis::Key;

TargetIRAnalysis::Result TargetIRAnalysis::getDefaultTTI(const Function &F) {
  return Result(F.getParent()->getDataLayout());
}

// Register the basic pass.
INITIALIZE_PASS(TargetTransformInfoWrapperPass, "tti",
                "Target Transform Information", false, true)
char TargetTransformInfoWrapperPass::ID = 0;

void TargetTransformInfoWrapperPass::anchor() {}

TargetTransformInfoWrapperPass::TargetTransformInfoWrapperPass()
    : ImmutablePass(ID) {
  initializeTargetTransformInfoWrapperPassPass(
      *PassRegistry::getPassRegistry());
}

TargetTransformInfoWrapperPass::TargetTransformInfoWrapperPass(
    TargetIRAnalysis TIRA)
    : ImmutablePass(ID), TIRA(std::move(TIRA)) {
  initializeTargetTransformInfoWrapperPassPass(
      *PassRegistry::getPassRegistry());
}

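// Note that getTTI below re-runs the analysis on every call with a throwaway
// FunctionAnalysisManager, caching only the most recent result.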
TargetTransformInfo &TargetTransformInfoWrapperPass::getTTI(const Function &F) {
  FunctionAnalysisManager DummyFAM;
  TTI = TIRA.run(F, DummyFAM);
  return *TTI;
}

ImmutablePass *
llvm::createTargetTransformInfoWrapperPass(TargetIRAnalysis TIRA) {
  return new TargetTransformInfoWrapperPass(std::move(TIRA));
}