annotate lib/Target/NVPTX/NVVMReflect.cpp @ 131:f476a9ba4795

http://llvm.org/svn/llvm-project/compiler-rt/trunk compiler-rt
author mir3636
date Fri, 16 Feb 2018 21:02:11 +0900
parents 803732b1fca8
children c2174574ed3a
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
1 //===- NVVMReflect.cpp - NVVM Emulate conditional compilation -------------===//
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
2 //
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
3 // The LLVM Compiler Infrastructure
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
4 //
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
5 // This file is distributed under the University of Illinois Open Source
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
6 // License. See LICENSE.TXT for details.
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
7 //
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
8 //===----------------------------------------------------------------------===//
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
9 //
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
10 // This pass replaces occurrences of __nvvm_reflect("foo") and llvm.nvvm.reflect
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
11 // with an integer.
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
12 //
121
803732b1fca8 LLVM 5.0
kono
parents: 120
diff changeset
13 // We choose the value we use by looking at metadata in the module itself. Note
803732b1fca8 LLVM 5.0
kono
parents: 120
diff changeset
14 // that we intentionally only have one way to choose these values, because other
803732b1fca8 LLVM 5.0
kono
parents: 120
diff changeset
15 // parts of LLVM (particularly, InstCombineCall) rely on being able to predict
803732b1fca8 LLVM 5.0
kono
parents: 120
diff changeset
16 // the values chosen by this pass.
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
17 //
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
18 // If we see an unknown string, we replace its call with 0.
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
19 //
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
20 //===----------------------------------------------------------------------===//
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
21
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
22 #include "NVPTX.h"
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
23 #include "llvm/ADT/SmallVector.h"
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
24 #include "llvm/ADT/StringMap.h"
77
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
25 #include "llvm/IR/Constants.h"
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
26 #include "llvm/IR/DerivedTypes.h"
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
27 #include "llvm/IR/Function.h"
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
28 #include "llvm/IR/InstIterator.h"
77
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
29 #include "llvm/IR/Instructions.h"
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
30 #include "llvm/IR/Intrinsics.h"
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
31 #include "llvm/IR/Module.h"
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
32 #include "llvm/IR/Type.h"
77
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
33 #include "llvm/Pass.h"
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
34 #include "llvm/Support/CommandLine.h"
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
35 #include "llvm/Support/Debug.h"
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
36 #include "llvm/Support/raw_os_ostream.h"
95
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
37 #include "llvm/Support/raw_ostream.h"
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
38 #include "llvm/Transforms/Scalar.h"
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
39 #include <sstream>
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
40 #include <string>
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
41 #define NVVM_REFLECT_FUNCTION "__nvvm_reflect"
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
42
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
43 using namespace llvm;
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
44
77
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
45 #define DEBUG_TYPE "nvptx-reflect"
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
46
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
47 namespace llvm { void initializeNVVMReflectPass(PassRegistry &); }
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
48
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
49 namespace {
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
50 class NVVMReflect : public FunctionPass {
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
51 public:
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
52 static char ID;
121
803732b1fca8 LLVM 5.0
kono
parents: 120
diff changeset
53 NVVMReflect() : FunctionPass(ID) {
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
54 initializeNVVMReflectPass(*PassRegistry::getPassRegistry());
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
55 }
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
56
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
57 bool runOnFunction(Function &) override;
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
58 };
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
59 }
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
60
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
61 FunctionPass *llvm::createNVVMReflectPass() { return new NVVMReflect(); }
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
62
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
63 static cl::opt<bool>
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
64 NVVMReflectEnabled("nvvm-reflect-enable", cl::init(true), cl::Hidden,
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
65 cl::desc("NVVM reflection, enabled by default"));
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
66
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
67 char NVVMReflect::ID = 0;
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
68 INITIALIZE_PASS(NVVMReflect, "nvvm-reflect",
77
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
69 "Replace occurrences of __nvvm_reflect() calls with 0/1", false,
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
70 false)
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
71
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
72 bool NVVMReflect::runOnFunction(Function &F) {
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
73 if (!NVVMReflectEnabled)
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
74 return false;
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
75
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
76 if (F.getName() == NVVM_REFLECT_FUNCTION) {
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
77 assert(F.isDeclaration() && "_reflect function should not have a body");
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
78 assert(F.getReturnType()->isIntegerTy() &&
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
79 "_reflect's return type should be integer");
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
80 return false;
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
81 }
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
82
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
83 SmallVector<Instruction *, 4> ToRemove;
95
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
84
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
85 // Go through the calls in this function. Each call to __nvvm_reflect or
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
86 // llvm.nvvm.reflect should be a CallInst whose argument is a constant
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
87 // C string. First validate that. If the string can be extracted and is one
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
88 // this pass knows about (currently only "__CUDA_FTZ", whose value is read
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
89 // from the nvvm-reflect-ftz module flag), replace the uses of the CallInst
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
90 // with that value. Otherwise, replace the uses with value 0.
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
91
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
92 // The IR for __nvvm_reflect calls differs between CUDA versions.
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
93 //
95
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
94 // CUDA 6.5 and earlier uses this sequence:
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
95 // %ptr = tail call i8* @llvm.nvvm.ptr.constant.to.gen.p0i8.p4i8
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
96 // (i8 addrspace(4)* getelementptr inbounds
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
97 // ([8 x i8], [8 x i8] addrspace(4)* @str, i32 0, i32 0))
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
98 // %reflect = tail call i32 @__nvvm_reflect(i8* %ptr)
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
99 //
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
100 // The value returned by Sym->getOperand(0) is a Constant with a
95
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
101 // ConstantDataSequential operand which can be converted to string and used
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
102 // for lookup.
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
103 //
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
104 // CUDA 7.0 does it slightly differently:
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
105 // %reflect = call i32 @__nvvm_reflect(i8* addrspacecast
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
106 // (i8 addrspace(1)* getelementptr inbounds
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
107 // ([8 x i8], [8 x i8] addrspace(1)* @str, i32 0, i32 0) to i8*))
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
108 //
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
109 // In this case, we get a Constant with a GlobalVariable operand and we need
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
110 // to dig deeper to find its initializer with the string we'll use for lookup.
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
111 for (Instruction &I : instructions(F)) {
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
112 CallInst *Call = dyn_cast<CallInst>(&I);
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
113 if (!Call)
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
114 continue;
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
115 Function *Callee = Call->getCalledFunction();
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
116 if (!Callee || (Callee->getName() != NVVM_REFLECT_FUNCTION &&
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
117 Callee->getIntrinsicID() != Intrinsic::nvvm_reflect))
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
118 continue;
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
119
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
120 // FIXME: Improve error handling here and elsewhere in this pass.
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
121 assert(Call->getNumOperands() == 2 &&
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
122 "Wrong number of operands to __nvvm_reflect function");
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
123
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
124 // In cuda 6.5 and earlier, we will have an extra constant-to-generic
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
125 // conversion of the string.
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
126 const Value *Str = Call->getArgOperand(0);
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
127 if (const CallInst *ConvCall = dyn_cast<CallInst>(Str)) {
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
128 // FIXME: Add assertions about ConvCall.
77
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
129 Str = ConvCall->getArgOperand(0);
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
130 }
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
131 assert(isa<ConstantExpr>(Str) &&
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
132 "Format of __nvvm__reflect function not recognized");
77
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
133 const ConstantExpr *GEP = cast<ConstantExpr>(Str);
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
134
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
135 const Value *Sym = GEP->getOperand(0);
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
136 assert(isa<Constant>(Sym) &&
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
137 "Format of __nvvm_reflect function not recognized");
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
138
95
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
139 const Value *Operand = cast<Constant>(Sym)->getOperand(0);
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
140 if (const GlobalVariable *GV = dyn_cast<GlobalVariable>(Operand)) {
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
141 // For CUDA-7.0 style __nvvm_reflect calls, we need to find the operand's
95
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
142 // initializer.
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
143 assert(GV->hasInitializer() &&
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
144 "Format of _reflect function not recognized");
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
145 const Constant *Initializer = GV->getInitializer();
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
146 Operand = Initializer;
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
147 }
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
148
95
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
149 assert(isa<ConstantDataSequential>(Operand) &&
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
150 "Format of _reflect function not recognized");
95
afa8332a0e37 LLVM 3.8
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 77
diff changeset
151 assert(cast<ConstantDataSequential>(Operand)->isCString() &&
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
152 "Format of _reflect function not recognized");
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
153
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
154 StringRef ReflectArg = cast<ConstantDataSequential>(Operand)->getAsString();
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
155 ReflectArg = ReflectArg.substr(0, ReflectArg.size() - 1);
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
156 DEBUG(dbgs() << "Arg of _reflect : " << ReflectArg << "\n");
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
157
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
158 int ReflectVal = 0; // The default value is 0
121
803732b1fca8 LLVM 5.0
kono
parents: 120
diff changeset
159 if (ReflectArg == "__CUDA_FTZ") {
803732b1fca8 LLVM 5.0
kono
parents: 120
diff changeset
160 // Try to pull __CUDA_FTZ from the nvvm-reflect-ftz module flag. Our
803732b1fca8 LLVM 5.0
kono
parents: 120
diff changeset
161 // choice here must be kept in sync with AutoUpgrade, which uses the same
803732b1fca8 LLVM 5.0
kono
parents: 120
diff changeset
162 // technique to detect whether ftz is enabled.
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
163 if (auto *Flag = mdconst::extract_or_null<ConstantInt>(
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
164 F.getParent()->getModuleFlag("nvvm-reflect-ftz")))
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
165 ReflectVal = Flag->getSExtValue();
0
95c75e76d11b LLVM 3.4
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff changeset
166 }
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
167 Call->replaceAllUsesWith(ConstantInt::get(Call->getType(), ReflectVal));
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
168 ToRemove.push_back(Call);
77
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
169 }
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
170
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
171 for (Instruction *I : ToRemove)
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
172 I->eraseFromParent();
77
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
173
120
1172e4bd9c6f update 4.0.0
mir3636
parents: 95
diff changeset
174 return ToRemove.size() > 0;
77
54457678186b LLVM 3.6
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents: 0
diff changeset
175 }