; RUN: opt < %s -indvars -S | FileCheck %s
target triple = "aarch64--linux-gnu"

; Provide legal integer types.
target datalayout = "n8:16:32:64"


; Check the loop exit i32 compare instruction and operand are widened to i64
; instead of truncating IV before its use in the i32 compare instruction.

; Globals used by @test1: @idx receives the result, @e supplies the loop
; bound, and @ptr is the base pointer of the array that is scanned.
@idx = common global i32 0, align 4
@e = common global i32 0, align 4
@ptr = common global i32* null, align 8

; test1: the loop bound is loaded from @e in the preheader and compared with
; the i32 induction variable in for.cond, while for.body sign-extends that same
; variable to index the array. The directives below expect a sign-extension in
; the preheader, an i64 signed exit compare, and an i64 phi in for.body.
; CHECK-LABEL: @test1(
; CHECK: for.body.lr.ph:
; CHECK: sext i32
; CHECK: for.cond:
; CHECK: icmp slt i64
; CHECK: for.body:
; CHECK: phi i64

define i32 @test1() {
entry:
  store i32 -1, i32* @idx, align 4
  %0 = load i32, i32* @e, align 4
  %cmp4 = icmp slt i32 %0, 0
  br i1 %cmp4, label %for.end.loopexit, label %for.body.lr.ph

for.body.lr.ph:
  %1 = load i32*, i32** @ptr, align 8
  %2 = load i32, i32* @e, align 4
  br label %for.body

for.cond:
  %inc = add nsw i32 %i.05, 1
  %cmp = icmp slt i32 %i.05, %2
  br i1 %cmp, label %for.body, label %for.cond.for.end.loopexit_crit_edge

for.body:
  %i.05 = phi i32 [ 0, %for.body.lr.ph ], [ %inc, %for.cond ]
  %idxprom = sext i32 %i.05 to i64
  %arrayidx = getelementptr inbounds i32, i32* %1, i64 %idxprom
  %3 = load i32, i32* %arrayidx, align 4
  %tobool = icmp eq i32 %3, 0
  br i1 %tobool, label %if.then, label %for.cond

if.then:
  %i.05.lcssa = phi i32 [ %i.05, %for.body ]
  store i32 %i.05.lcssa, i32* @idx, align 4
  br label %for.end

for.cond.for.end.loopexit_crit_edge:
  br label %for.end.loopexit

for.end.loopexit:
  br label %for.end

for.end:
  %4 = load i32, i32* @idx, align 4
  ret i32 %4
}

; test2: nested loops. The inner loop (for.body4.us) compares its i32 counter
; against %conv, the zero-extension of the i8 argument %limit, and also
; sign-extends the counter for addressing. The directives below expect the i64
; increment to feed an unsigned i64 compare, with no truncation of the
; incremented value back to i32 and no i32 signed compare remaining.
; CHECK-LABEL: @test2(
; CHECK: for.body4.us
; CHECK: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
; CHECK: %cmp2.us = icmp ult i64
; CHECK-NOT: %2 = trunc i64 %indvars.iv.next to i32
; CHECK-NOT: %cmp2.us = icmp slt i32

define void @test2([8 x i8]* %a, i8* %b, i8 %limit) {
entry:
  %conv = zext i8 %limit to i32
  br i1 undef, label %for.cond1.preheader, label %for.cond1.preheader.us

for.cond1.preheader.us:
  %storemerge5.us = phi i32 [ 0, %entry ], [ %inc14.us, %for.inc13.us ]
  br i1 true, label %for.body4.lr.ph.us, label %for.inc13.us

for.inc13.us:
  %inc14.us = add nsw i32 %storemerge5.us, 1
  %cmp.us = icmp slt i32 %inc14.us, 4
  br i1 %cmp.us, label %for.cond1.preheader.us, label %for.end

for.body4.us:
  %storemerge14.us = phi i32 [ 0, %for.body4.lr.ph.us ], [ %inc.us, %for.body4.us ]
  %idxprom.us = sext i32 %storemerge14.us to i64
  %arrayidx6.us = getelementptr inbounds [8 x i8], [8 x i8]* %a, i64 %idxprom5.us, i64 %idxprom.us
  %0 = load i8, i8* %arrayidx6.us, align 1
  %idxprom7.us = zext i8 %0 to i64
  %arrayidx8.us = getelementptr inbounds i8, i8* %b, i64 %idxprom7.us
  %1 = load i8, i8* %arrayidx8.us, align 1
  store i8 %1, i8* %arrayidx6.us, align 1
  %inc.us = add nsw i32 %storemerge14.us, 1
  %cmp2.us = icmp slt i32 %inc.us, %conv
  br i1 %cmp2.us, label %for.body4.us, label %for.inc13.us

for.body4.lr.ph.us:
  %idxprom5.us = sext i32 %storemerge5.us to i64
  br label %for.body4.us

for.cond1.preheader:
  %storemerge5 = phi i32 [ 0, %entry ], [ %inc14, %for.inc13 ]
  br i1 false, label %for.inc13, label %for.inc13

for.inc13:
  %inc14 = add nsw i32 %storemerge5, 1
  %cmp = icmp slt i32 %inc14, 4
  br i1 %cmp, label %for.cond1.preheader, label %for.end

for.end:
  ret void
}

; test3: a summation loop whose i32 counter is compared to %b with a signed
; less-than and sign-extended for addressing. The directives below expect %b
; to be sign-extended, the phi in for.cond to be i64, and the exit compare to
; be a signed i64 compare.
; CHECK-LABEL: @test3(
; CHECK: sext i32 %b
; CHECK: for.cond:
; CHECK: phi i64
; CHECK: icmp slt i64

define i32 @test3(i32* %a, i32 %b) {
entry:
  br label %for.cond

for.cond:
  %sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
  %cmp = icmp slt i32 %i.0, %b
  br i1 %cmp, label %for.body, label %for.end

for.body:
  %idxprom = sext i32 %i.0 to i64
  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
  %0 = load i32, i32* %arrayidx, align 4
  %add = add nsw i32 %sum.0, %0
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret i32 %sum.0
}

; External callee invoked from @test4.
declare i32 @fn1(i8 signext)

; PR21030
; test4: the i8 counter %c.07 starts at -3 and is decremented by one per
; iteration; the loop continues while the decremented value is greater than
; -14 (signed). The counter is zero-extended to i32 inside the loop. The
; directives below expect an i32 phi in for.body while the exit test stays an
; i8 signed greater-than compare.
; CHECK-LABEL: @test4(
; CHECK: for.body:
; CHECK: phi i32
; CHECK: icmp sgt i8

define i32 @test4(i32 %a) {
entry:
  br label %for.body

for.body:
  %c.07 = phi i8 [ -3, %entry ], [ %dec, %for.body ]
  %conv6 = zext i8 %c.07 to i32
  %or = or i32 %a, %conv6
  %conv3 = trunc i32 %or to i8
  %call = call i32 @fn1(i8 signext %conv3)
  %dec = add i8 %c.07, -1
  %cmp = icmp sgt i8 %dec, -14
  br i1 %cmp, label %for.body, label %for.end

for.end:
  ret i32 0
}

; test5: unsigned counterpart of test3. The i32 counter is compared to %b with
; an unsigned less-or-equal and zero-extended for addressing. The directives
; below expect %b to be zero-extended, the phi in for.cond to be i64, and the
; exit compare to be an unsigned i64 compare.
; CHECK-LABEL: @test5(
; CHECK: zext i32 %b
; CHECK: for.cond:
; CHECK: phi i64
; CHECK: icmp ule i64

define i32 @test5(i32* %a, i32 %b) {
entry:
  br label %for.cond

for.cond:
  %sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
  %cmp = icmp ule i32 %i.0, %b
  br i1 %cmp, label %for.body, label %for.end

for.body:
  %idxprom = zext i32 %i.0 to i64
  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
  %0 = load i32, i32* %arrayidx, align 4
  %add = add nsw i32 %sum.0, %0
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret i32 %sum.0
}

; test6: the counter is zero-extended for addressing, but the exit test is a
; signed less-or-equal against %b. The directives below expect %b to be
; sign-extended and the exit compare to be a signed i64 compare between
; %indvars.iv and that extension.
define i32 @test6(i32* %a, i32 %b) {
; CHECK-LABEL: @test6(
; CHECK: [[B_SEXT:%[a-z0-9]+]] = sext i32 %b to i64
; CHECK: for.cond:
; CHECK: icmp sle i64 %indvars.iv, [[B_SEXT]]

entry:
  br label %for.cond

for.cond:
  %sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
  %cmp = icmp sle i32 %i.0, %b
  br i1 %cmp, label %for.body, label %for.end

for.body:
  %idxprom = zext i32 %i.0 to i64
  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
  %0 = load i32, i32* %arrayidx, align 4
  %add = add nsw i32 %sum.0, %0
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret i32 %sum.0
}

; test7: the same counter is tested twice against %b, with an unsigned
; less-or-equal in for.cond and a signed less-or-equal in for.body, and is
; sign-extended for addressing. The directives below expect both a zero- and a
; sign-extension of %b, each feeding the i64 compare of matching signedness.
define i32 @test7(i32* %a, i32 %b) {
; CHECK-LABEL: @test7(
; CHECK: [[B_ZEXT:%[a-z0-9]+]] = zext i32 %b to i64
; CHECK: [[B_SEXT:%[a-z0-9]+]] = sext i32 %b to i64
; CHECK: for.cond:
; CHECK: icmp ule i64 %indvars.iv, [[B_ZEXT]]
; CHECK: for.body:
; CHECK: icmp sle i64 %indvars.iv, [[B_SEXT]]

entry:
  br label %for.cond

for.cond:
  %sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
  %cmp = icmp ule i32 %i.0, %b
  br i1 %cmp, label %for.body, label %for.end

for.body:
  %idxprom = sext i32 %i.0 to i64
  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
  %0 = load i32, i32* %arrayidx, align 4
  %add = add nsw i32 %sum.0, %0
  %inc = add nsw i32 %i.0, 1
  %cmp2 = icmp sle i32 %i.0, %b
  br i1 %cmp2, label %for.cond, label %for.end

for.end:
  ret i32 %sum.0
}

; test8: the counter starts at %init (the loop is entered only when %init is
; greater than 0), is sign-extended for addressing, and is compared to %b with
; an unsigned less-or-equal. A second exit in for.body leaves the loop unless
; 0 is less than the incremented counter (signed). The directives below expect
; the i64 induction variable to start from the sign-extension of %init and to
; be compared against the zero-extension of %b.
define i32 @test8(i32* %a, i32 %b, i32 %init) {
; CHECK-LABEL: @test8(
; CHECK: [[INIT_SEXT:%[a-z0-9]+]] = sext i32 %init to i64
; CHECK: [[B_ZEXT:%[a-z0-9]+]] = zext i32 %b to i64
; CHECK: for.cond:
; Note: %indvars.iv is the sign extension of %i.0
; CHECK: %indvars.iv = phi i64 [ [[INIT_SEXT]], %for.cond.preheader ], [ %indvars.iv.next, %for.body ]
; CHECK: icmp ule i64 %indvars.iv, [[B_ZEXT]]

entry:
  %e = icmp sgt i32 %init, 0
  br i1 %e, label %for.cond, label %leave

for.cond:
  %sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
  %i.0 = phi i32 [ %init, %entry ], [ %inc, %for.body ]
  %cmp = icmp ule i32 %i.0, %b
  br i1 %cmp, label %for.body, label %for.end

for.body:
  %idxprom = sext i32 %i.0 to i64
  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
  %0 = load i32, i32* %arrayidx, align 4
  %add = add nsw i32 %sum.0, %0
  %inc = add nsw i32 %i.0, 1
  %cmp2 = icmp slt i32 0, %inc
  br i1 %cmp2, label %for.cond, label %for.end

for.end:
  ret i32 %sum.0

leave:
  ret i32 0
}

; test9: mirror image of test8. The counter starts at %init (the loop is
; entered only when %init is greater than 0), is zero-extended for addressing,
; and is compared to %b with a signed less-than. The directives below expect
; the i64 induction variable to start from the zero-extension of %init and to
; be compared against the sign-extension of %b.
define i32 @test9(i32* %a, i32 %b, i32 %init) {
; CHECK-LABEL: @test9(
; CHECK: [[INIT_ZEXT:%[a-z0-9]+]] = zext i32 %init to i64
; CHECK: [[B_SEXT:%[a-z0-9]+]] = sext i32 %b to i64
; CHECK: for.cond:
; Note: %indvars.iv is the zero extension of %i.0
; CHECK: %indvars.iv = phi i64 [ [[INIT_ZEXT]], %for.cond.preheader ], [ %indvars.iv.next, %for.body ]
; CHECK: icmp slt i64 %indvars.iv, [[B_SEXT]]

entry:
  %e = icmp sgt i32 %init, 0
  br i1 %e, label %for.cond, label %leave

for.cond:
  %sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
  %i.0 = phi i32 [ %init, %entry ], [ %inc, %for.body ]
  %cmp = icmp slt i32 %i.0, %b
  br i1 %cmp, label %for.body, label %for.end

for.body:
  %idxprom = zext i32 %i.0 to i64
  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
  %0 = load i32, i32* %arrayidx, align 4
  %add = add nsw i32 %sum.0, %0
  %inc = add nsw i32 %i.0, 1
  %cmp2 = icmp slt i32 0, %inc
  br i1 %cmp2, label %for.cond, label %for.end

for.end:
  ret i32 %sum.0

leave:
  ret i32 0
}

; External callees that receive the i64 extension and the i1 compare result
; computed inside @test10's loop.
declare void @consume.i64(i64)
declare void @consume.i1(i1)

; test10: %i counts up from 0 and the loop repeats while the incremented value
; is less than 11 (signed). Each iteration multiplies %i by -1, compares the
; product with %v as i32, and sign-extends the product to i64. The directives
; below expect no zext before the loop, an i64 induction variable, the multiply
; carried out in i64 with nsw, and a trunc of that product feeding the i32
; equality compare.
define i32 @test10(i32 %v) {
; CHECK-LABEL: @test10(
entry:
; CHECK-NOT: zext
  br label %loop

loop:
; CHECK: loop:
; CHECK: %indvars.iv = phi i64 [ %indvars.iv.next, %loop ], [ 0, %entry ]
; CHECK: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
; CHECK: [[MUL:%[a-z0-9]+]] = mul nsw i64 %indvars.iv, -1
; CHECK: [[MUL_TRUNC:%[a-z0-9]+]] = trunc i64 [[MUL]] to i32
; CHECK: [[CMP:%[a-z0-9]+]] = icmp eq i32 [[MUL_TRUNC]], %v
; CHECK: call void @consume.i1(i1 [[CMP]])

  %i = phi i32 [ 0, %entry ], [ %i.inc, %loop ]
  %i.inc = add i32 %i, 1
  %iv = mul i32 %i, -1
  %cmp = icmp eq i32 %iv, %v
  call void @consume.i1(i1 %cmp)
  %be.cond = icmp slt i32 %i.inc, 11
  %ext = sext i32 %iv to i64
  call void @consume.i64(i64 %ext)
  br i1 %be.cond, label %loop, label %leave

leave:
  ret i32 22
}