annotate test/CodeGen/Hexagon/v60-vsel1.ll @ 128:c347d3398279 default tip

fix
author mir3636
date Wed, 06 Dec 2017 14:37:17 +0900
parents 803732b1fca8
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
120
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
1 ; RUN: llc -march=hexagon < %s | FileCheck %s
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
2
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
3 ; CHECK: if (p{{[0-3]}}) v{{[0-9]+}} = v{{[0-9]+}}
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
4
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
5 target triple = "hexagon"
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
6
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
7 ; Function Attrs: nounwind
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
8 define void @fast9_detect_coarse(i8* nocapture readnone %img, i32 %xsize, i32 %stride, i32 %barrier, i32* nocapture %bitmask, i32 %boundary) #0 {
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
9 entry:
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
10 %0 = bitcast i32* %bitmask to <16 x i32>*
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
11 %1 = mul i32 %boundary, -2
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
12 %sub = add i32 %1, %xsize
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
13 %rem = and i32 %boundary, 63
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
14 %add = add i32 %sub, %rem
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
15 %2 = tail call <16 x i32> @llvm.hexagon.V6.lvsplatw(i32 -1)
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
16 %3 = tail call <16 x i32> @llvm.hexagon.V6.lvsplatw(i32 1)
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
17 %4 = tail call <512 x i1> @llvm.hexagon.V6.pred.scalar2(i32 %add)
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
18 %5 = tail call <16 x i32> @llvm.hexagon.V6.vandqrt.acc(<16 x i32> %3, <512 x i1> %4, i32 12)
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
19 %and4 = and i32 %add, 511
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
20 %cmp = icmp eq i32 %and4, 0
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
21 %sMaskR.0 = select i1 %cmp, <16 x i32> %2, <16 x i32> %5
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
22 %cmp547 = icmp sgt i32 %add, 0
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
23 br i1 %cmp547, label %for.body.lr.ph, label %for.end
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
24
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
25 for.body.lr.ph: ; preds = %entry
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
26 %6 = tail call <512 x i1> @llvm.hexagon.V6.pred.scalar2(i32 %boundary)
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
27 %7 = tail call <16 x i32> @llvm.hexagon.V6.vandqrt(<512 x i1> %6, i32 16843009)
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
28 %8 = tail call <16 x i32> @llvm.hexagon.V6.vnot(<16 x i32> %7)
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
29 %9 = add i32 %rem, %xsize
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
30 %10 = add i32 %9, -1
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
31 %11 = add i32 %10, %1
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
32 %12 = lshr i32 %11, 9
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
33 %13 = mul i32 %12, 16
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
34 %14 = add nuw nsw i32 %13, 16
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
35 %scevgep = getelementptr i32, i32* %bitmask, i32 %14
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
36 br label %for.body
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
37
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
38 for.body: ; preds = %for.body.lr.ph, %for.body
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
39 %i.050 = phi i32 [ %add, %for.body.lr.ph ], [ %sub6, %for.body ]
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
40 %sMask.049 = phi <16 x i32> [ %8, %for.body.lr.ph ], [ %2, %for.body ]
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
41 %optr.048 = phi <16 x i32>* [ %0, %for.body.lr.ph ], [ %incdec.ptr, %for.body ]
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
42 %15 = tail call <16 x i32> @llvm.hexagon.V6.vand(<16 x i32> undef, <16 x i32> %sMask.049)
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
43 %incdec.ptr = getelementptr inbounds <16 x i32>, <16 x i32>* %optr.048, i32 1
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
44 store <16 x i32> %15, <16 x i32>* %optr.048, align 64
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
45 %sub6 = add nsw i32 %i.050, -512
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
46 %cmp5 = icmp sgt i32 %sub6, 0
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
47 br i1 %cmp5, label %for.body, label %for.cond.for.end_crit_edge
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
48
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
49 for.cond.for.end_crit_edge: ; preds = %for.body
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
50 %scevgep51 = bitcast i32* %scevgep to <16 x i32>*
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
51 br label %for.end
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
52
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
53 for.end: ; preds = %for.cond.for.end_crit_edge, %entry
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
54 %optr.0.lcssa = phi <16 x i32>* [ %scevgep51, %for.cond.for.end_crit_edge ], [ %0, %entry ]
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
55 %16 = load <16 x i32>, <16 x i32>* %optr.0.lcssa, align 64
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
56 %17 = tail call <16 x i32> @llvm.hexagon.V6.vand(<16 x i32> %16, <16 x i32> %sMaskR.0)
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
57 store <16 x i32> %17, <16 x i32>* %optr.0.lcssa, align 64
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
58 ret void
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
59 }
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
60
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
61 declare <16 x i32> @llvm.hexagon.V6.lvsplatw(i32) #1
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
62 declare <512 x i1> @llvm.hexagon.V6.pred.scalar2(i32) #1
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
63 declare <16 x i32> @llvm.hexagon.V6.vandqrt.acc(<16 x i32>, <512 x i1>, i32) #1
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
64 declare <16 x i32> @llvm.hexagon.V6.vandqrt(<512 x i1>, i32) #1
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
65 declare <16 x i32> @llvm.hexagon.V6.vnot(<16 x i32>) #1
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
66 declare <16 x i32> @llvm.hexagon.V6.vand(<16 x i32>, <16 x i32>) #1
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
67
121
803732b1fca8 LLVM 5.0
kono
parents: 120
diff changeset
68 attributes #0 = { nounwind "target-cpu"="hexagonv60" "target-features"="+hvxv60,+hvx-length64b" }
120
1172e4bd9c6f update 4.0.0
mir3636
parents:
diff changeset
69 attributes #1 = { nounwind readnone }