comparison test/CodeGen/ARM/vcgt.ll @ 95:afa8332a0e37

LLVM 3.8
author Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
date Tue, 13 Oct 2015 17:48:58 +0900
parents 54457678186b
children 803732b1fca8
comparison
equal deleted inserted replaced
84:f3e34b893a5f 95:afa8332a0e37
2 ; RUN: llc -mtriple=arm-eabi -mattr=+neon -regalloc=basic %s -o - | FileCheck %s 2 ; RUN: llc -mtriple=arm-eabi -mattr=+neon -regalloc=basic %s -o - | FileCheck %s
3 3
4 define <8 x i8> @vcgts8(<8 x i8>* %A, <8 x i8>* %B) nounwind { 4 define <8 x i8> @vcgts8(<8 x i8>* %A, <8 x i8>* %B) nounwind {
5 ;CHECK-LABEL: vcgts8: 5 ;CHECK-LABEL: vcgts8:
6 ;CHECK: vcgt.s8 6 ;CHECK: vcgt.s8
7 %tmp1 = load <8 x i8>* %A 7 %tmp1 = load <8 x i8>, <8 x i8>* %A
8 %tmp2 = load <8 x i8>* %B 8 %tmp2 = load <8 x i8>, <8 x i8>* %B
9 %tmp3 = icmp sgt <8 x i8> %tmp1, %tmp2 9 %tmp3 = icmp sgt <8 x i8> %tmp1, %tmp2
10 %tmp4 = sext <8 x i1> %tmp3 to <8 x i8> 10 %tmp4 = sext <8 x i1> %tmp3 to <8 x i8>
11 ret <8 x i8> %tmp4 11 ret <8 x i8> %tmp4
12 } 12 }
13 13
14 define <4 x i16> @vcgts16(<4 x i16>* %A, <4 x i16>* %B) nounwind { 14 define <4 x i16> @vcgts16(<4 x i16>* %A, <4 x i16>* %B) nounwind {
15 ;CHECK-LABEL: vcgts16: 15 ;CHECK-LABEL: vcgts16:
16 ;CHECK: vcgt.s16 16 ;CHECK: vcgt.s16
17 %tmp1 = load <4 x i16>* %A 17 %tmp1 = load <4 x i16>, <4 x i16>* %A
18 %tmp2 = load <4 x i16>* %B 18 %tmp2 = load <4 x i16>, <4 x i16>* %B
19 %tmp3 = icmp sgt <4 x i16> %tmp1, %tmp2 19 %tmp3 = icmp sgt <4 x i16> %tmp1, %tmp2
20 %tmp4 = sext <4 x i1> %tmp3 to <4 x i16> 20 %tmp4 = sext <4 x i1> %tmp3 to <4 x i16>
21 ret <4 x i16> %tmp4 21 ret <4 x i16> %tmp4
22 } 22 }
23 23
24 define <2 x i32> @vcgts32(<2 x i32>* %A, <2 x i32>* %B) nounwind { 24 define <2 x i32> @vcgts32(<2 x i32>* %A, <2 x i32>* %B) nounwind {
25 ;CHECK-LABEL: vcgts32: 25 ;CHECK-LABEL: vcgts32:
26 ;CHECK: vcgt.s32 26 ;CHECK: vcgt.s32
27 %tmp1 = load <2 x i32>* %A 27 %tmp1 = load <2 x i32>, <2 x i32>* %A
28 %tmp2 = load <2 x i32>* %B 28 %tmp2 = load <2 x i32>, <2 x i32>* %B
29 %tmp3 = icmp sgt <2 x i32> %tmp1, %tmp2 29 %tmp3 = icmp sgt <2 x i32> %tmp1, %tmp2
30 %tmp4 = sext <2 x i1> %tmp3 to <2 x i32> 30 %tmp4 = sext <2 x i1> %tmp3 to <2 x i32>
31 ret <2 x i32> %tmp4 31 ret <2 x i32> %tmp4
32 } 32 }
33 33
34 define <8 x i8> @vcgtu8(<8 x i8>* %A, <8 x i8>* %B) nounwind { 34 define <8 x i8> @vcgtu8(<8 x i8>* %A, <8 x i8>* %B) nounwind {
35 ;CHECK-LABEL: vcgtu8: 35 ;CHECK-LABEL: vcgtu8:
36 ;CHECK: vcgt.u8 36 ;CHECK: vcgt.u8
37 %tmp1 = load <8 x i8>* %A 37 %tmp1 = load <8 x i8>, <8 x i8>* %A
38 %tmp2 = load <8 x i8>* %B 38 %tmp2 = load <8 x i8>, <8 x i8>* %B
39 %tmp3 = icmp ugt <8 x i8> %tmp1, %tmp2 39 %tmp3 = icmp ugt <8 x i8> %tmp1, %tmp2
40 %tmp4 = sext <8 x i1> %tmp3 to <8 x i8> 40 %tmp4 = sext <8 x i1> %tmp3 to <8 x i8>
41 ret <8 x i8> %tmp4 41 ret <8 x i8> %tmp4
42 } 42 }
43 43
44 define <4 x i16> @vcgtu16(<4 x i16>* %A, <4 x i16>* %B) nounwind { 44 define <4 x i16> @vcgtu16(<4 x i16>* %A, <4 x i16>* %B) nounwind {
45 ;CHECK-LABEL: vcgtu16: 45 ;CHECK-LABEL: vcgtu16:
46 ;CHECK: vcgt.u16 46 ;CHECK: vcgt.u16
47 %tmp1 = load <4 x i16>* %A 47 %tmp1 = load <4 x i16>, <4 x i16>* %A
48 %tmp2 = load <4 x i16>* %B 48 %tmp2 = load <4 x i16>, <4 x i16>* %B
49 %tmp3 = icmp ugt <4 x i16> %tmp1, %tmp2 49 %tmp3 = icmp ugt <4 x i16> %tmp1, %tmp2
50 %tmp4 = sext <4 x i1> %tmp3 to <4 x i16> 50 %tmp4 = sext <4 x i1> %tmp3 to <4 x i16>
51 ret <4 x i16> %tmp4 51 ret <4 x i16> %tmp4
52 } 52 }
53 53
54 define <2 x i32> @vcgtu32(<2 x i32>* %A, <2 x i32>* %B) nounwind { 54 define <2 x i32> @vcgtu32(<2 x i32>* %A, <2 x i32>* %B) nounwind {
55 ;CHECK-LABEL: vcgtu32: 55 ;CHECK-LABEL: vcgtu32:
56 ;CHECK: vcgt.u32 56 ;CHECK: vcgt.u32
57 %tmp1 = load <2 x i32>* %A 57 %tmp1 = load <2 x i32>, <2 x i32>* %A
58 %tmp2 = load <2 x i32>* %B 58 %tmp2 = load <2 x i32>, <2 x i32>* %B
59 %tmp3 = icmp ugt <2 x i32> %tmp1, %tmp2 59 %tmp3 = icmp ugt <2 x i32> %tmp1, %tmp2
60 %tmp4 = sext <2 x i1> %tmp3 to <2 x i32> 60 %tmp4 = sext <2 x i1> %tmp3 to <2 x i32>
61 ret <2 x i32> %tmp4 61 ret <2 x i32> %tmp4
62 } 62 }
63 63
64 define <2 x i32> @vcgtf32(<2 x float>* %A, <2 x float>* %B) nounwind { 64 define <2 x i32> @vcgtf32(<2 x float>* %A, <2 x float>* %B) nounwind {
65 ;CHECK-LABEL: vcgtf32: 65 ;CHECK-LABEL: vcgtf32:
66 ;CHECK: vcgt.f32 66 ;CHECK: vcgt.f32
67 %tmp1 = load <2 x float>* %A 67 %tmp1 = load <2 x float>, <2 x float>* %A
68 %tmp2 = load <2 x float>* %B 68 %tmp2 = load <2 x float>, <2 x float>* %B
69 %tmp3 = fcmp ogt <2 x float> %tmp1, %tmp2 69 %tmp3 = fcmp ogt <2 x float> %tmp1, %tmp2
70 %tmp4 = sext <2 x i1> %tmp3 to <2 x i32> 70 %tmp4 = sext <2 x i1> %tmp3 to <2 x i32>
71 ret <2 x i32> %tmp4 71 ret <2 x i32> %tmp4
72 } 72 }
73 73
74 define <16 x i8> @vcgtQs8(<16 x i8>* %A, <16 x i8>* %B) nounwind { 74 define <16 x i8> @vcgtQs8(<16 x i8>* %A, <16 x i8>* %B) nounwind {
75 ;CHECK-LABEL: vcgtQs8: 75 ;CHECK-LABEL: vcgtQs8:
76 ;CHECK: vcgt.s8 76 ;CHECK: vcgt.s8
77 %tmp1 = load <16 x i8>* %A 77 %tmp1 = load <16 x i8>, <16 x i8>* %A
78 %tmp2 = load <16 x i8>* %B 78 %tmp2 = load <16 x i8>, <16 x i8>* %B
79 %tmp3 = icmp sgt <16 x i8> %tmp1, %tmp2 79 %tmp3 = icmp sgt <16 x i8> %tmp1, %tmp2
80 %tmp4 = sext <16 x i1> %tmp3 to <16 x i8> 80 %tmp4 = sext <16 x i1> %tmp3 to <16 x i8>
81 ret <16 x i8> %tmp4 81 ret <16 x i8> %tmp4
82 } 82 }
83 83
84 define <8 x i16> @vcgtQs16(<8 x i16>* %A, <8 x i16>* %B) nounwind { 84 define <8 x i16> @vcgtQs16(<8 x i16>* %A, <8 x i16>* %B) nounwind {
85 ;CHECK-LABEL: vcgtQs16: 85 ;CHECK-LABEL: vcgtQs16:
86 ;CHECK: vcgt.s16 86 ;CHECK: vcgt.s16
87 %tmp1 = load <8 x i16>* %A 87 %tmp1 = load <8 x i16>, <8 x i16>* %A
88 %tmp2 = load <8 x i16>* %B 88 %tmp2 = load <8 x i16>, <8 x i16>* %B
89 %tmp3 = icmp sgt <8 x i16> %tmp1, %tmp2 89 %tmp3 = icmp sgt <8 x i16> %tmp1, %tmp2
90 %tmp4 = sext <8 x i1> %tmp3 to <8 x i16> 90 %tmp4 = sext <8 x i1> %tmp3 to <8 x i16>
91 ret <8 x i16> %tmp4 91 ret <8 x i16> %tmp4
92 } 92 }
93 93
94 define <4 x i32> @vcgtQs32(<4 x i32>* %A, <4 x i32>* %B) nounwind { 94 define <4 x i32> @vcgtQs32(<4 x i32>* %A, <4 x i32>* %B) nounwind {
95 ;CHECK-LABEL: vcgtQs32: 95 ;CHECK-LABEL: vcgtQs32:
96 ;CHECK: vcgt.s32 96 ;CHECK: vcgt.s32
97 %tmp1 = load <4 x i32>* %A 97 %tmp1 = load <4 x i32>, <4 x i32>* %A
98 %tmp2 = load <4 x i32>* %B 98 %tmp2 = load <4 x i32>, <4 x i32>* %B
99 %tmp3 = icmp sgt <4 x i32> %tmp1, %tmp2 99 %tmp3 = icmp sgt <4 x i32> %tmp1, %tmp2
100 %tmp4 = sext <4 x i1> %tmp3 to <4 x i32> 100 %tmp4 = sext <4 x i1> %tmp3 to <4 x i32>
101 ret <4 x i32> %tmp4 101 ret <4 x i32> %tmp4
102 } 102 }
103 103
104 define <16 x i8> @vcgtQu8(<16 x i8>* %A, <16 x i8>* %B) nounwind { 104 define <16 x i8> @vcgtQu8(<16 x i8>* %A, <16 x i8>* %B) nounwind {
105 ;CHECK-LABEL: vcgtQu8: 105 ;CHECK-LABEL: vcgtQu8:
106 ;CHECK: vcgt.u8 106 ;CHECK: vcgt.u8
107 %tmp1 = load <16 x i8>* %A 107 %tmp1 = load <16 x i8>, <16 x i8>* %A
108 %tmp2 = load <16 x i8>* %B 108 %tmp2 = load <16 x i8>, <16 x i8>* %B
109 %tmp3 = icmp ugt <16 x i8> %tmp1, %tmp2 109 %tmp3 = icmp ugt <16 x i8> %tmp1, %tmp2
110 %tmp4 = sext <16 x i1> %tmp3 to <16 x i8> 110 %tmp4 = sext <16 x i1> %tmp3 to <16 x i8>
111 ret <16 x i8> %tmp4 111 ret <16 x i8> %tmp4
112 } 112 }
113 113
114 define <8 x i16> @vcgtQu16(<8 x i16>* %A, <8 x i16>* %B) nounwind { 114 define <8 x i16> @vcgtQu16(<8 x i16>* %A, <8 x i16>* %B) nounwind {
115 ;CHECK-LABEL: vcgtQu16: 115 ;CHECK-LABEL: vcgtQu16:
116 ;CHECK: vcgt.u16 116 ;CHECK: vcgt.u16
117 %tmp1 = load <8 x i16>* %A 117 %tmp1 = load <8 x i16>, <8 x i16>* %A
118 %tmp2 = load <8 x i16>* %B 118 %tmp2 = load <8 x i16>, <8 x i16>* %B
119 %tmp3 = icmp ugt <8 x i16> %tmp1, %tmp2 119 %tmp3 = icmp ugt <8 x i16> %tmp1, %tmp2
120 %tmp4 = sext <8 x i1> %tmp3 to <8 x i16> 120 %tmp4 = sext <8 x i1> %tmp3 to <8 x i16>
121 ret <8 x i16> %tmp4 121 ret <8 x i16> %tmp4
122 } 122 }
123 123
124 define <4 x i32> @vcgtQu32(<4 x i32>* %A, <4 x i32>* %B) nounwind { 124 define <4 x i32> @vcgtQu32(<4 x i32>* %A, <4 x i32>* %B) nounwind {
125 ;CHECK-LABEL: vcgtQu32: 125 ;CHECK-LABEL: vcgtQu32:
126 ;CHECK: vcgt.u32 126 ;CHECK: vcgt.u32
127 %tmp1 = load <4 x i32>* %A 127 %tmp1 = load <4 x i32>, <4 x i32>* %A
128 %tmp2 = load <4 x i32>* %B 128 %tmp2 = load <4 x i32>, <4 x i32>* %B
129 %tmp3 = icmp ugt <4 x i32> %tmp1, %tmp2 129 %tmp3 = icmp ugt <4 x i32> %tmp1, %tmp2
130 %tmp4 = sext <4 x i1> %tmp3 to <4 x i32> 130 %tmp4 = sext <4 x i1> %tmp3 to <4 x i32>
131 ret <4 x i32> %tmp4 131 ret <4 x i32> %tmp4
132 } 132 }
133 133
134 define <4 x i32> @vcgtQf32(<4 x float>* %A, <4 x float>* %B) nounwind { 134 define <4 x i32> @vcgtQf32(<4 x float>* %A, <4 x float>* %B) nounwind {
135 ;CHECK-LABEL: vcgtQf32: 135 ;CHECK-LABEL: vcgtQf32:
136 ;CHECK: vcgt.f32 136 ;CHECK: vcgt.f32
137 %tmp1 = load <4 x float>* %A 137 %tmp1 = load <4 x float>, <4 x float>* %A
138 %tmp2 = load <4 x float>* %B 138 %tmp2 = load <4 x float>, <4 x float>* %B
139 %tmp3 = fcmp ogt <4 x float> %tmp1, %tmp2 139 %tmp3 = fcmp ogt <4 x float> %tmp1, %tmp2
140 %tmp4 = sext <4 x i1> %tmp3 to <4 x i32> 140 %tmp4 = sext <4 x i1> %tmp3 to <4 x i32>
141 ret <4 x i32> %tmp4 141 ret <4 x i32> %tmp4
142 } 142 }
143 143
144 define <2 x i32> @vacgtf32(<2 x float>* %A, <2 x float>* %B) nounwind { 144 define <2 x i32> @vacgtf32(<2 x float>* %A, <2 x float>* %B) nounwind {
145 ;CHECK-LABEL: vacgtf32: 145 ;CHECK-LABEL: vacgtf32:
146 ;CHECK: vacgt.f32 146 ;CHECK: vacgt.f32
147 %tmp1 = load <2 x float>* %A 147 %tmp1 = load <2 x float>, <2 x float>* %A
148 %tmp2 = load <2 x float>* %B 148 %tmp2 = load <2 x float>, <2 x float>* %B
149 %tmp3 = call <2 x i32> @llvm.arm.neon.vacgt.v2i32.v2f32(<2 x float> %tmp1, <2 x float> %tmp2) 149 %tmp3 = call <2 x i32> @llvm.arm.neon.vacgt.v2i32.v2f32(<2 x float> %tmp1, <2 x float> %tmp2)
150 ret <2 x i32> %tmp3 150 ret <2 x i32> %tmp3
151 } 151 }
152 152
153 define <4 x i32> @vacgtQf32(<4 x float>* %A, <4 x float>* %B) nounwind { 153 define <4 x i32> @vacgtQf32(<4 x float>* %A, <4 x float>* %B) nounwind {
154 ;CHECK-LABEL: vacgtQf32: 154 ;CHECK-LABEL: vacgtQf32:
155 ;CHECK: vacgt.f32 155 ;CHECK: vacgt.f32
156 %tmp1 = load <4 x float>* %A 156 %tmp1 = load <4 x float>, <4 x float>* %A
157 %tmp2 = load <4 x float>* %B 157 %tmp2 = load <4 x float>, <4 x float>* %B
158 %tmp3 = call <4 x i32> @llvm.arm.neon.vacgt.v4i32.v4f32(<4 x float> %tmp1, <4 x float> %tmp2) 158 %tmp3 = call <4 x i32> @llvm.arm.neon.vacgt.v4i32.v4f32(<4 x float> %tmp1, <4 x float> %tmp2)
159 ret <4 x i32> %tmp3 159 ret <4 x i32> %tmp3
160 } 160 }
161 161
162 ; rdar://7923010 162 ; rdar://7923010
163 define <4 x i32> @vcgt_zext(<4 x float>* %A, <4 x float>* %B) nounwind { 163 define <4 x i32> @vcgt_zext(<4 x float>* %A, <4 x float>* %B) nounwind {
164 ;CHECK-LABEL: vcgt_zext: 164 ;CHECK-LABEL: vcgt_zext:
165 ;CHECK: vmov.i32 [[Q0:q[0-9]+]], #0x1 165 ;CHECK: vmov.i32 [[Q0:q[0-9]+]], #0x1
166 ;CHECK: vcgt.f32 [[Q1:q[0-9]+]] 166 ;CHECK: vcgt.f32 [[Q1:q[0-9]+]]
167 ;CHECK: vand [[Q2:q[0-9]+]], [[Q1]], [[Q0]] 167 ;CHECK: vand [[Q2:q[0-9]+]], [[Q1]], [[Q0]]
168 %tmp1 = load <4 x float>* %A 168 %tmp1 = load <4 x float>, <4 x float>* %A
169 %tmp2 = load <4 x float>* %B 169 %tmp2 = load <4 x float>, <4 x float>* %B
170 %tmp3 = fcmp ogt <4 x float> %tmp1, %tmp2 170 %tmp3 = fcmp ogt <4 x float> %tmp1, %tmp2
171 %tmp4 = zext <4 x i1> %tmp3 to <4 x i32> 171 %tmp4 = zext <4 x i1> %tmp3 to <4 x i32>
172 ret <4 x i32> %tmp4 172 ret <4 x i32> %tmp4
173 } 173 }
174 174
178 define <8 x i8> @vcgti8Z(<8 x i8>* %A) nounwind { 178 define <8 x i8> @vcgti8Z(<8 x i8>* %A) nounwind {
179 ;CHECK-LABEL: vcgti8Z: 179 ;CHECK-LABEL: vcgti8Z:
180 ;CHECK-NOT: vmov 180 ;CHECK-NOT: vmov
181 ;CHECK-NOT: vmvn 181 ;CHECK-NOT: vmvn
182 ;CHECK: vcgt.s8 182 ;CHECK: vcgt.s8
183 %tmp1 = load <8 x i8>* %A 183 %tmp1 = load <8 x i8>, <8 x i8>* %A
184 %tmp3 = icmp sgt <8 x i8> %tmp1, <i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0> 184 %tmp3 = icmp sgt <8 x i8> %tmp1, <i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0>
185 %tmp4 = sext <8 x i1> %tmp3 to <8 x i8> 185 %tmp4 = sext <8 x i1> %tmp3 to <8 x i8>
186 ret <8 x i8> %tmp4 186 ret <8 x i8> %tmp4
187 } 187 }
188 188
189 define <8 x i8> @vclti8Z(<8 x i8>* %A) nounwind { 189 define <8 x i8> @vclti8Z(<8 x i8>* %A) nounwind {
190 ;CHECK-LABEL: vclti8Z: 190 ;CHECK-LABEL: vclti8Z:
191 ;CHECK-NOT: vmov 191 ;CHECK-NOT: vmov
192 ;CHECK-NOT: vmvn 192 ;CHECK-NOT: vmvn
193 ;CHECK: vclt.s8 193 ;CHECK: vclt.s8
194 %tmp1 = load <8 x i8>* %A 194 %tmp1 = load <8 x i8>, <8 x i8>* %A
195 %tmp3 = icmp slt <8 x i8> %tmp1, <i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0> 195 %tmp3 = icmp slt <8 x i8> %tmp1, <i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0, i8 0>
196 %tmp4 = sext <8 x i1> %tmp3 to <8 x i8> 196 %tmp4 = sext <8 x i1> %tmp3 to <8 x i8>
197 ret <8 x i8> %tmp4 197 ret <8 x i8> %tmp4
198 } 198 }