annotate llvm/test/Transforms/SLPVectorizer/AMDGPU/reduction.ll @ 207:2e18cbf3894f

LLVM12
author Shinji KONO <kono@ie.u-ryukyu.ac.jp>
date Tue, 08 Jun 2021 06:07:14 +0900
parents 1d019706d866
children 1f2b6ac9f198
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
150
anatofuz
parents:
diff changeset
1 ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
anatofuz
parents:
diff changeset
2 ; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -slp-vectorizer -dce < %s | FileCheck -check-prefixes=GCN,GFX9 %s
anatofuz
parents:
diff changeset
3 ; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -mcpu=fiji -slp-vectorizer -dce < %s | FileCheck -check-prefixes=GCN,VI %s
anatofuz
parents:
diff changeset
4
anatofuz
parents:
diff changeset
5 define half @reduction_half4(<4 x half> %a) {
anatofuz
parents:
diff changeset
6 ; GFX9-LABEL: @reduction_half4(
anatofuz
parents:
diff changeset
7 ; GFX9-NEXT: entry:
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
8 ; GFX9-NEXT: [[TMP0:%.*]] = call fast half @llvm.vector.reduce.fadd.v4f16(half 0xH8000, <4 x half> [[A:%.*]])
150
anatofuz
parents:
diff changeset
9 ; GFX9-NEXT: ret half [[TMP0]]
anatofuz
parents:
diff changeset
10 ;
anatofuz
parents:
diff changeset
11 ; VI-LABEL: @reduction_half4(
anatofuz
parents:
diff changeset
12 ; VI-NEXT: entry:
anatofuz
parents:
diff changeset
13 ; VI-NEXT: [[ELT0:%.*]] = extractelement <4 x half> [[A:%.*]], i64 0
anatofuz
parents:
diff changeset
14 ; VI-NEXT: [[ELT1:%.*]] = extractelement <4 x half> [[A]], i64 1
anatofuz
parents:
diff changeset
15 ; VI-NEXT: [[ELT2:%.*]] = extractelement <4 x half> [[A]], i64 2
anatofuz
parents:
diff changeset
16 ; VI-NEXT: [[ELT3:%.*]] = extractelement <4 x half> [[A]], i64 3
anatofuz
parents:
diff changeset
17 ; VI-NEXT: [[ADD1:%.*]] = fadd fast half [[ELT1]], [[ELT0]]
anatofuz
parents:
diff changeset
18 ; VI-NEXT: [[ADD2:%.*]] = fadd fast half [[ELT2]], [[ADD1]]
anatofuz
parents:
diff changeset
19 ; VI-NEXT: [[ADD3:%.*]] = fadd fast half [[ELT3]], [[ADD2]]
anatofuz
parents:
diff changeset
20 ; VI-NEXT: ret half [[ADD3]]
anatofuz
parents:
diff changeset
21 ;
anatofuz
parents:
diff changeset
22 entry:
anatofuz
parents:
diff changeset
23 %elt0 = extractelement <4 x half> %a, i64 0
anatofuz
parents:
diff changeset
24 %elt1 = extractelement <4 x half> %a, i64 1
anatofuz
parents:
diff changeset
25 %elt2 = extractelement <4 x half> %a, i64 2
anatofuz
parents:
diff changeset
26 %elt3 = extractelement <4 x half> %a, i64 3
anatofuz
parents:
diff changeset
27
anatofuz
parents:
diff changeset
28 %add1 = fadd fast half %elt1, %elt0
anatofuz
parents:
diff changeset
29 %add2 = fadd fast half %elt2, %add1
anatofuz
parents:
diff changeset
30 %add3 = fadd fast half %elt3, %add2
anatofuz
parents:
diff changeset
31
anatofuz
parents:
diff changeset
32 ret half %add3
anatofuz
parents:
diff changeset
33 }
anatofuz
parents:
diff changeset
34
anatofuz
parents:
diff changeset
35 define half @reduction_half8(<8 x half> %vec8) {
anatofuz
parents:
diff changeset
36 ; GFX9-LABEL: @reduction_half8(
anatofuz
parents:
diff changeset
37 ; GFX9-NEXT: entry:
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
38 ; GFX9-NEXT: [[TMP0:%.*]] = call fast half @llvm.vector.reduce.fadd.v8f16(half 0xH8000, <8 x half> [[VEC8:%.*]])
150
anatofuz
parents:
diff changeset
39 ; GFX9-NEXT: ret half [[TMP0]]
anatofuz
parents:
diff changeset
40 ;
anatofuz
parents:
diff changeset
41 ; VI-LABEL: @reduction_half8(
anatofuz
parents:
diff changeset
42 ; VI-NEXT: entry:
anatofuz
parents:
diff changeset
43 ; VI-NEXT: [[ELT0:%.*]] = extractelement <8 x half> [[VEC8:%.*]], i64 0
anatofuz
parents:
diff changeset
44 ; VI-NEXT: [[ELT1:%.*]] = extractelement <8 x half> [[VEC8]], i64 1
anatofuz
parents:
diff changeset
45 ; VI-NEXT: [[ELT2:%.*]] = extractelement <8 x half> [[VEC8]], i64 2
anatofuz
parents:
diff changeset
46 ; VI-NEXT: [[ELT3:%.*]] = extractelement <8 x half> [[VEC8]], i64 3
anatofuz
parents:
diff changeset
47 ; VI-NEXT: [[ELT4:%.*]] = extractelement <8 x half> [[VEC8]], i64 4
anatofuz
parents:
diff changeset
48 ; VI-NEXT: [[ELT5:%.*]] = extractelement <8 x half> [[VEC8]], i64 5
anatofuz
parents:
diff changeset
49 ; VI-NEXT: [[ELT6:%.*]] = extractelement <8 x half> [[VEC8]], i64 6
anatofuz
parents:
diff changeset
50 ; VI-NEXT: [[ELT7:%.*]] = extractelement <8 x half> [[VEC8]], i64 7
anatofuz
parents:
diff changeset
51 ; VI-NEXT: [[ADD1:%.*]] = fadd fast half [[ELT1]], [[ELT0]]
anatofuz
parents:
diff changeset
52 ; VI-NEXT: [[ADD2:%.*]] = fadd fast half [[ELT2]], [[ADD1]]
anatofuz
parents:
diff changeset
53 ; VI-NEXT: [[ADD3:%.*]] = fadd fast half [[ELT3]], [[ADD2]]
anatofuz
parents:
diff changeset
54 ; VI-NEXT: [[ADD4:%.*]] = fadd fast half [[ELT4]], [[ADD3]]
anatofuz
parents:
diff changeset
55 ; VI-NEXT: [[ADD5:%.*]] = fadd fast half [[ELT5]], [[ADD4]]
anatofuz
parents:
diff changeset
56 ; VI-NEXT: [[ADD6:%.*]] = fadd fast half [[ELT6]], [[ADD5]]
anatofuz
parents:
diff changeset
57 ; VI-NEXT: [[ADD7:%.*]] = fadd fast half [[ELT7]], [[ADD6]]
anatofuz
parents:
diff changeset
58 ; VI-NEXT: ret half [[ADD7]]
anatofuz
parents:
diff changeset
59 ;
anatofuz
parents:
diff changeset
60 entry:
anatofuz
parents:
diff changeset
61 %elt0 = extractelement <8 x half> %vec8, i64 0
anatofuz
parents:
diff changeset
62 %elt1 = extractelement <8 x half> %vec8, i64 1
anatofuz
parents:
diff changeset
63 %elt2 = extractelement <8 x half> %vec8, i64 2
anatofuz
parents:
diff changeset
64 %elt3 = extractelement <8 x half> %vec8, i64 3
anatofuz
parents:
diff changeset
65 %elt4 = extractelement <8 x half> %vec8, i64 4
anatofuz
parents:
diff changeset
66 %elt5 = extractelement <8 x half> %vec8, i64 5
anatofuz
parents:
diff changeset
67 %elt6 = extractelement <8 x half> %vec8, i64 6
anatofuz
parents:
diff changeset
68 %elt7 = extractelement <8 x half> %vec8, i64 7
anatofuz
parents:
diff changeset
69
anatofuz
parents:
diff changeset
70 %add1 = fadd fast half %elt1, %elt0
anatofuz
parents:
diff changeset
71 %add2 = fadd fast half %elt2, %add1
anatofuz
parents:
diff changeset
72 %add3 = fadd fast half %elt3, %add2
anatofuz
parents:
diff changeset
73 %add4 = fadd fast half %elt4, %add3
anatofuz
parents:
diff changeset
74 %add5 = fadd fast half %elt5, %add4
anatofuz
parents:
diff changeset
75 %add6 = fadd fast half %elt6, %add5
anatofuz
parents:
diff changeset
76 %add7 = fadd fast half %elt7, %add6
anatofuz
parents:
diff changeset
77
anatofuz
parents:
diff changeset
78 ret half %add7
anatofuz
parents:
diff changeset
79 }
anatofuz
parents:
diff changeset
80
anatofuz
parents:
diff changeset
81 define half @reduction_half16(<16 x half> %vec16) {
anatofuz
parents:
diff changeset
82 ; GFX9-LABEL: @reduction_half16(
anatofuz
parents:
diff changeset
83 ; GFX9-NEXT: entry:
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
84 ; GFX9-NEXT: [[TMP0:%.*]] = call fast half @llvm.vector.reduce.fadd.v16f16(half 0xH8000, <16 x half> [[VEC16:%.*]])
150
anatofuz
parents:
diff changeset
85 ; GFX9-NEXT: ret half [[TMP0]]
anatofuz
parents:
diff changeset
86 ;
anatofuz
parents:
diff changeset
87 ; VI-LABEL: @reduction_half16(
anatofuz
parents:
diff changeset
88 ; VI-NEXT: entry:
anatofuz
parents:
diff changeset
89 ; VI-NEXT: [[ELT0:%.*]] = extractelement <16 x half> [[VEC16:%.*]], i64 0
anatofuz
parents:
diff changeset
90 ; VI-NEXT: [[ELT1:%.*]] = extractelement <16 x half> [[VEC16]], i64 1
anatofuz
parents:
diff changeset
91 ; VI-NEXT: [[ELT2:%.*]] = extractelement <16 x half> [[VEC16]], i64 2
anatofuz
parents:
diff changeset
92 ; VI-NEXT: [[ELT3:%.*]] = extractelement <16 x half> [[VEC16]], i64 3
anatofuz
parents:
diff changeset
93 ; VI-NEXT: [[ELT4:%.*]] = extractelement <16 x half> [[VEC16]], i64 4
anatofuz
parents:
diff changeset
94 ; VI-NEXT: [[ELT5:%.*]] = extractelement <16 x half> [[VEC16]], i64 5
anatofuz
parents:
diff changeset
95 ; VI-NEXT: [[ELT6:%.*]] = extractelement <16 x half> [[VEC16]], i64 6
anatofuz
parents:
diff changeset
96 ; VI-NEXT: [[ELT7:%.*]] = extractelement <16 x half> [[VEC16]], i64 7
anatofuz
parents:
diff changeset
97 ; VI-NEXT: [[ELT8:%.*]] = extractelement <16 x half> [[VEC16]], i64 8
anatofuz
parents:
diff changeset
98 ; VI-NEXT: [[ELT9:%.*]] = extractelement <16 x half> [[VEC16]], i64 9
anatofuz
parents:
diff changeset
99 ; VI-NEXT: [[ELT10:%.*]] = extractelement <16 x half> [[VEC16]], i64 10
anatofuz
parents:
diff changeset
100 ; VI-NEXT: [[ELT11:%.*]] = extractelement <16 x half> [[VEC16]], i64 11
anatofuz
parents:
diff changeset
101 ; VI-NEXT: [[ELT12:%.*]] = extractelement <16 x half> [[VEC16]], i64 12
anatofuz
parents:
diff changeset
102 ; VI-NEXT: [[ELT13:%.*]] = extractelement <16 x half> [[VEC16]], i64 13
anatofuz
parents:
diff changeset
103 ; VI-NEXT: [[ELT14:%.*]] = extractelement <16 x half> [[VEC16]], i64 14
anatofuz
parents:
diff changeset
104 ; VI-NEXT: [[ELT15:%.*]] = extractelement <16 x half> [[VEC16]], i64 15
anatofuz
parents:
diff changeset
105 ; VI-NEXT: [[ADD1:%.*]] = fadd fast half [[ELT1]], [[ELT0]]
anatofuz
parents:
diff changeset
106 ; VI-NEXT: [[ADD2:%.*]] = fadd fast half [[ELT2]], [[ADD1]]
anatofuz
parents:
diff changeset
107 ; VI-NEXT: [[ADD3:%.*]] = fadd fast half [[ELT3]], [[ADD2]]
anatofuz
parents:
diff changeset
108 ; VI-NEXT: [[ADD4:%.*]] = fadd fast half [[ELT4]], [[ADD3]]
anatofuz
parents:
diff changeset
109 ; VI-NEXT: [[ADD5:%.*]] = fadd fast half [[ELT5]], [[ADD4]]
anatofuz
parents:
diff changeset
110 ; VI-NEXT: [[ADD6:%.*]] = fadd fast half [[ELT6]], [[ADD5]]
anatofuz
parents:
diff changeset
111 ; VI-NEXT: [[ADD7:%.*]] = fadd fast half [[ELT7]], [[ADD6]]
anatofuz
parents:
diff changeset
112 ; VI-NEXT: [[ADD8:%.*]] = fadd fast half [[ELT8]], [[ADD7]]
anatofuz
parents:
diff changeset
113 ; VI-NEXT: [[ADD9:%.*]] = fadd fast half [[ELT9]], [[ADD8]]
anatofuz
parents:
diff changeset
114 ; VI-NEXT: [[ADD10:%.*]] = fadd fast half [[ELT10]], [[ADD9]]
anatofuz
parents:
diff changeset
115 ; VI-NEXT: [[ADD11:%.*]] = fadd fast half [[ELT11]], [[ADD10]]
anatofuz
parents:
diff changeset
116 ; VI-NEXT: [[ADD12:%.*]] = fadd fast half [[ELT12]], [[ADD11]]
anatofuz
parents:
diff changeset
117 ; VI-NEXT: [[ADD13:%.*]] = fadd fast half [[ELT13]], [[ADD12]]
anatofuz
parents:
diff changeset
118 ; VI-NEXT: [[ADD14:%.*]] = fadd fast half [[ELT14]], [[ADD13]]
anatofuz
parents:
diff changeset
119 ; VI-NEXT: [[ADD15:%.*]] = fadd fast half [[ELT15]], [[ADD14]]
anatofuz
parents:
diff changeset
120 ; VI-NEXT: ret half [[ADD15]]
anatofuz
parents:
diff changeset
121 ;
anatofuz
parents:
diff changeset
122 entry:
anatofuz
parents:
diff changeset
123 %elt0 = extractelement <16 x half> %vec16, i64 0
anatofuz
parents:
diff changeset
124 %elt1 = extractelement <16 x half> %vec16, i64 1
anatofuz
parents:
diff changeset
125 %elt2 = extractelement <16 x half> %vec16, i64 2
anatofuz
parents:
diff changeset
126 %elt3 = extractelement <16 x half> %vec16, i64 3
anatofuz
parents:
diff changeset
127 %elt4 = extractelement <16 x half> %vec16, i64 4
anatofuz
parents:
diff changeset
128 %elt5 = extractelement <16 x half> %vec16, i64 5
anatofuz
parents:
diff changeset
129 %elt6 = extractelement <16 x half> %vec16, i64 6
anatofuz
parents:
diff changeset
130 %elt7 = extractelement <16 x half> %vec16, i64 7
anatofuz
parents:
diff changeset
131 %elt8 = extractelement <16 x half> %vec16, i64 8
anatofuz
parents:
diff changeset
132 %elt9 = extractelement <16 x half> %vec16, i64 9
anatofuz
parents:
diff changeset
133 %elt10 = extractelement <16 x half> %vec16, i64 10
anatofuz
parents:
diff changeset
134 %elt11 = extractelement <16 x half> %vec16, i64 11
anatofuz
parents:
diff changeset
135 %elt12 = extractelement <16 x half> %vec16, i64 12
anatofuz
parents:
diff changeset
136 %elt13 = extractelement <16 x half> %vec16, i64 13
anatofuz
parents:
diff changeset
137 %elt14 = extractelement <16 x half> %vec16, i64 14
anatofuz
parents:
diff changeset
138 %elt15 = extractelement <16 x half> %vec16, i64 15
anatofuz
parents:
diff changeset
139
anatofuz
parents:
diff changeset
140 %add1 = fadd fast half %elt1, %elt0
anatofuz
parents:
diff changeset
141 %add2 = fadd fast half %elt2, %add1
anatofuz
parents:
diff changeset
142 %add3 = fadd fast half %elt3, %add2
anatofuz
parents:
diff changeset
143 %add4 = fadd fast half %elt4, %add3
anatofuz
parents:
diff changeset
144 %add5 = fadd fast half %elt5, %add4
anatofuz
parents:
diff changeset
145 %add6 = fadd fast half %elt6, %add5
anatofuz
parents:
diff changeset
146 %add7 = fadd fast half %elt7, %add6
anatofuz
parents:
diff changeset
147 %add8 = fadd fast half %elt8, %add7
anatofuz
parents:
diff changeset
148 %add9 = fadd fast half %elt9, %add8
anatofuz
parents:
diff changeset
149 %add10 = fadd fast half %elt10, %add9
anatofuz
parents:
diff changeset
150 %add11 = fadd fast half %elt11, %add10
anatofuz
parents:
diff changeset
151 %add12 = fadd fast half %elt12, %add11
anatofuz
parents:
diff changeset
152 %add13 = fadd fast half %elt13, %add12
anatofuz
parents:
diff changeset
153 %add14 = fadd fast half %elt14, %add13
anatofuz
parents:
diff changeset
154 %add15 = fadd fast half %elt15, %add14
anatofuz
parents:
diff changeset
155
anatofuz
parents:
diff changeset
156 ret half %add15
anatofuz
parents:
diff changeset
157 }
anatofuz
parents:
diff changeset
158
anatofuz
parents:
diff changeset
159 ; FIXME: support vectorization;
anatofuz
parents:
diff changeset
160 define half @reduction_sub_half4(<4 x half> %a) {
anatofuz
parents:
diff changeset
161 ; GCN-LABEL: @reduction_sub_half4(
anatofuz
parents:
diff changeset
162 ; GCN-NEXT: entry:
anatofuz
parents:
diff changeset
163 ; GCN-NEXT: [[ELT0:%.*]] = extractelement <4 x half> [[A:%.*]], i64 0
anatofuz
parents:
diff changeset
164 ; GCN-NEXT: [[ELT1:%.*]] = extractelement <4 x half> [[A]], i64 1
anatofuz
parents:
diff changeset
165 ; GCN-NEXT: [[ELT2:%.*]] = extractelement <4 x half> [[A]], i64 2
anatofuz
parents:
diff changeset
166 ; GCN-NEXT: [[ELT3:%.*]] = extractelement <4 x half> [[A]], i64 3
anatofuz
parents:
diff changeset
167 ; GCN-NEXT: [[ADD1:%.*]] = fsub fast half [[ELT1]], [[ELT0]]
anatofuz
parents:
diff changeset
168 ; GCN-NEXT: [[ADD2:%.*]] = fsub fast half [[ELT2]], [[ADD1]]
anatofuz
parents:
diff changeset
169 ; GCN-NEXT: [[ADD3:%.*]] = fsub fast half [[ELT3]], [[ADD2]]
anatofuz
parents:
diff changeset
170 ; GCN-NEXT: ret half [[ADD3]]
anatofuz
parents:
diff changeset
171 ;
anatofuz
parents:
diff changeset
172 entry:
anatofuz
parents:
diff changeset
173 %elt0 = extractelement <4 x half> %a, i64 0
anatofuz
parents:
diff changeset
174 %elt1 = extractelement <4 x half> %a, i64 1
anatofuz
parents:
diff changeset
175 %elt2 = extractelement <4 x half> %a, i64 2
anatofuz
parents:
diff changeset
176 %elt3 = extractelement <4 x half> %a, i64 3
anatofuz
parents:
diff changeset
177
anatofuz
parents:
diff changeset
178 %add1 = fsub fast half %elt1, %elt0
anatofuz
parents:
diff changeset
179 %add2 = fsub fast half %elt2, %add1
anatofuz
parents:
diff changeset
180 %add3 = fsub fast half %elt3, %add2
anatofuz
parents:
diff changeset
181
anatofuz
parents:
diff changeset
182 ret half %add3
anatofuz
parents:
diff changeset
183 }
anatofuz
parents:
diff changeset
184
anatofuz
parents:
diff changeset
185 define i16 @reduction_v4i16(<4 x i16> %a) {
anatofuz
parents:
diff changeset
186 ; GFX9-LABEL: @reduction_v4i16(
anatofuz
parents:
diff changeset
187 ; GFX9-NEXT: entry:
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
188 ; GFX9-NEXT: [[TMP0:%.*]] = call i16 @llvm.vector.reduce.add.v4i16(<4 x i16> [[A:%.*]])
150
anatofuz
parents:
diff changeset
189 ; GFX9-NEXT: ret i16 [[TMP0]]
anatofuz
parents:
diff changeset
190 ;
anatofuz
parents:
diff changeset
191 ; VI-LABEL: @reduction_v4i16(
anatofuz
parents:
diff changeset
192 ; VI-NEXT: entry:
anatofuz
parents:
diff changeset
193 ; VI-NEXT: [[ELT0:%.*]] = extractelement <4 x i16> [[A:%.*]], i64 0
anatofuz
parents:
diff changeset
194 ; VI-NEXT: [[ELT1:%.*]] = extractelement <4 x i16> [[A]], i64 1
anatofuz
parents:
diff changeset
195 ; VI-NEXT: [[ELT2:%.*]] = extractelement <4 x i16> [[A]], i64 2
anatofuz
parents:
diff changeset
196 ; VI-NEXT: [[ELT3:%.*]] = extractelement <4 x i16> [[A]], i64 3
anatofuz
parents:
diff changeset
197 ; VI-NEXT: [[ADD1:%.*]] = add i16 [[ELT1]], [[ELT0]]
anatofuz
parents:
diff changeset
198 ; VI-NEXT: [[ADD2:%.*]] = add i16 [[ELT2]], [[ADD1]]
anatofuz
parents:
diff changeset
199 ; VI-NEXT: [[ADD3:%.*]] = add i16 [[ELT3]], [[ADD2]]
anatofuz
parents:
diff changeset
200 ; VI-NEXT: ret i16 [[ADD3]]
anatofuz
parents:
diff changeset
201 ;
anatofuz
parents:
diff changeset
202 entry:
anatofuz
parents:
diff changeset
203 %elt0 = extractelement <4 x i16> %a, i64 0
anatofuz
parents:
diff changeset
204 %elt1 = extractelement <4 x i16> %a, i64 1
anatofuz
parents:
diff changeset
205 %elt2 = extractelement <4 x i16> %a, i64 2
anatofuz
parents:
diff changeset
206 %elt3 = extractelement <4 x i16> %a, i64 3
anatofuz
parents:
diff changeset
207
anatofuz
parents:
diff changeset
208 %add1 = add i16 %elt1, %elt0
anatofuz
parents:
diff changeset
209 %add2 = add i16 %elt2, %add1
anatofuz
parents:
diff changeset
210 %add3 = add i16 %elt3, %add2
anatofuz
parents:
diff changeset
211
anatofuz
parents:
diff changeset
212 ret i16 %add3
anatofuz
parents:
diff changeset
213 }
anatofuz
parents:
diff changeset
214
anatofuz
parents:
diff changeset
215 define i16 @reduction_v8i16(<8 x i16> %vec8) {
anatofuz
parents:
diff changeset
216 ; GFX9-LABEL: @reduction_v8i16(
anatofuz
parents:
diff changeset
217 ; GFX9-NEXT: entry:
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
218 ; GFX9-NEXT: [[TMP0:%.*]] = call i16 @llvm.vector.reduce.add.v8i16(<8 x i16> [[VEC8:%.*]])
150
anatofuz
parents:
diff changeset
219 ; GFX9-NEXT: ret i16 [[TMP0]]
anatofuz
parents:
diff changeset
220 ;
anatofuz
parents:
diff changeset
221 ; VI-LABEL: @reduction_v8i16(
anatofuz
parents:
diff changeset
222 ; VI-NEXT: entry:
anatofuz
parents:
diff changeset
223 ; VI-NEXT: [[ELT0:%.*]] = extractelement <8 x i16> [[VEC8:%.*]], i64 0
anatofuz
parents:
diff changeset
224 ; VI-NEXT: [[ELT1:%.*]] = extractelement <8 x i16> [[VEC8]], i64 1
anatofuz
parents:
diff changeset
225 ; VI-NEXT: [[ELT2:%.*]] = extractelement <8 x i16> [[VEC8]], i64 2
anatofuz
parents:
diff changeset
226 ; VI-NEXT: [[ELT3:%.*]] = extractelement <8 x i16> [[VEC8]], i64 3
anatofuz
parents:
diff changeset
227 ; VI-NEXT: [[ELT4:%.*]] = extractelement <8 x i16> [[VEC8]], i64 4
anatofuz
parents:
diff changeset
228 ; VI-NEXT: [[ELT5:%.*]] = extractelement <8 x i16> [[VEC8]], i64 5
anatofuz
parents:
diff changeset
229 ; VI-NEXT: [[ELT6:%.*]] = extractelement <8 x i16> [[VEC8]], i64 6
anatofuz
parents:
diff changeset
230 ; VI-NEXT: [[ELT7:%.*]] = extractelement <8 x i16> [[VEC8]], i64 7
anatofuz
parents:
diff changeset
231 ; VI-NEXT: [[ADD1:%.*]] = add i16 [[ELT1]], [[ELT0]]
anatofuz
parents:
diff changeset
232 ; VI-NEXT: [[ADD2:%.*]] = add i16 [[ELT2]], [[ADD1]]
anatofuz
parents:
diff changeset
233 ; VI-NEXT: [[ADD3:%.*]] = add i16 [[ELT3]], [[ADD2]]
anatofuz
parents:
diff changeset
234 ; VI-NEXT: [[ADD4:%.*]] = add i16 [[ELT4]], [[ADD3]]
anatofuz
parents:
diff changeset
235 ; VI-NEXT: [[ADD5:%.*]] = add i16 [[ELT5]], [[ADD4]]
anatofuz
parents:
diff changeset
236 ; VI-NEXT: [[ADD6:%.*]] = add i16 [[ELT6]], [[ADD5]]
anatofuz
parents:
diff changeset
237 ; VI-NEXT: [[ADD7:%.*]] = add i16 [[ELT7]], [[ADD6]]
anatofuz
parents:
diff changeset
238 ; VI-NEXT: ret i16 [[ADD7]]
anatofuz
parents:
diff changeset
239 ;
anatofuz
parents:
diff changeset
240 entry:
anatofuz
parents:
diff changeset
241 %elt0 = extractelement <8 x i16> %vec8, i64 0
anatofuz
parents:
diff changeset
242 %elt1 = extractelement <8 x i16> %vec8, i64 1
anatofuz
parents:
diff changeset
243 %elt2 = extractelement <8 x i16> %vec8, i64 2
anatofuz
parents:
diff changeset
244 %elt3 = extractelement <8 x i16> %vec8, i64 3
anatofuz
parents:
diff changeset
245 %elt4 = extractelement <8 x i16> %vec8, i64 4
anatofuz
parents:
diff changeset
246 %elt5 = extractelement <8 x i16> %vec8, i64 5
anatofuz
parents:
diff changeset
247 %elt6 = extractelement <8 x i16> %vec8, i64 6
anatofuz
parents:
diff changeset
248 %elt7 = extractelement <8 x i16> %vec8, i64 7
anatofuz
parents:
diff changeset
249
anatofuz
parents:
diff changeset
250 %add1 = add i16 %elt1, %elt0
anatofuz
parents:
diff changeset
251 %add2 = add i16 %elt2, %add1
anatofuz
parents:
diff changeset
252 %add3 = add i16 %elt3, %add2
anatofuz
parents:
diff changeset
253 %add4 = add i16 %elt4, %add3
anatofuz
parents:
diff changeset
254 %add5 = add i16 %elt5, %add4
anatofuz
parents:
diff changeset
255 %add6 = add i16 %elt6, %add5
anatofuz
parents:
diff changeset
256 %add7 = add i16 %elt7, %add6
anatofuz
parents:
diff changeset
257
anatofuz
parents:
diff changeset
258 ret i16 %add7
anatofuz
parents:
diff changeset
259 }
anatofuz
parents:
diff changeset
260
anatofuz
parents:
diff changeset
261 define i16 @reduction_umin_v4i16(<4 x i16> %vec4) {
anatofuz
parents:
diff changeset
262 ; GFX9-LABEL: @reduction_umin_v4i16(
anatofuz
parents:
diff changeset
263 ; GFX9-NEXT: entry:
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
264 ; GFX9-NEXT: [[TMP0:%.*]] = call i16 @llvm.vector.reduce.umin.v4i16(<4 x i16> [[VEC4:%.*]])
150
anatofuz
parents:
diff changeset
265 ; GFX9-NEXT: ret i16 [[TMP0]]
anatofuz
parents:
diff changeset
266 ;
anatofuz
parents:
diff changeset
267 ; VI-LABEL: @reduction_umin_v4i16(
anatofuz
parents:
diff changeset
268 ; VI-NEXT: entry:
anatofuz
parents:
diff changeset
269 ; VI-NEXT: [[ELT0:%.*]] = extractelement <4 x i16> [[VEC4:%.*]], i64 0
anatofuz
parents:
diff changeset
270 ; VI-NEXT: [[ELT1:%.*]] = extractelement <4 x i16> [[VEC4]], i64 1
anatofuz
parents:
diff changeset
271 ; VI-NEXT: [[ELT2:%.*]] = extractelement <4 x i16> [[VEC4]], i64 2
anatofuz
parents:
diff changeset
272 ; VI-NEXT: [[ELT3:%.*]] = extractelement <4 x i16> [[VEC4]], i64 3
anatofuz
parents:
diff changeset
273 ; VI-NEXT: [[CMP1:%.*]] = icmp ult i16 [[ELT1]], [[ELT0]]
anatofuz
parents:
diff changeset
274 ; VI-NEXT: [[MIN1:%.*]] = select i1 [[CMP1]], i16 [[ELT1]], i16 [[ELT0]]
anatofuz
parents:
diff changeset
275 ; VI-NEXT: [[CMP2:%.*]] = icmp ult i16 [[ELT2]], [[MIN1]]
anatofuz
parents:
diff changeset
276 ; VI-NEXT: [[MIN2:%.*]] = select i1 [[CMP2]], i16 [[ELT2]], i16 [[MIN1]]
anatofuz
parents:
diff changeset
277 ; VI-NEXT: [[CMP3:%.*]] = icmp ult i16 [[ELT3]], [[MIN2]]
anatofuz
parents:
diff changeset
278 ; VI-NEXT: [[MIN3:%.*]] = select i1 [[CMP3]], i16 [[ELT3]], i16 [[MIN2]]
anatofuz
parents:
diff changeset
279 ; VI-NEXT: ret i16 [[MIN3]]
anatofuz
parents:
diff changeset
280 ;
anatofuz
parents:
diff changeset
281 entry:
anatofuz
parents:
diff changeset
282 %elt0 = extractelement <4 x i16> %vec4, i64 0
anatofuz
parents:
diff changeset
283 %elt1 = extractelement <4 x i16> %vec4, i64 1
anatofuz
parents:
diff changeset
284 %elt2 = extractelement <4 x i16> %vec4, i64 2
anatofuz
parents:
diff changeset
285 %elt3 = extractelement <4 x i16> %vec4, i64 3
anatofuz
parents:
diff changeset
286
anatofuz
parents:
diff changeset
287 %cmp1 = icmp ult i16 %elt1, %elt0
anatofuz
parents:
diff changeset
288 %min1 = select i1 %cmp1, i16 %elt1, i16 %elt0
anatofuz
parents:
diff changeset
289 %cmp2 = icmp ult i16 %elt2, %min1
anatofuz
parents:
diff changeset
290 %min2 = select i1 %cmp2, i16 %elt2, i16 %min1
anatofuz
parents:
diff changeset
291 %cmp3 = icmp ult i16 %elt3, %min2
anatofuz
parents:
diff changeset
292 %min3 = select i1 %cmp3, i16 %elt3, i16 %min2
anatofuz
parents:
diff changeset
293
anatofuz
parents:
diff changeset
294 ret i16 %min3
anatofuz
parents:
diff changeset
295 }
anatofuz
parents:
diff changeset
296
anatofuz
parents:
diff changeset
297 define i16 @reduction_icmp_v8i16(<8 x i16> %vec8) {
anatofuz
parents:
diff changeset
298 ; GFX9-LABEL: @reduction_icmp_v8i16(
anatofuz
parents:
diff changeset
299 ; GFX9-NEXT: entry:
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
300 ; GFX9-NEXT: [[TMP0:%.*]] = call i16 @llvm.vector.reduce.umin.v8i16(<8 x i16> [[VEC8:%.*]])
150
anatofuz
parents:
diff changeset
301 ; GFX9-NEXT: ret i16 [[TMP0]]
anatofuz
parents:
diff changeset
302 ;
anatofuz
parents:
diff changeset
303 ; VI-LABEL: @reduction_icmp_v8i16(
anatofuz
parents:
diff changeset
304 ; VI-NEXT: entry:
anatofuz
parents:
diff changeset
305 ; VI-NEXT: [[ELT0:%.*]] = extractelement <8 x i16> [[VEC8:%.*]], i64 0
anatofuz
parents:
diff changeset
306 ; VI-NEXT: [[ELT1:%.*]] = extractelement <8 x i16> [[VEC8]], i64 1
anatofuz
parents:
diff changeset
307 ; VI-NEXT: [[ELT2:%.*]] = extractelement <8 x i16> [[VEC8]], i64 2
anatofuz
parents:
diff changeset
308 ; VI-NEXT: [[ELT3:%.*]] = extractelement <8 x i16> [[VEC8]], i64 3
anatofuz
parents:
diff changeset
309 ; VI-NEXT: [[ELT4:%.*]] = extractelement <8 x i16> [[VEC8]], i64 4
anatofuz
parents:
diff changeset
310 ; VI-NEXT: [[ELT5:%.*]] = extractelement <8 x i16> [[VEC8]], i64 5
anatofuz
parents:
diff changeset
311 ; VI-NEXT: [[ELT6:%.*]] = extractelement <8 x i16> [[VEC8]], i64 6
anatofuz
parents:
diff changeset
312 ; VI-NEXT: [[ELT7:%.*]] = extractelement <8 x i16> [[VEC8]], i64 7
anatofuz
parents:
diff changeset
313 ; VI-NEXT: [[CMP0:%.*]] = icmp ult i16 [[ELT1]], [[ELT0]]
anatofuz
parents:
diff changeset
314 ; VI-NEXT: [[MIN1:%.*]] = select i1 [[CMP0]], i16 [[ELT1]], i16 [[ELT0]]
anatofuz
parents:
diff changeset
315 ; VI-NEXT: [[CMP1:%.*]] = icmp ult i16 [[ELT2]], [[MIN1]]
anatofuz
parents:
diff changeset
316 ; VI-NEXT: [[MIN2:%.*]] = select i1 [[CMP1]], i16 [[ELT2]], i16 [[MIN1]]
anatofuz
parents:
diff changeset
317 ; VI-NEXT: [[CMP2:%.*]] = icmp ult i16 [[ELT3]], [[MIN2]]
anatofuz
parents:
diff changeset
318 ; VI-NEXT: [[MIN3:%.*]] = select i1 [[CMP2]], i16 [[ELT3]], i16 [[MIN2]]
anatofuz
parents:
diff changeset
319 ; VI-NEXT: [[CMP3:%.*]] = icmp ult i16 [[ELT4]], [[MIN3]]
anatofuz
parents:
diff changeset
320 ; VI-NEXT: [[MIN4:%.*]] = select i1 [[CMP3]], i16 [[ELT4]], i16 [[MIN3]]
anatofuz
parents:
diff changeset
321 ; VI-NEXT: [[CMP4:%.*]] = icmp ult i16 [[ELT5]], [[MIN4]]
anatofuz
parents:
diff changeset
322 ; VI-NEXT: [[MIN5:%.*]] = select i1 [[CMP4]], i16 [[ELT5]], i16 [[MIN4]]
anatofuz
parents:
diff changeset
323 ; VI-NEXT: [[CMP5:%.*]] = icmp ult i16 [[ELT6]], [[MIN5]]
anatofuz
parents:
diff changeset
324 ; VI-NEXT: [[MIN6:%.*]] = select i1 [[CMP5]], i16 [[ELT6]], i16 [[MIN5]]
anatofuz
parents:
diff changeset
325 ; VI-NEXT: [[CMP6:%.*]] = icmp ult i16 [[ELT7]], [[MIN6]]
anatofuz
parents:
diff changeset
326 ; VI-NEXT: [[MIN7:%.*]] = select i1 [[CMP6]], i16 [[ELT7]], i16 [[MIN6]]
anatofuz
parents:
diff changeset
327 ; VI-NEXT: ret i16 [[MIN7]]
anatofuz
parents:
diff changeset
328 ;
anatofuz
parents:
diff changeset
329 entry:
anatofuz
parents:
diff changeset
330 %elt0 = extractelement <8 x i16> %vec8, i64 0
anatofuz
parents:
diff changeset
331 %elt1 = extractelement <8 x i16> %vec8, i64 1
anatofuz
parents:
diff changeset
332 %elt2 = extractelement <8 x i16> %vec8, i64 2
anatofuz
parents:
diff changeset
333 %elt3 = extractelement <8 x i16> %vec8, i64 3
anatofuz
parents:
diff changeset
334 %elt4 = extractelement <8 x i16> %vec8, i64 4
anatofuz
parents:
diff changeset
335 %elt5 = extractelement <8 x i16> %vec8, i64 5
anatofuz
parents:
diff changeset
336 %elt6 = extractelement <8 x i16> %vec8, i64 6
anatofuz
parents:
diff changeset
337 %elt7 = extractelement <8 x i16> %vec8, i64 7
anatofuz
parents:
diff changeset
338
anatofuz
parents:
diff changeset
339 %cmp0 = icmp ult i16 %elt1, %elt0
anatofuz
parents:
diff changeset
340 %min1 = select i1 %cmp0, i16 %elt1, i16 %elt0
anatofuz
parents:
diff changeset
341 %cmp1 = icmp ult i16 %elt2, %min1
anatofuz
parents:
diff changeset
342 %min2 = select i1 %cmp1, i16 %elt2, i16 %min1
anatofuz
parents:
diff changeset
343 %cmp2 = icmp ult i16 %elt3, %min2
anatofuz
parents:
diff changeset
344 %min3 = select i1 %cmp2, i16 %elt3, i16 %min2
anatofuz
parents:
diff changeset
345
anatofuz
parents:
diff changeset
346 %cmp3 = icmp ult i16 %elt4, %min3
anatofuz
parents:
diff changeset
347 %min4 = select i1 %cmp3, i16 %elt4, i16 %min3
anatofuz
parents:
diff changeset
348 %cmp4 = icmp ult i16 %elt5, %min4
anatofuz
parents:
diff changeset
349 %min5 = select i1 %cmp4, i16 %elt5, i16 %min4
anatofuz
parents:
diff changeset
350
anatofuz
parents:
diff changeset
351 %cmp5 = icmp ult i16 %elt6, %min5
anatofuz
parents:
diff changeset
352 %min6 = select i1 %cmp5, i16 %elt6, i16 %min5
anatofuz
parents:
diff changeset
353 %cmp6 = icmp ult i16 %elt7, %min6
anatofuz
parents:
diff changeset
354 %min7 = select i1 %cmp6, i16 %elt7, i16 %min6
anatofuz
parents:
diff changeset
355
anatofuz
parents:
diff changeset
356 ret i16 %min7
anatofuz
parents:
diff changeset
357 }
anatofuz
parents:
diff changeset
358
anatofuz
parents:
diff changeset
359 define i16 @reduction_smin_v16i16(<16 x i16> %vec16) {
anatofuz
parents:
diff changeset
360 ; GFX9-LABEL: @reduction_smin_v16i16(
anatofuz
parents:
diff changeset
361 ; GFX9-NEXT: entry:
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
362 ; GFX9-NEXT: [[TMP0:%.*]] = call i16 @llvm.vector.reduce.smin.v16i16(<16 x i16> [[VEC16:%.*]])
150
anatofuz
parents:
diff changeset
363 ; GFX9-NEXT: ret i16 [[TMP0]]
anatofuz
parents:
diff changeset
364 ;
anatofuz
parents:
diff changeset
365 ; VI-LABEL: @reduction_smin_v16i16(
anatofuz
parents:
diff changeset
366 ; VI-NEXT: entry:
anatofuz
parents:
diff changeset
367 ; VI-NEXT: [[ELT0:%.*]] = extractelement <16 x i16> [[VEC16:%.*]], i64 0
anatofuz
parents:
diff changeset
368 ; VI-NEXT: [[ELT1:%.*]] = extractelement <16 x i16> [[VEC16]], i64 1
anatofuz
parents:
diff changeset
369 ; VI-NEXT: [[ELT2:%.*]] = extractelement <16 x i16> [[VEC16]], i64 2
anatofuz
parents:
diff changeset
370 ; VI-NEXT: [[ELT3:%.*]] = extractelement <16 x i16> [[VEC16]], i64 3
anatofuz
parents:
diff changeset
371 ; VI-NEXT: [[ELT4:%.*]] = extractelement <16 x i16> [[VEC16]], i64 4
anatofuz
parents:
diff changeset
372 ; VI-NEXT: [[ELT5:%.*]] = extractelement <16 x i16> [[VEC16]], i64 5
anatofuz
parents:
diff changeset
373 ; VI-NEXT: [[ELT6:%.*]] = extractelement <16 x i16> [[VEC16]], i64 6
anatofuz
parents:
diff changeset
374 ; VI-NEXT: [[ELT7:%.*]] = extractelement <16 x i16> [[VEC16]], i64 7
anatofuz
parents:
diff changeset
375 ; VI-NEXT: [[ELT8:%.*]] = extractelement <16 x i16> [[VEC16]], i64 8
anatofuz
parents:
diff changeset
376 ; VI-NEXT: [[ELT9:%.*]] = extractelement <16 x i16> [[VEC16]], i64 9
anatofuz
parents:
diff changeset
377 ; VI-NEXT: [[ELT10:%.*]] = extractelement <16 x i16> [[VEC16]], i64 10
anatofuz
parents:
diff changeset
378 ; VI-NEXT: [[ELT11:%.*]] = extractelement <16 x i16> [[VEC16]], i64 11
anatofuz
parents:
diff changeset
379 ; VI-NEXT: [[ELT12:%.*]] = extractelement <16 x i16> [[VEC16]], i64 12
anatofuz
parents:
diff changeset
380 ; VI-NEXT: [[ELT13:%.*]] = extractelement <16 x i16> [[VEC16]], i64 13
anatofuz
parents:
diff changeset
381 ; VI-NEXT: [[ELT14:%.*]] = extractelement <16 x i16> [[VEC16]], i64 14
anatofuz
parents:
diff changeset
382 ; VI-NEXT: [[ELT15:%.*]] = extractelement <16 x i16> [[VEC16]], i64 15
anatofuz
parents:
diff changeset
383 ; VI-NEXT: [[CMP0:%.*]] = icmp slt i16 [[ELT1]], [[ELT0]]
anatofuz
parents:
diff changeset
384 ; VI-NEXT: [[MIN1:%.*]] = select i1 [[CMP0]], i16 [[ELT1]], i16 [[ELT0]]
anatofuz
parents:
diff changeset
385 ; VI-NEXT: [[CMP1:%.*]] = icmp slt i16 [[ELT2]], [[MIN1]]
anatofuz
parents:
diff changeset
386 ; VI-NEXT: [[MIN2:%.*]] = select i1 [[CMP1]], i16 [[ELT2]], i16 [[MIN1]]
anatofuz
parents:
diff changeset
387 ; VI-NEXT: [[CMP2:%.*]] = icmp slt i16 [[ELT3]], [[MIN2]]
anatofuz
parents:
diff changeset
388 ; VI-NEXT: [[MIN3:%.*]] = select i1 [[CMP2]], i16 [[ELT3]], i16 [[MIN2]]
anatofuz
parents:
diff changeset
389 ; VI-NEXT: [[CMP3:%.*]] = icmp slt i16 [[ELT4]], [[MIN3]]
anatofuz
parents:
diff changeset
390 ; VI-NEXT: [[MIN4:%.*]] = select i1 [[CMP3]], i16 [[ELT4]], i16 [[MIN3]]
anatofuz
parents:
diff changeset
391 ; VI-NEXT: [[CMP4:%.*]] = icmp slt i16 [[ELT5]], [[MIN4]]
anatofuz
parents:
diff changeset
392 ; VI-NEXT: [[MIN5:%.*]] = select i1 [[CMP4]], i16 [[ELT5]], i16 [[MIN4]]
anatofuz
parents:
diff changeset
393 ; VI-NEXT: [[CMP5:%.*]] = icmp slt i16 [[ELT6]], [[MIN5]]
anatofuz
parents:
diff changeset
394 ; VI-NEXT: [[MIN6:%.*]] = select i1 [[CMP5]], i16 [[ELT6]], i16 [[MIN5]]
anatofuz
parents:
diff changeset
395 ; VI-NEXT: [[CMP6:%.*]] = icmp slt i16 [[ELT7]], [[MIN6]]
anatofuz
parents:
diff changeset
396 ; VI-NEXT: [[MIN7:%.*]] = select i1 [[CMP6]], i16 [[ELT7]], i16 [[MIN6]]
anatofuz
parents:
diff changeset
397 ; VI-NEXT: [[CMP7:%.*]] = icmp slt i16 [[ELT8]], [[MIN7]]
anatofuz
parents:
diff changeset
398 ; VI-NEXT: [[MIN8:%.*]] = select i1 [[CMP7]], i16 [[ELT8]], i16 [[MIN7]]
anatofuz
parents:
diff changeset
399 ; VI-NEXT: [[CMP8:%.*]] = icmp slt i16 [[ELT9]], [[MIN8]]
anatofuz
parents:
diff changeset
400 ; VI-NEXT: [[MIN9:%.*]] = select i1 [[CMP8]], i16 [[ELT9]], i16 [[MIN8]]
anatofuz
parents:
diff changeset
401 ; VI-NEXT: [[CMP9:%.*]] = icmp slt i16 [[ELT10]], [[MIN9]]
anatofuz
parents:
diff changeset
402 ; VI-NEXT: [[MIN10:%.*]] = select i1 [[CMP9]], i16 [[ELT10]], i16 [[MIN9]]
anatofuz
parents:
diff changeset
403 ; VI-NEXT: [[CMP10:%.*]] = icmp slt i16 [[ELT11]], [[MIN10]]
anatofuz
parents:
diff changeset
404 ; VI-NEXT: [[MIN11:%.*]] = select i1 [[CMP10]], i16 [[ELT11]], i16 [[MIN10]]
anatofuz
parents:
diff changeset
405 ; VI-NEXT: [[CMP11:%.*]] = icmp slt i16 [[ELT12]], [[MIN11]]
anatofuz
parents:
diff changeset
406 ; VI-NEXT: [[MIN12:%.*]] = select i1 [[CMP11]], i16 [[ELT12]], i16 [[MIN11]]
anatofuz
parents:
diff changeset
407 ; VI-NEXT: [[CMP12:%.*]] = icmp slt i16 [[ELT13]], [[MIN12]]
anatofuz
parents:
diff changeset
408 ; VI-NEXT: [[MIN13:%.*]] = select i1 [[CMP12]], i16 [[ELT13]], i16 [[MIN12]]
anatofuz
parents:
diff changeset
409 ; VI-NEXT: [[CMP13:%.*]] = icmp slt i16 [[ELT14]], [[MIN13]]
anatofuz
parents:
diff changeset
410 ; VI-NEXT: [[MIN14:%.*]] = select i1 [[CMP13]], i16 [[ELT14]], i16 [[MIN13]]
anatofuz
parents:
diff changeset
411 ; VI-NEXT: [[CMP14:%.*]] = icmp slt i16 [[ELT15]], [[MIN14]]
anatofuz
parents:
diff changeset
412 ; VI-NEXT: [[MIN15:%.*]] = select i1 [[CMP14]], i16 [[ELT15]], i16 [[MIN14]]
anatofuz
parents:
diff changeset
413 ; VI-NEXT: ret i16 [[MIN15]]
anatofuz
parents:
diff changeset
414 ;
anatofuz
parents:
diff changeset
415 entry:
anatofuz
parents:
diff changeset
416 %elt0 = extractelement <16 x i16> %vec16, i64 0
anatofuz
parents:
diff changeset
417 %elt1 = extractelement <16 x i16> %vec16, i64 1
anatofuz
parents:
diff changeset
418 %elt2 = extractelement <16 x i16> %vec16, i64 2
anatofuz
parents:
diff changeset
419 %elt3 = extractelement <16 x i16> %vec16, i64 3
anatofuz
parents:
diff changeset
420 %elt4 = extractelement <16 x i16> %vec16, i64 4
anatofuz
parents:
diff changeset
421 %elt5 = extractelement <16 x i16> %vec16, i64 5
anatofuz
parents:
diff changeset
422 %elt6 = extractelement <16 x i16> %vec16, i64 6
anatofuz
parents:
diff changeset
423 %elt7 = extractelement <16 x i16> %vec16, i64 7
anatofuz
parents:
diff changeset
424
anatofuz
parents:
diff changeset
425 %elt8 = extractelement <16 x i16> %vec16, i64 8
anatofuz
parents:
diff changeset
426 %elt9 = extractelement <16 x i16> %vec16, i64 9
anatofuz
parents:
diff changeset
427 %elt10 = extractelement <16 x i16> %vec16, i64 10
anatofuz
parents:
diff changeset
428 %elt11 = extractelement <16 x i16> %vec16, i64 11
anatofuz
parents:
diff changeset
429 %elt12 = extractelement <16 x i16> %vec16, i64 12
anatofuz
parents:
diff changeset
430 %elt13 = extractelement <16 x i16> %vec16, i64 13
anatofuz
parents:
diff changeset
431 %elt14 = extractelement <16 x i16> %vec16, i64 14
anatofuz
parents:
diff changeset
432 %elt15 = extractelement <16 x i16> %vec16, i64 15
anatofuz
parents:
diff changeset
433
anatofuz
parents:
diff changeset
434 %cmp0 = icmp slt i16 %elt1, %elt0
anatofuz
parents:
diff changeset
435 %min1 = select i1 %cmp0, i16 %elt1, i16 %elt0
anatofuz
parents:
diff changeset
436 %cmp1 = icmp slt i16 %elt2, %min1
anatofuz
parents:
diff changeset
437 %min2 = select i1 %cmp1, i16 %elt2, i16 %min1
anatofuz
parents:
diff changeset
438 %cmp2 = icmp slt i16 %elt3, %min2
anatofuz
parents:
diff changeset
439 %min3 = select i1 %cmp2, i16 %elt3, i16 %min2
anatofuz
parents:
diff changeset
440
anatofuz
parents:
diff changeset
441 %cmp3 = icmp slt i16 %elt4, %min3
anatofuz
parents:
diff changeset
442 %min4 = select i1 %cmp3, i16 %elt4, i16 %min3
anatofuz
parents:
diff changeset
443 %cmp4 = icmp slt i16 %elt5, %min4
anatofuz
parents:
diff changeset
444 %min5 = select i1 %cmp4, i16 %elt5, i16 %min4
anatofuz
parents:
diff changeset
445
anatofuz
parents:
diff changeset
446 %cmp5 = icmp slt i16 %elt6, %min5
anatofuz
parents:
diff changeset
447 %min6 = select i1 %cmp5, i16 %elt6, i16 %min5
anatofuz
parents:
diff changeset
448 %cmp6 = icmp slt i16 %elt7, %min6
anatofuz
parents:
diff changeset
449 %min7 = select i1 %cmp6, i16 %elt7, i16 %min6
anatofuz
parents:
diff changeset
450
anatofuz
parents:
diff changeset
451 %cmp7 = icmp slt i16 %elt8, %min7
anatofuz
parents:
diff changeset
452 %min8 = select i1 %cmp7, i16 %elt8, i16 %min7
anatofuz
parents:
diff changeset
453 %cmp8 = icmp slt i16 %elt9, %min8
anatofuz
parents:
diff changeset
454 %min9 = select i1 %cmp8, i16 %elt9, i16 %min8
anatofuz
parents:
diff changeset
455
anatofuz
parents:
diff changeset
456 %cmp9 = icmp slt i16 %elt10, %min9
anatofuz
parents:
diff changeset
457 %min10 = select i1 %cmp9, i16 %elt10, i16 %min9
anatofuz
parents:
diff changeset
458 %cmp10 = icmp slt i16 %elt11, %min10
anatofuz
parents:
diff changeset
459 %min11 = select i1 %cmp10, i16 %elt11, i16 %min10
anatofuz
parents:
diff changeset
460
anatofuz
parents:
diff changeset
461 %cmp11 = icmp slt i16 %elt12, %min11
anatofuz
parents:
diff changeset
462 %min12 = select i1 %cmp11, i16 %elt12, i16 %min11
anatofuz
parents:
diff changeset
463 %cmp12 = icmp slt i16 %elt13, %min12
anatofuz
parents:
diff changeset
464 %min13 = select i1 %cmp12, i16 %elt13, i16 %min12
anatofuz
parents:
diff changeset
465
anatofuz
parents:
diff changeset
466 %cmp13 = icmp slt i16 %elt14, %min13
anatofuz
parents:
diff changeset
467 %min14 = select i1 %cmp13, i16 %elt14, i16 %min13
anatofuz
parents:
diff changeset
468 %cmp14 = icmp slt i16 %elt15, %min14
anatofuz
parents:
diff changeset
469 %min15 = select i1 %cmp14, i16 %elt15, i16 %min14
anatofuz
parents:
diff changeset
470
anatofuz
parents:
diff changeset
471
anatofuz
parents:
diff changeset
472 ret i16 %min15
anatofuz
parents:
diff changeset
473 }
anatofuz
parents:
diff changeset
474
anatofuz
parents:
diff changeset
; Unsigned-max reduction over the four lanes of %vec4, written as a linear
; chain of icmp ugt + select. The GFX9 checks expect the chain to be replaced
; by a single llvm.vector.reduce.umax.v4i16 call; the VI checks expect the
; scalar extractelement/icmp/select chain to be left as written.
475 define i16 @reduction_umax_v4i16(<4 x i16> %vec4) {
anatofuz
parents:
diff changeset
476 ; GFX9-LABEL: @reduction_umax_v4i16(
anatofuz
parents:
diff changeset
477 ; GFX9-NEXT: entry:
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
478 ; GFX9-NEXT: [[TMP0:%.*]] = call i16 @llvm.vector.reduce.umax.v4i16(<4 x i16> [[VEC4:%.*]])
150
anatofuz
parents:
diff changeset
479 ; GFX9-NEXT: ret i16 [[TMP0]]
anatofuz
parents:
diff changeset
480 ;
anatofuz
parents:
diff changeset
481 ; VI-LABEL: @reduction_umax_v4i16(
anatofuz
parents:
diff changeset
482 ; VI-NEXT: entry:
anatofuz
parents:
diff changeset
483 ; VI-NEXT: [[ELT0:%.*]] = extractelement <4 x i16> [[VEC4:%.*]], i64 0
anatofuz
parents:
diff changeset
484 ; VI-NEXT: [[ELT1:%.*]] = extractelement <4 x i16> [[VEC4]], i64 1
anatofuz
parents:
diff changeset
485 ; VI-NEXT: [[ELT2:%.*]] = extractelement <4 x i16> [[VEC4]], i64 2
anatofuz
parents:
diff changeset
486 ; VI-NEXT: [[ELT3:%.*]] = extractelement <4 x i16> [[VEC4]], i64 3
anatofuz
parents:
diff changeset
487 ; VI-NEXT: [[CMP1:%.*]] = icmp ugt i16 [[ELT1]], [[ELT0]]
anatofuz
parents:
diff changeset
488 ; VI-NEXT: [[MAX1:%.*]] = select i1 [[CMP1]], i16 [[ELT1]], i16 [[ELT0]]
anatofuz
parents:
diff changeset
489 ; VI-NEXT: [[CMP2:%.*]] = icmp ugt i16 [[ELT2]], [[MAX1]]
anatofuz
parents:
diff changeset
490 ; VI-NEXT: [[MAX2:%.*]] = select i1 [[CMP2]], i16 [[ELT2]], i16 [[MAX1]]
anatofuz
parents:
diff changeset
491 ; VI-NEXT: [[CMP3:%.*]] = icmp ugt i16 [[ELT3]], [[MAX2]]
anatofuz
parents:
diff changeset
492 ; VI-NEXT: [[MAX3:%.*]] = select i1 [[CMP3]], i16 [[ELT3]], i16 [[MAX2]]
anatofuz
parents:
diff changeset
493 ; VI-NEXT: ret i16 [[MAX3]]
anatofuz
parents:
diff changeset
494 ;
anatofuz
parents:
diff changeset
495 entry:
anatofuz
parents:
diff changeset
496 %elt0 = extractelement <4 x i16> %vec4, i64 0
anatofuz
parents:
diff changeset
497 %elt1 = extractelement <4 x i16> %vec4, i64 1
anatofuz
parents:
diff changeset
498 %elt2 = extractelement <4 x i16> %vec4, i64 2
anatofuz
parents:
diff changeset
499 %elt3 = extractelement <4 x i16> %vec4, i64 3
anatofuz
parents:
diff changeset
500
anatofuz
parents:
diff changeset
; Each icmp/select pair folds the next lane into the running unsigned maximum.
501 %cmp1 = icmp ugt i16 %elt1, %elt0
anatofuz
parents:
diff changeset
502 %max1 = select i1 %cmp1, i16 %elt1, i16 %elt0
anatofuz
parents:
diff changeset
503 %cmp2 = icmp ugt i16 %elt2, %max1
anatofuz
parents:
diff changeset
504 %max2 = select i1 %cmp2, i16 %elt2, i16 %max1
anatofuz
parents:
diff changeset
505 %cmp3 = icmp ugt i16 %elt3, %max2
anatofuz
parents:
diff changeset
506 %max3 = select i1 %cmp3, i16 %elt3, i16 %max2
anatofuz
parents:
diff changeset
507
anatofuz
parents:
diff changeset
508 ret i16 %max3
anatofuz
parents:
diff changeset
509 }
anatofuz
parents:
diff changeset
510
anatofuz
parents:
diff changeset
; Signed-max reduction over the four lanes of %vec4, written as a linear
; chain of icmp sgt + select. The GFX9 checks expect the chain to be replaced
; by a single llvm.vector.reduce.smax.v4i16 call; the VI checks expect the
; scalar extractelement/icmp/select chain to be left as written.
511 define i16 @reduction_smax_v4i16(<4 x i16> %vec4) {
anatofuz
parents:
diff changeset
512 ; GFX9-LABEL: @reduction_smax_v4i16(
anatofuz
parents:
diff changeset
513 ; GFX9-NEXT: entry:
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
514 ; GFX9-NEXT: [[TMP0:%.*]] = call i16 @llvm.vector.reduce.smax.v4i16(<4 x i16> [[VEC4:%.*]])
150
anatofuz
parents:
diff changeset
515 ; GFX9-NEXT: ret i16 [[TMP0]]
anatofuz
parents:
diff changeset
516 ;
anatofuz
parents:
diff changeset
517 ; VI-LABEL: @reduction_smax_v4i16(
anatofuz
parents:
diff changeset
518 ; VI-NEXT: entry:
anatofuz
parents:
diff changeset
519 ; VI-NEXT: [[ELT0:%.*]] = extractelement <4 x i16> [[VEC4:%.*]], i64 0
anatofuz
parents:
diff changeset
520 ; VI-NEXT: [[ELT1:%.*]] = extractelement <4 x i16> [[VEC4]], i64 1
anatofuz
parents:
diff changeset
521 ; VI-NEXT: [[ELT2:%.*]] = extractelement <4 x i16> [[VEC4]], i64 2
anatofuz
parents:
diff changeset
522 ; VI-NEXT: [[ELT3:%.*]] = extractelement <4 x i16> [[VEC4]], i64 3
anatofuz
parents:
diff changeset
523 ; VI-NEXT: [[CMP1:%.*]] = icmp sgt i16 [[ELT1]], [[ELT0]]
anatofuz
parents:
diff changeset
524 ; VI-NEXT: [[MAX1:%.*]] = select i1 [[CMP1]], i16 [[ELT1]], i16 [[ELT0]]
anatofuz
parents:
diff changeset
525 ; VI-NEXT: [[CMP2:%.*]] = icmp sgt i16 [[ELT2]], [[MAX1]]
anatofuz
parents:
diff changeset
526 ; VI-NEXT: [[MAX2:%.*]] = select i1 [[CMP2]], i16 [[ELT2]], i16 [[MAX1]]
anatofuz
parents:
diff changeset
527 ; VI-NEXT: [[CMP3:%.*]] = icmp sgt i16 [[ELT3]], [[MAX2]]
anatofuz
parents:
diff changeset
528 ; VI-NEXT: [[MAX3:%.*]] = select i1 [[CMP3]], i16 [[ELT3]], i16 [[MAX2]]
anatofuz
parents:
diff changeset
529 ; VI-NEXT: ret i16 [[MAX3]]
anatofuz
parents:
diff changeset
530 ;
anatofuz
parents:
diff changeset
531 entry:
anatofuz
parents:
diff changeset
532 %elt0 = extractelement <4 x i16> %vec4, i64 0
anatofuz
parents:
diff changeset
533 %elt1 = extractelement <4 x i16> %vec4, i64 1
anatofuz
parents:
diff changeset
534 %elt2 = extractelement <4 x i16> %vec4, i64 2
anatofuz
parents:
diff changeset
535 %elt3 = extractelement <4 x i16> %vec4, i64 3
anatofuz
parents:
diff changeset
536
anatofuz
parents:
diff changeset
; Each icmp/select pair folds the next lane into the running signed maximum.
537 %cmp1 = icmp sgt i16 %elt1, %elt0
anatofuz
parents:
diff changeset
538 %max1 = select i1 %cmp1, i16 %elt1, i16 %elt0
anatofuz
parents:
diff changeset
539 %cmp2 = icmp sgt i16 %elt2, %max1
anatofuz
parents:
diff changeset
540 %max2 = select i1 %cmp2, i16 %elt2, i16 %max1
anatofuz
parents:
diff changeset
541 %cmp3 = icmp sgt i16 %elt3, %max2
anatofuz
parents:
diff changeset
542 %max3 = select i1 %cmp3, i16 %elt3, i16 %max2
anatofuz
parents:
diff changeset
543
anatofuz
parents:
diff changeset
544 ret i16 %max3
anatofuz
parents:
diff changeset
545 }
anatofuz
parents:
diff changeset
546
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
547 ; FIXME: Use fmaxnum intrinsics to match what InstCombine creates for fcmp+select
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
548 ; with fastmath on the select.
150
anatofuz
parents:
diff changeset
; Floating-point max over the four lanes of %vec4, written as a linear chain
; of `fcmp fast ogt` + select; the selects themselves carry no fast-math
; flags. The checks use the shared GCN prefix, so both RUN configurations
; expect the scalar chain to be left as written.
549 define half @reduction_fmax_v4half(<4 x half> %vec4) {
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
550 ; GCN-LABEL: @reduction_fmax_v4half(
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
551 ; GCN-NEXT: entry:
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
552 ; GCN-NEXT: [[ELT0:%.*]] = extractelement <4 x half> [[VEC4:%.*]], i64 0
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
553 ; GCN-NEXT: [[ELT1:%.*]] = extractelement <4 x half> [[VEC4]], i64 1
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
554 ; GCN-NEXT: [[ELT2:%.*]] = extractelement <4 x half> [[VEC4]], i64 2
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
555 ; GCN-NEXT: [[ELT3:%.*]] = extractelement <4 x half> [[VEC4]], i64 3
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
556 ; GCN-NEXT: [[CMP1:%.*]] = fcmp fast ogt half [[ELT1]], [[ELT0]]
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
557 ; GCN-NEXT: [[MAX1:%.*]] = select i1 [[CMP1]], half [[ELT1]], half [[ELT0]]
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
558 ; GCN-NEXT: [[CMP2:%.*]] = fcmp fast ogt half [[ELT2]], [[MAX1]]
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
559 ; GCN-NEXT: [[MAX2:%.*]] = select i1 [[CMP2]], half [[ELT2]], half [[MAX1]]
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
560 ; GCN-NEXT: [[CMP3:%.*]] = fcmp fast ogt half [[ELT3]], [[MAX2]]
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
561 ; GCN-NEXT: [[MAX3:%.*]] = select i1 [[CMP3]], half [[ELT3]], half [[MAX2]]
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
562 ; GCN-NEXT: ret half [[MAX3]]
150
anatofuz
parents:
diff changeset
563 ;
anatofuz
parents:
diff changeset
564 entry:
anatofuz
parents:
diff changeset
565 %elt0 = extractelement <4 x half> %vec4, i64 0
anatofuz
parents:
diff changeset
566 %elt1 = extractelement <4 x half> %vec4, i64 1
anatofuz
parents:
diff changeset
567 %elt2 = extractelement <4 x half> %vec4, i64 2
anatofuz
parents:
diff changeset
568 %elt3 = extractelement <4 x half> %vec4, i64 3
anatofuz
parents:
diff changeset
569
anatofuz
parents:
diff changeset
; Each fcmp/select pair folds the next lane into the running maximum.
570 %cmp1 = fcmp fast ogt half %elt1, %elt0
anatofuz
parents:
diff changeset
571 %max1 = select i1 %cmp1, half %elt1, half %elt0
anatofuz
parents:
diff changeset
572 %cmp2 = fcmp fast ogt half %elt2, %max1
anatofuz
parents:
diff changeset
573 %max2 = select i1 %cmp2, half %elt2, half %max1
anatofuz
parents:
diff changeset
574 %cmp3 = fcmp fast ogt half %elt3, %max2
anatofuz
parents:
diff changeset
575 %max3 = select i1 %cmp3, half %elt3, half %max2
anatofuz
parents:
diff changeset
576
anatofuz
parents:
diff changeset
577 ret half %max3
anatofuz
parents:
diff changeset
578 }
anatofuz
parents:
diff changeset
579
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
580 ; FIXME: Use fminnum intrinsics to match what InstCombine creates for fcmp+select
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
581 ; with fastmath on the select.
150
anatofuz
parents:
diff changeset
; Floating-point min over the four lanes of %vec4, written as a linear chain
; of `fcmp fast olt` + select; the selects themselves carry no fast-math
; flags. The checks use the shared GCN prefix, so both RUN configurations
; expect the scalar chain to be left as written.
582 define half @reduction_fmin_v4half(<4 x half> %vec4) {
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
583 ; GCN-LABEL: @reduction_fmin_v4half(
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
584 ; GCN-NEXT: entry:
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
585 ; GCN-NEXT: [[ELT0:%.*]] = extractelement <4 x half> [[VEC4:%.*]], i64 0
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
586 ; GCN-NEXT: [[ELT1:%.*]] = extractelement <4 x half> [[VEC4]], i64 1
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
587 ; GCN-NEXT: [[ELT2:%.*]] = extractelement <4 x half> [[VEC4]], i64 2
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
588 ; GCN-NEXT: [[ELT3:%.*]] = extractelement <4 x half> [[VEC4]], i64 3
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
589 ; GCN-NEXT: [[CMP1:%.*]] = fcmp fast olt half [[ELT1]], [[ELT0]]
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
590 ; GCN-NEXT: [[MIN1:%.*]] = select i1 [[CMP1]], half [[ELT1]], half [[ELT0]]
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
591 ; GCN-NEXT: [[CMP2:%.*]] = fcmp fast olt half [[ELT2]], [[MIN1]]
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
592 ; GCN-NEXT: [[MIN2:%.*]] = select i1 [[CMP2]], half [[ELT2]], half [[MIN1]]
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
593 ; GCN-NEXT: [[CMP3:%.*]] = fcmp fast olt half [[ELT3]], [[MIN2]]
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
594 ; GCN-NEXT: [[MIN3:%.*]] = select i1 [[CMP3]], half [[ELT3]], half [[MIN2]]
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
595 ; GCN-NEXT: ret half [[MIN3]]
150
anatofuz
parents:
diff changeset
596 ;
anatofuz
parents:
diff changeset
597 entry:
anatofuz
parents:
diff changeset
598 %elt0 = extractelement <4 x half> %vec4, i64 0
anatofuz
parents:
diff changeset
599 %elt1 = extractelement <4 x half> %vec4, i64 1
anatofuz
parents:
diff changeset
600 %elt2 = extractelement <4 x half> %vec4, i64 2
anatofuz
parents:
diff changeset
601 %elt3 = extractelement <4 x half> %vec4, i64 3
anatofuz
parents:
diff changeset
602
anatofuz
parents:
diff changeset
; Each fcmp/select pair folds the next lane into the running minimum.
603 %cmp1 = fcmp fast olt half %elt1, %elt0
anatofuz
parents:
diff changeset
604 %min1 = select i1 %cmp1, half %elt1, half %elt0
anatofuz
parents:
diff changeset
605 %cmp2 = fcmp fast olt half %elt2, %min1
anatofuz
parents:
diff changeset
606 %min2 = select i1 %cmp2, half %elt2, half %min1
anatofuz
parents:
diff changeset
607 %cmp3 = fcmp fast olt half %elt3, %min2
anatofuz
parents:
diff changeset
608 %min3 = select i1 %cmp3, half %elt3, half %min2
anatofuz
parents:
diff changeset
609
anatofuz
parents:
diff changeset
610 ret half %min3
anatofuz
parents:
diff changeset
611 }
anatofuz
parents:
diff changeset
612
anatofuz
parents:
diff changeset
613 ; Tests to make sure reduction does not kick in. Vega does not support packed math for types larger than 16 bits.
anatofuz
parents:
diff changeset
; Negative test: a `fadd fast` chain over the four lanes of a <4 x float>.
; The checks use the shared GCN prefix, so both RUN configurations expect
; the scalar extractelement/fadd chain to be left as written, with no
; reduction intrinsic formed.
614 define float @reduction_v4float(<4 x float> %a) {
anatofuz
parents:
diff changeset
615 ; GCN-LABEL: @reduction_v4float(
anatofuz
parents:
diff changeset
616 ; GCN-NEXT: entry:
anatofuz
parents:
diff changeset
617 ; GCN-NEXT: [[ELT0:%.*]] = extractelement <4 x float> [[A:%.*]], i64 0
anatofuz
parents:
diff changeset
618 ; GCN-NEXT: [[ELT1:%.*]] = extractelement <4 x float> [[A]], i64 1
anatofuz
parents:
diff changeset
619 ; GCN-NEXT: [[ELT2:%.*]] = extractelement <4 x float> [[A]], i64 2
anatofuz
parents:
diff changeset
620 ; GCN-NEXT: [[ELT3:%.*]] = extractelement <4 x float> [[A]], i64 3
anatofuz
parents:
diff changeset
621 ; GCN-NEXT: [[ADD1:%.*]] = fadd fast float [[ELT1]], [[ELT0]]
anatofuz
parents:
diff changeset
622 ; GCN-NEXT: [[ADD2:%.*]] = fadd fast float [[ELT2]], [[ADD1]]
anatofuz
parents:
diff changeset
623 ; GCN-NEXT: [[ADD3:%.*]] = fadd fast float [[ELT3]], [[ADD2]]
anatofuz
parents:
diff changeset
624 ; GCN-NEXT: ret float [[ADD3]]
anatofuz
parents:
diff changeset
625 ;
anatofuz
parents:
diff changeset
626 entry:
anatofuz
parents:
diff changeset
627 %elt0 = extractelement <4 x float> %a, i64 0
anatofuz
parents:
diff changeset
628 %elt1 = extractelement <4 x float> %a, i64 1
anatofuz
parents:
diff changeset
629 %elt2 = extractelement <4 x float> %a, i64 2
anatofuz
parents:
diff changeset
630 %elt3 = extractelement <4 x float> %a, i64 3
anatofuz
parents:
diff changeset
631
anatofuz
parents:
diff changeset
; Each fadd folds the next lane into the running sum.
632 %add1 = fadd fast float %elt1, %elt0
anatofuz
parents:
diff changeset
633 %add2 = fadd fast float %elt2, %add1
anatofuz
parents:
diff changeset
634 %add3 = fadd fast float %elt3, %add2
anatofuz
parents:
diff changeset
635
anatofuz
parents:
diff changeset
636 ret float %add3
207
Shinji KONO <kono@ie.u-ryukyu.ac.jp>
parents: 150
diff changeset
637 }