150
|
1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
|
|
2 ; RUN: llc -march=amdgcn -mcpu=gfx900 -verify-machineinstrs < %s | FileCheck -check-prefixes=GFX9 %s
|
|
3 ; RUN: llc -march=amdgcn -mcpu=gfx1010 -verify-machineinstrs < %s | FileCheck -check-prefixes=GFX10 %s
|
|
4
|
|
5 define amdgpu_ps <4 x float> @load_1d(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
6 ; GFX9-LABEL: load_1d:
|
|
7 ; GFX9: ; %bb.0: ; %main_body
|
|
8 ; GFX9-NEXT: image_load v[0:3], v0, s[0:7] dmask:0xf unorm a16
|
|
9 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
10 ; GFX9-NEXT: ; return to shader part epilog
|
|
11 ;
|
|
12 ; GFX10-LABEL: load_1d:
|
|
13 ; GFX10: ; %bb.0: ; %main_body
|
|
14 ; GFX10-NEXT: image_load v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D unorm a16
|
|
15 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
16 ; GFX10-NEXT: ; return to shader part epilog
|
|
17 main_body:
|
|
18 %s = extractelement <2 x i16> %coords, i32 0
|
|
19 %v = call <4 x float> @llvm.amdgcn.image.load.1d.v4f32.i16(i32 15, i16 %s, <8 x i32> %rsrc, i32 0, i32 0)
|
|
20 ret <4 x float> %v
|
|
21 }
|
|
22
|
|
23 define amdgpu_ps <4 x float> @load_2d(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
24 ; GFX9-LABEL: load_2d:
|
|
25 ; GFX9: ; %bb.0: ; %main_body
|
|
26 ; GFX9-NEXT: image_load v[0:3], v0, s[0:7] dmask:0xf unorm a16
|
|
27 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
28 ; GFX9-NEXT: ; return to shader part epilog
|
|
29 ;
|
|
30 ; GFX10-LABEL: load_2d:
|
|
31 ; GFX10: ; %bb.0: ; %main_body
|
|
32 ; GFX10-NEXT: image_load v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D unorm a16
|
|
33 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
34 ; GFX10-NEXT: ; return to shader part epilog
|
|
35 main_body:
|
|
36 %s = extractelement <2 x i16> %coords, i32 0
|
|
37 %t = extractelement <2 x i16> %coords, i32 1
|
|
38 %v = call <4 x float> @llvm.amdgcn.image.load.2d.v4f32.i16(i32 15, i16 %s, i16 %t, <8 x i32> %rsrc, i32 0, i32 0)
|
|
39 ret <4 x float> %v
|
|
40 }
|
|
41
|
|
42 define amdgpu_ps <4 x float> @load_3d(<8 x i32> inreg %rsrc, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
43 ; GFX9-LABEL: load_3d:
|
|
44 ; GFX9: ; %bb.0: ; %main_body
|
|
45 ; GFX9-NEXT: image_load v[0:3], v[0:1], s[0:7] dmask:0xf unorm a16
|
|
46 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
47 ; GFX9-NEXT: ; return to shader part epilog
|
|
48 ;
|
|
49 ; GFX10-LABEL: load_3d:
|
|
50 ; GFX10: ; %bb.0: ; %main_body
|
|
51 ; GFX10-NEXT: image_load v[0:3], v[0:1], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_3D unorm a16
|
|
52 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
53 ; GFX10-NEXT: ; return to shader part epilog
|
|
54 main_body:
|
|
55 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
56 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
57 %r = extractelement <2 x i16> %coords_hi, i32 0
|
|
58 %v = call <4 x float> @llvm.amdgcn.image.load.3d.v4f32.i16(i32 15, i16 %s, i16 %t, i16 %r, <8 x i32> %rsrc, i32 0, i32 0)
|
|
59 ret <4 x float> %v
|
|
60 }
|
|
61
|
|
62 define amdgpu_ps <4 x float> @load_cube(<8 x i32> inreg %rsrc, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
63 ; GFX9-LABEL: load_cube:
|
|
64 ; GFX9: ; %bb.0: ; %main_body
|
|
65 ; GFX9-NEXT: image_load v[0:3], v[0:1], s[0:7] dmask:0xf unorm a16 da
|
|
66 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
67 ; GFX9-NEXT: ; return to shader part epilog
|
|
68 ;
|
|
69 ; GFX10-LABEL: load_cube:
|
|
70 ; GFX10: ; %bb.0: ; %main_body
|
|
71 ; GFX10-NEXT: image_load v[0:3], v[0:1], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_CUBE unorm a16
|
|
72 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
73 ; GFX10-NEXT: ; return to shader part epilog
|
|
74 main_body:
|
|
75 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
76 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
77 %slice = extractelement <2 x i16> %coords_hi, i32 0
|
|
78 %v = call <4 x float> @llvm.amdgcn.image.load.cube.v4f32.i16(i32 15, i16 %s, i16 %t, i16 %slice, <8 x i32> %rsrc, i32 0, i32 0)
|
|
79 ret <4 x float> %v
|
|
80 }
|
|
81
|
|
82 define amdgpu_ps <4 x float> @load_1darray(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
83 ; GFX9-LABEL: load_1darray:
|
|
84 ; GFX9: ; %bb.0: ; %main_body
|
|
85 ; GFX9-NEXT: image_load v[0:3], v0, s[0:7] dmask:0xf unorm a16 da
|
|
86 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
87 ; GFX9-NEXT: ; return to shader part epilog
|
|
88 ;
|
|
89 ; GFX10-LABEL: load_1darray:
|
|
90 ; GFX10: ; %bb.0: ; %main_body
|
|
91 ; GFX10-NEXT: image_load v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D_ARRAY unorm a16
|
|
92 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
93 ; GFX10-NEXT: ; return to shader part epilog
|
|
94 main_body:
|
|
95 %s = extractelement <2 x i16> %coords, i32 0
|
|
96 %slice = extractelement <2 x i16> %coords, i32 1
|
|
97 %v = call <4 x float> @llvm.amdgcn.image.load.1darray.v4f32.i16(i32 15, i16 %s, i16 %slice, <8 x i32> %rsrc, i32 0, i32 0)
|
|
98 ret <4 x float> %v
|
|
99 }
|
|
100
|
|
101 define amdgpu_ps <4 x float> @load_2darray(<8 x i32> inreg %rsrc, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
102 ; GFX9-LABEL: load_2darray:
|
|
103 ; GFX9: ; %bb.0: ; %main_body
|
|
104 ; GFX9-NEXT: image_load v[0:3], v[0:1], s[0:7] dmask:0xf unorm a16 da
|
|
105 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
106 ; GFX9-NEXT: ; return to shader part epilog
|
|
107 ;
|
|
108 ; GFX10-LABEL: load_2darray:
|
|
109 ; GFX10: ; %bb.0: ; %main_body
|
|
110 ; GFX10-NEXT: image_load v[0:3], v[0:1], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D_ARRAY unorm a16
|
|
111 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
112 ; GFX10-NEXT: ; return to shader part epilog
|
|
113 main_body:
|
|
114 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
115 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
116 %slice = extractelement <2 x i16> %coords_hi, i32 0
|
|
117 %v = call <4 x float> @llvm.amdgcn.image.load.2darray.v4f32.i16(i32 15, i16 %s, i16 %t, i16 %slice, <8 x i32> %rsrc, i32 0, i32 0)
|
|
118 ret <4 x float> %v
|
|
119 }
|
|
120
|
|
121 define amdgpu_ps <4 x float> @load_2dmsaa(<8 x i32> inreg %rsrc, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
122 ; GFX9-LABEL: load_2dmsaa:
|
|
123 ; GFX9: ; %bb.0: ; %main_body
|
|
124 ; GFX9-NEXT: image_load v[0:3], v[0:1], s[0:7] dmask:0xf unorm a16
|
|
125 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
126 ; GFX9-NEXT: ; return to shader part epilog
|
|
127 ;
|
|
128 ; GFX10-LABEL: load_2dmsaa:
|
|
129 ; GFX10: ; %bb.0: ; %main_body
|
|
130 ; GFX10-NEXT: image_load v[0:3], v[0:1], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D_MSAA unorm a16
|
|
131 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
132 ; GFX10-NEXT: ; return to shader part epilog
|
|
133 main_body:
|
|
134 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
135 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
136 %fragid = extractelement <2 x i16> %coords_hi, i32 0
|
|
137 %v = call <4 x float> @llvm.amdgcn.image.load.2dmsaa.v4f32.i16(i32 15, i16 %s, i16 %t, i16 %fragid, <8 x i32> %rsrc, i32 0, i32 0)
|
|
138 ret <4 x float> %v
|
|
139 }
|
|
140
|
|
141 define amdgpu_ps <4 x float> @load_2darraymsaa(<8 x i32> inreg %rsrc, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
142 ; GFX9-LABEL: load_2darraymsaa:
|
|
143 ; GFX9: ; %bb.0: ; %main_body
|
|
144 ; GFX9-NEXT: image_load v[0:3], v[0:1], s[0:7] dmask:0xf unorm a16 da
|
|
145 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
146 ; GFX9-NEXT: ; return to shader part epilog
|
|
147 ;
|
|
148 ; GFX10-LABEL: load_2darraymsaa:
|
|
149 ; GFX10: ; %bb.0: ; %main_body
|
|
150 ; GFX10-NEXT: image_load v[0:3], v[0:1], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D_MSAA_ARRAY unorm a16
|
|
151 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
152 ; GFX10-NEXT: ; return to shader part epilog
|
|
153 main_body:
|
|
154 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
155 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
156 %slice = extractelement <2 x i16> %coords_hi, i32 0
|
|
157 %fragid = extractelement <2 x i16> %coords_hi, i32 1
|
|
158 %v = call <4 x float> @llvm.amdgcn.image.load.2darraymsaa.v4f32.i16(i32 15, i16 %s, i16 %t, i16 %slice, i16 %fragid, <8 x i32> %rsrc, i32 0, i32 0)
|
|
159 ret <4 x float> %v
|
|
160 }
|
|
161
|
|
162 define amdgpu_ps <4 x float> @load_mip_1d(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
163 ; GFX9-LABEL: load_mip_1d:
|
|
164 ; GFX9: ; %bb.0: ; %main_body
|
|
165 ; GFX9-NEXT: image_load_mip v[0:3], v0, s[0:7] dmask:0xf unorm a16
|
|
166 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
167 ; GFX9-NEXT: ; return to shader part epilog
|
|
168 ;
|
|
169 ; GFX10-LABEL: load_mip_1d:
|
|
170 ; GFX10: ; %bb.0: ; %main_body
|
|
171 ; GFX10-NEXT: image_load_mip v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D unorm a16
|
|
172 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
173 ; GFX10-NEXT: ; return to shader part epilog
|
|
174 main_body:
|
|
175 %s = extractelement <2 x i16> %coords, i32 0
|
|
176 %mip = extractelement <2 x i16> %coords, i32 1
|
|
177 %v = call <4 x float> @llvm.amdgcn.image.load.mip.1d.v4f32.i16(i32 15, i16 %s, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
178 ret <4 x float> %v
|
|
179 }
|
|
180
|
|
181 define amdgpu_ps <4 x float> @load_mip_2d(<8 x i32> inreg %rsrc, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
182 ; GFX9-LABEL: load_mip_2d:
|
|
183 ; GFX9: ; %bb.0: ; %main_body
|
|
184 ; GFX9-NEXT: image_load_mip v[0:3], v[0:1], s[0:7] dmask:0xf unorm a16
|
|
185 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
186 ; GFX9-NEXT: ; return to shader part epilog
|
|
187 ;
|
|
188 ; GFX10-LABEL: load_mip_2d:
|
|
189 ; GFX10: ; %bb.0: ; %main_body
|
|
190 ; GFX10-NEXT: image_load_mip v[0:3], v[0:1], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D unorm a16
|
|
191 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
192 ; GFX10-NEXT: ; return to shader part epilog
|
|
193 main_body:
|
|
194 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
195 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
196 %mip = extractelement <2 x i16> %coords_hi, i32 0
|
|
197 %v = call <4 x float> @llvm.amdgcn.image.load.mip.2d.v4f32.i16(i32 15, i16 %s, i16 %t, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
198 ret <4 x float> %v
|
|
199 }
|
|
200
|
|
201 define amdgpu_ps <4 x float> @load_mip_3d(<8 x i32> inreg %rsrc, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
202 ; GFX9-LABEL: load_mip_3d:
|
|
203 ; GFX9: ; %bb.0: ; %main_body
|
|
204 ; GFX9-NEXT: image_load_mip v[0:3], v[0:1], s[0:7] dmask:0xf unorm a16
|
|
205 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
206 ; GFX9-NEXT: ; return to shader part epilog
|
|
207 ;
|
|
208 ; GFX10-LABEL: load_mip_3d:
|
|
209 ; GFX10: ; %bb.0: ; %main_body
|
|
210 ; GFX10-NEXT: image_load_mip v[0:3], v[0:1], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_3D unorm a16
|
|
211 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
212 ; GFX10-NEXT: ; return to shader part epilog
|
|
213 main_body:
|
|
214 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
215 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
216 %r = extractelement <2 x i16> %coords_hi, i32 0
|
|
217 %mip = extractelement <2 x i16> %coords_hi, i32 1
|
|
218 %v = call <4 x float> @llvm.amdgcn.image.load.mip.3d.v4f32.i16(i32 15, i16 %s, i16 %t, i16 %r, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
219 ret <4 x float> %v
|
|
220 }
|
|
221
|
|
222 define amdgpu_ps <4 x float> @load_mip_cube(<8 x i32> inreg %rsrc, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
223 ; GFX9-LABEL: load_mip_cube:
|
|
224 ; GFX9: ; %bb.0: ; %main_body
|
|
225 ; GFX9-NEXT: image_load_mip v[0:3], v[0:1], s[0:7] dmask:0xf unorm a16 da
|
|
226 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
227 ; GFX9-NEXT: ; return to shader part epilog
|
|
228 ;
|
|
229 ; GFX10-LABEL: load_mip_cube:
|
|
230 ; GFX10: ; %bb.0: ; %main_body
|
|
231 ; GFX10-NEXT: image_load_mip v[0:3], v[0:1], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_CUBE unorm a16
|
|
232 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
233 ; GFX10-NEXT: ; return to shader part epilog
|
|
234 main_body:
|
|
235 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
236 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
237 %slice = extractelement <2 x i16> %coords_hi, i32 0
|
|
238 %mip = extractelement <2 x i16> %coords_hi, i32 1
|
|
239 %v = call <4 x float> @llvm.amdgcn.image.load.mip.cube.v4f32.i16(i32 15, i16 %s, i16 %t, i16 %slice, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
240 ret <4 x float> %v
|
|
241 }
|
|
242
|
|
243 define amdgpu_ps <4 x float> @load_mip_1darray(<8 x i32> inreg %rsrc, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
244 ; GFX9-LABEL: load_mip_1darray:
|
|
245 ; GFX9: ; %bb.0: ; %main_body
|
|
246 ; GFX9-NEXT: image_load_mip v[0:3], v[0:1], s[0:7] dmask:0xf unorm a16 da
|
|
247 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
248 ; GFX9-NEXT: ; return to shader part epilog
|
|
249 ;
|
|
250 ; GFX10-LABEL: load_mip_1darray:
|
|
251 ; GFX10: ; %bb.0: ; %main_body
|
|
252 ; GFX10-NEXT: image_load_mip v[0:3], v[0:1], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D_ARRAY unorm a16
|
|
253 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
254 ; GFX10-NEXT: ; return to shader part epilog
|
|
255 main_body:
|
|
256 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
257 %slice = extractelement <2 x i16> %coords_lo, i32 1
|
|
258 %mip = extractelement <2 x i16> %coords_hi, i32 0
|
|
259 %v = call <4 x float> @llvm.amdgcn.image.load.mip.1darray.v4f32.i16(i32 15, i16 %s, i16 %slice, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
260 ret <4 x float> %v
|
|
261 }
|
|
262
|
|
263 define amdgpu_ps <4 x float> @load_mip_2darray(<8 x i32> inreg %rsrc, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
264 ; GFX9-LABEL: load_mip_2darray:
|
|
265 ; GFX9: ; %bb.0: ; %main_body
|
|
266 ; GFX9-NEXT: image_load_mip v[0:3], v[0:1], s[0:7] dmask:0xf unorm a16 da
|
|
267 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
268 ; GFX9-NEXT: ; return to shader part epilog
|
|
269 ;
|
|
270 ; GFX10-LABEL: load_mip_2darray:
|
|
271 ; GFX10: ; %bb.0: ; %main_body
|
|
272 ; GFX10-NEXT: image_load_mip v[0:3], v[0:1], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D_ARRAY unorm a16
|
|
273 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
274 ; GFX10-NEXT: ; return to shader part epilog
|
|
275 main_body:
|
|
276 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
277 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
278 %slice = extractelement <2 x i16> %coords_hi, i32 0
|
|
279 %mip = extractelement <2 x i16> %coords_hi, i32 1
|
|
280 %v = call <4 x float> @llvm.amdgcn.image.load.mip.2darray.v4f32.i16(i32 15, i16 %s, i16 %t, i16 %slice, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
281 ret <4 x float> %v
|
|
282 }
|
|
283
|
|
284 define amdgpu_ps void @store_1d(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords) {
|
|
285 ; GFX9-LABEL: store_1d:
|
|
286 ; GFX9: ; %bb.0: ; %main_body
|
|
287 ; GFX9-NEXT: image_store v[0:3], v4, s[0:7] dmask:0xf unorm a16
|
|
288 ; GFX9-NEXT: s_endpgm
|
|
289 ;
|
|
290 ; GFX10-LABEL: store_1d:
|
|
291 ; GFX10: ; %bb.0: ; %main_body
|
|
292 ; GFX10-NEXT: image_store v[0:3], v4, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D unorm a16
|
|
293 ; GFX10-NEXT: s_endpgm
|
|
294 main_body:
|
|
295 %s = extractelement <2 x i16> %coords, i32 0
|
|
296 call void @llvm.amdgcn.image.store.1d.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, <8 x i32> %rsrc, i32 0, i32 0)
|
|
297 ret void
|
|
298 }
|
|
299
|
|
300 define amdgpu_ps void @store_2d(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords) {
|
|
301 ; GFX9-LABEL: store_2d:
|
|
302 ; GFX9: ; %bb.0: ; %main_body
|
|
303 ; GFX9-NEXT: image_store v[0:3], v4, s[0:7] dmask:0xf unorm a16
|
|
304 ; GFX9-NEXT: s_endpgm
|
|
305 ;
|
|
306 ; GFX10-LABEL: store_2d:
|
|
307 ; GFX10: ; %bb.0: ; %main_body
|
|
308 ; GFX10-NEXT: image_store v[0:3], v4, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D unorm a16
|
|
309 ; GFX10-NEXT: s_endpgm
|
|
310 main_body:
|
|
311 %s = extractelement <2 x i16> %coords, i32 0
|
|
312 %t = extractelement <2 x i16> %coords, i32 1
|
|
313 call void @llvm.amdgcn.image.store.2d.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, i16 %t, <8 x i32> %rsrc, i32 0, i32 0)
|
|
314 ret void
|
|
315 }
|
|
316
|
|
317 define amdgpu_ps void @store_3d(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
318 ; GFX9-LABEL: store_3d:
|
|
319 ; GFX9: ; %bb.0: ; %main_body
|
|
320 ; GFX9-NEXT: image_store v[0:3], v[4:5], s[0:7] dmask:0xf unorm a16
|
|
321 ; GFX9-NEXT: s_endpgm
|
|
322 ;
|
|
323 ; GFX10-LABEL: store_3d:
|
|
324 ; GFX10: ; %bb.0: ; %main_body
|
|
325 ; GFX10-NEXT: image_store v[0:3], v[4:5], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_3D unorm a16
|
|
326 ; GFX10-NEXT: s_endpgm
|
|
327 main_body:
|
|
328 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
329 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
330 %r = extractelement <2 x i16> %coords_hi, i32 0
|
|
331 call void @llvm.amdgcn.image.store.3d.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, i16 %t, i16 %r, <8 x i32> %rsrc, i32 0, i32 0)
|
|
332 ret void
|
|
333 }
|
|
334
|
|
335 define amdgpu_ps void @store_cube(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
336 ; GFX9-LABEL: store_cube:
|
|
337 ; GFX9: ; %bb.0: ; %main_body
|
|
338 ; GFX9-NEXT: image_store v[0:3], v[4:5], s[0:7] dmask:0xf unorm a16 da
|
|
339 ; GFX9-NEXT: s_endpgm
|
|
340 ;
|
|
341 ; GFX10-LABEL: store_cube:
|
|
342 ; GFX10: ; %bb.0: ; %main_body
|
|
343 ; GFX10-NEXT: image_store v[0:3], v[4:5], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_CUBE unorm a16
|
|
344 ; GFX10-NEXT: s_endpgm
|
|
345 main_body:
|
|
346 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
347 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
348 %slice = extractelement <2 x i16> %coords_hi, i32 0
|
|
349 call void @llvm.amdgcn.image.store.cube.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, i16 %t, i16 %slice, <8 x i32> %rsrc, i32 0, i32 0)
|
|
350 ret void
|
|
351 }
|
|
352
|
|
353 define amdgpu_ps void @store_1darray(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords) {
|
|
354 ; GFX9-LABEL: store_1darray:
|
|
355 ; GFX9: ; %bb.0: ; %main_body
|
|
356 ; GFX9-NEXT: image_store v[0:3], v4, s[0:7] dmask:0xf unorm a16 da
|
|
357 ; GFX9-NEXT: s_endpgm
|
|
358 ;
|
|
359 ; GFX10-LABEL: store_1darray:
|
|
360 ; GFX10: ; %bb.0: ; %main_body
|
|
361 ; GFX10-NEXT: image_store v[0:3], v4, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D_ARRAY unorm a16
|
|
362 ; GFX10-NEXT: s_endpgm
|
|
363 main_body:
|
|
364 %s = extractelement <2 x i16> %coords, i32 0
|
|
365 %slice = extractelement <2 x i16> %coords, i32 1
|
|
366 call void @llvm.amdgcn.image.store.1darray.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, i16 %slice, <8 x i32> %rsrc, i32 0, i32 0)
|
|
367 ret void
|
|
368 }
|
|
369
|
|
370 define amdgpu_ps void @store_2darray(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
371 ; GFX9-LABEL: store_2darray:
|
|
372 ; GFX9: ; %bb.0: ; %main_body
|
|
373 ; GFX9-NEXT: image_store v[0:3], v[4:5], s[0:7] dmask:0xf unorm a16 da
|
|
374 ; GFX9-NEXT: s_endpgm
|
|
375 ;
|
|
376 ; GFX10-LABEL: store_2darray:
|
|
377 ; GFX10: ; %bb.0: ; %main_body
|
|
378 ; GFX10-NEXT: image_store v[0:3], v[4:5], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D_ARRAY unorm a16
|
|
379 ; GFX10-NEXT: s_endpgm
|
|
380 main_body:
|
|
381 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
382 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
383 %slice = extractelement <2 x i16> %coords_hi, i32 0
|
|
384 call void @llvm.amdgcn.image.store.2darray.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, i16 %t, i16 %slice, <8 x i32> %rsrc, i32 0, i32 0)
|
|
385 ret void
|
|
386 }
|
|
387
|
|
388 define amdgpu_ps void @store_2dmsaa(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
389 ; GFX9-LABEL: store_2dmsaa:
|
|
390 ; GFX9: ; %bb.0: ; %main_body
|
|
391 ; GFX9-NEXT: image_store v[0:3], v[4:5], s[0:7] dmask:0xf unorm a16
|
|
392 ; GFX9-NEXT: s_endpgm
|
|
393 ;
|
|
394 ; GFX10-LABEL: store_2dmsaa:
|
|
395 ; GFX10: ; %bb.0: ; %main_body
|
|
396 ; GFX10-NEXT: image_store v[0:3], v[4:5], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D_MSAA unorm a16
|
|
397 ; GFX10-NEXT: s_endpgm
|
|
398 main_body:
|
|
399 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
400 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
401 %fragid = extractelement <2 x i16> %coords_hi, i32 0
|
|
402 call void @llvm.amdgcn.image.store.2dmsaa.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, i16 %t, i16 %fragid, <8 x i32> %rsrc, i32 0, i32 0)
|
|
403 ret void
|
|
404 }
|
|
405
|
|
406 define amdgpu_ps void @store_2darraymsaa(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
407 ; GFX9-LABEL: store_2darraymsaa:
|
|
408 ; GFX9: ; %bb.0: ; %main_body
|
|
409 ; GFX9-NEXT: image_store v[0:3], v[4:5], s[0:7] dmask:0xf unorm a16 da
|
|
410 ; GFX9-NEXT: s_endpgm
|
|
411 ;
|
|
412 ; GFX10-LABEL: store_2darraymsaa:
|
|
413 ; GFX10: ; %bb.0: ; %main_body
|
|
414 ; GFX10-NEXT: image_store v[0:3], v[4:5], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D_MSAA_ARRAY unorm a16
|
|
415 ; GFX10-NEXT: s_endpgm
|
|
416 main_body:
|
|
417 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
418 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
419 %slice = extractelement <2 x i16> %coords_hi, i32 0
|
|
420 %fragid = extractelement <2 x i16> %coords_hi, i32 1
|
|
421 call void @llvm.amdgcn.image.store.2darraymsaa.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, i16 %t, i16 %slice, i16 %fragid, <8 x i32> %rsrc, i32 0, i32 0)
|
|
422 ret void
|
|
423 }
|
|
424
|
|
425 define amdgpu_ps void @store_mip_1d(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords) {
|
|
426 ; GFX9-LABEL: store_mip_1d:
|
|
427 ; GFX9: ; %bb.0: ; %main_body
|
|
428 ; GFX9-NEXT: image_store_mip v[0:3], v4, s[0:7] dmask:0xf unorm a16
|
|
429 ; GFX9-NEXT: s_endpgm
|
|
430 ;
|
|
431 ; GFX10-LABEL: store_mip_1d:
|
|
432 ; GFX10: ; %bb.0: ; %main_body
|
|
433 ; GFX10-NEXT: image_store_mip v[0:3], v4, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D unorm a16
|
|
434 ; GFX10-NEXT: s_endpgm
|
|
435 main_body:
|
|
436 %s = extractelement <2 x i16> %coords, i32 0
|
|
437 %mip = extractelement <2 x i16> %coords, i32 1
|
|
438 call void @llvm.amdgcn.image.store.mip.1d.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
439 ret void
|
|
440 }
|
|
441
|
|
442 define amdgpu_ps void @store_mip_2d(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
443 ; GFX9-LABEL: store_mip_2d:
|
|
444 ; GFX9: ; %bb.0: ; %main_body
|
|
445 ; GFX9-NEXT: image_store_mip v[0:3], v[4:5], s[0:7] dmask:0xf unorm a16
|
|
446 ; GFX9-NEXT: s_endpgm
|
|
447 ;
|
|
448 ; GFX10-LABEL: store_mip_2d:
|
|
449 ; GFX10: ; %bb.0: ; %main_body
|
|
450 ; GFX10-NEXT: image_store_mip v[0:3], v[4:5], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D unorm a16
|
|
451 ; GFX10-NEXT: s_endpgm
|
|
452 main_body:
|
|
453 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
454 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
455 %mip = extractelement <2 x i16> %coords_hi, i32 0
|
|
456 call void @llvm.amdgcn.image.store.mip.2d.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, i16 %t, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
457 ret void
|
|
458 }
|
|
459
|
|
460 define amdgpu_ps void @store_mip_3d(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
461 ; GFX9-LABEL: store_mip_3d:
|
|
462 ; GFX9: ; %bb.0: ; %main_body
|
|
463 ; GFX9-NEXT: image_store_mip v[0:3], v[4:5], s[0:7] dmask:0xf unorm a16
|
|
464 ; GFX9-NEXT: s_endpgm
|
|
465 ;
|
|
466 ; GFX10-LABEL: store_mip_3d:
|
|
467 ; GFX10: ; %bb.0: ; %main_body
|
|
468 ; GFX10-NEXT: image_store_mip v[0:3], v[4:5], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_3D unorm a16
|
|
469 ; GFX10-NEXT: s_endpgm
|
|
470 main_body:
|
|
471 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
472 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
473 %r = extractelement <2 x i16> %coords_hi, i32 0
|
|
474 %mip = extractelement <2 x i16> %coords_hi, i32 1
|
|
475 call void @llvm.amdgcn.image.store.mip.3d.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, i16 %t, i16 %r, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
476 ret void
|
|
477 }
|
|
478
|
|
479 define amdgpu_ps void @store_mip_cube(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
480 ; GFX9-LABEL: store_mip_cube:
|
|
481 ; GFX9: ; %bb.0: ; %main_body
|
|
482 ; GFX9-NEXT: image_store_mip v[0:3], v[4:5], s[0:7] dmask:0xf unorm a16 da
|
|
483 ; GFX9-NEXT: s_endpgm
|
|
484 ;
|
|
485 ; GFX10-LABEL: store_mip_cube:
|
|
486 ; GFX10: ; %bb.0: ; %main_body
|
|
487 ; GFX10-NEXT: image_store_mip v[0:3], v[4:5], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_CUBE unorm a16
|
|
488 ; GFX10-NEXT: s_endpgm
|
|
489 main_body:
|
|
490 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
491 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
492 %slice = extractelement <2 x i16> %coords_hi, i32 0
|
|
493 %mip = extractelement <2 x i16> %coords_hi, i32 1
|
|
494 call void @llvm.amdgcn.image.store.mip.cube.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, i16 %t, i16 %slice, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
495 ret void
|
|
496 }
|
|
497
|
|
498 define amdgpu_ps void @store_mip_1darray(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
499 ; GFX9-LABEL: store_mip_1darray:
|
|
500 ; GFX9: ; %bb.0: ; %main_body
|
|
501 ; GFX9-NEXT: image_store_mip v[0:3], v[4:5], s[0:7] dmask:0xf unorm a16 da
|
|
502 ; GFX9-NEXT: s_endpgm
|
|
503 ;
|
|
504 ; GFX10-LABEL: store_mip_1darray:
|
|
505 ; GFX10: ; %bb.0: ; %main_body
|
|
506 ; GFX10-NEXT: image_store_mip v[0:3], v[4:5], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D_ARRAY unorm a16
|
|
507 ; GFX10-NEXT: s_endpgm
|
|
508 main_body:
|
|
509 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
510 %slice = extractelement <2 x i16> %coords_lo, i32 1
|
|
511 %mip = extractelement <2 x i16> %coords_hi, i32 0
|
|
512 call void @llvm.amdgcn.image.store.mip.1darray.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, i16 %slice, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
513 ret void
|
|
514 }
|
|
515
|
|
516 define amdgpu_ps void @store_mip_2darray(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords_lo, <2 x i16> %coords_hi) {
|
|
517 ; GFX9-LABEL: store_mip_2darray:
|
|
518 ; GFX9: ; %bb.0: ; %main_body
|
|
519 ; GFX9-NEXT: image_store_mip v[0:3], v[4:5], s[0:7] dmask:0xf unorm a16 da
|
|
520 ; GFX9-NEXT: s_endpgm
|
|
521 ;
|
|
522 ; GFX10-LABEL: store_mip_2darray:
|
|
523 ; GFX10: ; %bb.0: ; %main_body
|
|
524 ; GFX10-NEXT: image_store_mip v[0:3], v[4:5], s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D_ARRAY unorm a16
|
|
525 ; GFX10-NEXT: s_endpgm
|
|
526 main_body:
|
|
527 %s = extractelement <2 x i16> %coords_lo, i32 0
|
|
528 %t = extractelement <2 x i16> %coords_lo, i32 1
|
|
529 %slice = extractelement <2 x i16> %coords_hi, i32 0
|
|
530 %mip = extractelement <2 x i16> %coords_hi, i32 1
|
|
531 call void @llvm.amdgcn.image.store.mip.2darray.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, i16 %t, i16 %slice, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
532 ret void
|
|
533 }
|
|
534
|
|
535 define amdgpu_ps <4 x float> @getresinfo_1d(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
536 ; GFX9-LABEL: getresinfo_1d:
|
|
537 ; GFX9: ; %bb.0: ; %main_body
|
|
538 ; GFX9-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf unorm a16
|
|
539 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
540 ; GFX9-NEXT: ; return to shader part epilog
|
|
541 ;
|
|
542 ; GFX10-LABEL: getresinfo_1d:
|
|
543 ; GFX10: ; %bb.0: ; %main_body
|
|
544 ; GFX10-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D unorm a16
|
|
545 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
546 ; GFX10-NEXT: ; return to shader part epilog
|
|
547 main_body:
|
|
548 %mip = extractelement <2 x i16> %coords, i32 0
|
|
549 %v = call <4 x float> @llvm.amdgcn.image.getresinfo.1d.v4f32.i16(i32 15, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
550 ret <4 x float> %v
|
|
551 }
|
|
552
|
|
553 define amdgpu_ps <4 x float> @getresinfo_2d(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
554 ; GFX9-LABEL: getresinfo_2d:
|
|
555 ; GFX9: ; %bb.0: ; %main_body
|
|
556 ; GFX9-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf unorm a16
|
|
557 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
558 ; GFX9-NEXT: ; return to shader part epilog
|
|
559 ;
|
|
560 ; GFX10-LABEL: getresinfo_2d:
|
|
561 ; GFX10: ; %bb.0: ; %main_body
|
|
562 ; GFX10-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D unorm a16
|
|
563 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
564 ; GFX10-NEXT: ; return to shader part epilog
|
|
565 main_body:
|
|
566 %mip = extractelement <2 x i16> %coords, i32 0
|
|
567 %v = call <4 x float> @llvm.amdgcn.image.getresinfo.2d.v4f32.i16(i32 15, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
568 ret <4 x float> %v
|
|
569 }
|
|
570
|
|
571 define amdgpu_ps <4 x float> @getresinfo_3d(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
572 ; GFX9-LABEL: getresinfo_3d:
|
|
573 ; GFX9: ; %bb.0: ; %main_body
|
|
574 ; GFX9-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf unorm a16
|
|
575 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
576 ; GFX9-NEXT: ; return to shader part epilog
|
|
577 ;
|
|
578 ; GFX10-LABEL: getresinfo_3d:
|
|
579 ; GFX10: ; %bb.0: ; %main_body
|
|
580 ; GFX10-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_3D unorm a16
|
|
581 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
582 ; GFX10-NEXT: ; return to shader part epilog
|
|
583 main_body:
|
|
584 %mip = extractelement <2 x i16> %coords, i32 0
|
|
585 %v = call <4 x float> @llvm.amdgcn.image.getresinfo.3d.v4f32.i16(i32 15, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
586 ret <4 x float> %v
|
|
587 }
|
|
588
|
|
589 define amdgpu_ps <4 x float> @getresinfo_cube(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
590 ; GFX9-LABEL: getresinfo_cube:
|
|
591 ; GFX9: ; %bb.0: ; %main_body
|
|
592 ; GFX9-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf unorm a16 da
|
|
593 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
594 ; GFX9-NEXT: ; return to shader part epilog
|
|
595 ;
|
|
596 ; GFX10-LABEL: getresinfo_cube:
|
|
597 ; GFX10: ; %bb.0: ; %main_body
|
|
598 ; GFX10-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_CUBE unorm a16
|
|
599 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
600 ; GFX10-NEXT: ; return to shader part epilog
|
|
601 main_body:
|
|
602 %mip = extractelement <2 x i16> %coords, i32 0
|
|
603 %v = call <4 x float> @llvm.amdgcn.image.getresinfo.cube.v4f32.i16(i32 15, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
604 ret <4 x float> %v
|
|
605 }
|
|
606
|
|
607 define amdgpu_ps <4 x float> @getresinfo_1darray(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
608 ; GFX9-LABEL: getresinfo_1darray:
|
|
609 ; GFX9: ; %bb.0: ; %main_body
|
|
610 ; GFX9-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf unorm a16 da
|
|
611 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
612 ; GFX9-NEXT: ; return to shader part epilog
|
|
613 ;
|
|
614 ; GFX10-LABEL: getresinfo_1darray:
|
|
615 ; GFX10: ; %bb.0: ; %main_body
|
|
616 ; GFX10-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D_ARRAY unorm a16
|
|
617 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
618 ; GFX10-NEXT: ; return to shader part epilog
|
|
619 main_body:
|
|
620 %mip = extractelement <2 x i16> %coords, i32 0
|
|
621 %v = call <4 x float> @llvm.amdgcn.image.getresinfo.1darray.v4f32.i16(i32 15, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
622 ret <4 x float> %v
|
|
623 }
|
|
624
|
|
625 define amdgpu_ps <4 x float> @getresinfo_2darray(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
626 ; GFX9-LABEL: getresinfo_2darray:
|
|
627 ; GFX9: ; %bb.0: ; %main_body
|
|
628 ; GFX9-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf unorm a16 da
|
|
629 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
630 ; GFX9-NEXT: ; return to shader part epilog
|
|
631 ;
|
|
632 ; GFX10-LABEL: getresinfo_2darray:
|
|
633 ; GFX10: ; %bb.0: ; %main_body
|
|
634 ; GFX10-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D_ARRAY unorm a16
|
|
635 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
636 ; GFX10-NEXT: ; return to shader part epilog
|
|
637 main_body:
|
|
638 %mip = extractelement <2 x i16> %coords, i32 0
|
|
639 %v = call <4 x float> @llvm.amdgcn.image.getresinfo.2darray.v4f32.i16(i32 15, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
640 ret <4 x float> %v
|
|
641 }
|
|
642
|
|
643 define amdgpu_ps <4 x float> @getresinfo_2dmsaa(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
644 ; GFX9-LABEL: getresinfo_2dmsaa:
|
|
645 ; GFX9: ; %bb.0: ; %main_body
|
|
646 ; GFX9-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf unorm a16
|
|
647 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
648 ; GFX9-NEXT: ; return to shader part epilog
|
|
649 ;
|
|
650 ; GFX10-LABEL: getresinfo_2dmsaa:
|
|
651 ; GFX10: ; %bb.0: ; %main_body
|
|
652 ; GFX10-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D_MSAA unorm a16
|
|
653 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
654 ; GFX10-NEXT: ; return to shader part epilog
|
|
655 main_body:
|
|
656 %mip = extractelement <2 x i16> %coords, i32 0
|
|
657 %v = call <4 x float> @llvm.amdgcn.image.getresinfo.2dmsaa.v4f32.i16(i32 15, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
658 ret <4 x float> %v
|
|
659 }
|
|
660
|
|
661 define amdgpu_ps <4 x float> @getresinfo_2darraymsaa(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
662 ; GFX9-LABEL: getresinfo_2darraymsaa:
|
|
663 ; GFX9: ; %bb.0: ; %main_body
|
|
664 ; GFX9-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf unorm a16 da
|
|
665 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
666 ; GFX9-NEXT: ; return to shader part epilog
|
|
667 ;
|
|
668 ; GFX10-LABEL: getresinfo_2darraymsaa:
|
|
669 ; GFX10: ; %bb.0: ; %main_body
|
|
670 ; GFX10-NEXT: image_get_resinfo v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_2D_MSAA_ARRAY unorm a16
|
|
671 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
672 ; GFX10-NEXT: ; return to shader part epilog
|
|
673 main_body:
|
|
674 %mip = extractelement <2 x i16> %coords, i32 0
|
|
675 %v = call <4 x float> @llvm.amdgcn.image.getresinfo.2darraymsaa.v4f32.i16(i32 15, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
676 ret <4 x float> %v
|
|
677 }
|
|
678
|
|
679 define amdgpu_ps float @load_1d_V1(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
680 ; GFX9-LABEL: load_1d_V1:
|
|
681 ; GFX9: ; %bb.0: ; %main_body
|
|
682 ; GFX9-NEXT: image_load v0, v0, s[0:7] dmask:0x8 unorm a16
|
|
683 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
684 ; GFX9-NEXT: ; return to shader part epilog
|
|
685 ;
|
|
686 ; GFX10-LABEL: load_1d_V1:
|
|
687 ; GFX10: ; %bb.0: ; %main_body
|
|
688 ; GFX10-NEXT: image_load v0, v0, s[0:7] dmask:0x8 dim:SQ_RSRC_IMG_1D unorm a16
|
|
689 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
690 ; GFX10-NEXT: ; return to shader part epilog
|
|
691 main_body:
|
|
692 %s = extractelement <2 x i16> %coords, i32 0
|
|
693 %v = call float @llvm.amdgcn.image.load.1d.f32.i16(i32 8, i16 %s, <8 x i32> %rsrc, i32 0, i32 0)
|
|
694 ret float %v
|
|
695 }
|
|
696
|
|
697 define amdgpu_ps <2 x float> @load_1d_V2(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
698 ; GFX9-LABEL: load_1d_V2:
|
|
699 ; GFX9: ; %bb.0: ; %main_body
|
|
700 ; GFX9-NEXT: image_load v[0:1], v0, s[0:7] dmask:0x9 unorm a16
|
|
701 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
702 ; GFX9-NEXT: ; return to shader part epilog
|
|
703 ;
|
|
704 ; GFX10-LABEL: load_1d_V2:
|
|
705 ; GFX10: ; %bb.0: ; %main_body
|
|
706 ; GFX10-NEXT: image_load v[0:1], v0, s[0:7] dmask:0x9 dim:SQ_RSRC_IMG_1D unorm a16
|
|
707 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
708 ; GFX10-NEXT: ; return to shader part epilog
|
|
709 main_body:
|
|
710 %s = extractelement <2 x i16> %coords, i32 0
|
|
711 %v = call <2 x float> @llvm.amdgcn.image.load.1d.v2f32.i16(i32 9, i16 %s, <8 x i32> %rsrc, i32 0, i32 0)
|
|
712 ret <2 x float> %v
|
|
713 }
|
|
714
|
|
715 define amdgpu_ps void @store_1d_V1(<8 x i32> inreg %rsrc, float %vdata, <2 x i16> %coords) {
|
|
716 ; GFX9-LABEL: store_1d_V1:
|
|
717 ; GFX9: ; %bb.0: ; %main_body
|
|
718 ; GFX9-NEXT: image_store v0, v1, s[0:7] dmask:0x2 unorm a16
|
|
719 ; GFX9-NEXT: s_endpgm
|
|
720 ;
|
|
721 ; GFX10-LABEL: store_1d_V1:
|
|
722 ; GFX10: ; %bb.0: ; %main_body
|
|
723 ; GFX10-NEXT: image_store v0, v1, s[0:7] dmask:0x2 dim:SQ_RSRC_IMG_1D unorm a16
|
|
724 ; GFX10-NEXT: s_endpgm
|
|
725 main_body:
|
|
726 %s = extractelement <2 x i16> %coords, i32 0
|
|
727 call void @llvm.amdgcn.image.store.1d.f32.i16(float %vdata, i32 2, i16 %s, <8 x i32> %rsrc, i32 0, i32 0)
|
|
728 ret void
|
|
729 }
|
|
730
|
|
731 define amdgpu_ps void @store_1d_V2(<8 x i32> inreg %rsrc, <2 x float> %vdata, <2 x i16> %coords) {
|
|
732 ; GFX9-LABEL: store_1d_V2:
|
|
733 ; GFX9: ; %bb.0: ; %main_body
|
|
734 ; GFX9-NEXT: image_store v[0:1], v2, s[0:7] dmask:0xc unorm a16
|
|
735 ; GFX9-NEXT: s_endpgm
|
|
736 ;
|
|
737 ; GFX10-LABEL: store_1d_V2:
|
|
738 ; GFX10: ; %bb.0: ; %main_body
|
|
739 ; GFX10-NEXT: image_store v[0:1], v2, s[0:7] dmask:0xc dim:SQ_RSRC_IMG_1D unorm a16
|
|
740 ; GFX10-NEXT: s_endpgm
|
|
741 main_body:
|
|
742 %s = extractelement <2 x i16> %coords, i32 0
|
|
743 call void @llvm.amdgcn.image.store.1d.v2f32.i16(<2 x float> %vdata, i32 12, i16 %s, <8 x i32> %rsrc, i32 0, i32 0)
|
|
744 ret void
|
|
745 }
|
|
746
|
|
747 define amdgpu_ps <4 x float> @load_1d_glc(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
748 ; GFX9-LABEL: load_1d_glc:
|
|
749 ; GFX9: ; %bb.0: ; %main_body
|
|
750 ; GFX9-NEXT: image_load v[0:3], v0, s[0:7] dmask:0xf unorm glc a16
|
|
751 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
752 ; GFX9-NEXT: ; return to shader part epilog
|
|
753 ;
|
|
754 ; GFX10-LABEL: load_1d_glc:
|
|
755 ; GFX10: ; %bb.0: ; %main_body
|
|
756 ; GFX10-NEXT: image_load v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D unorm glc a16
|
|
757 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
758 ; GFX10-NEXT: ; return to shader part epilog
|
|
759 main_body:
|
|
760 %s = extractelement <2 x i16> %coords, i32 0
|
|
761 %v = call <4 x float> @llvm.amdgcn.image.load.1d.v4f32.i16(i32 15, i16 %s, <8 x i32> %rsrc, i32 0, i32 1)
|
|
762 ret <4 x float> %v
|
|
763 }
|
|
764
|
|
765 define amdgpu_ps <4 x float> @load_1d_slc(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
766 ; GFX9-LABEL: load_1d_slc:
|
|
767 ; GFX9: ; %bb.0: ; %main_body
|
|
768 ; GFX9-NEXT: image_load v[0:3], v0, s[0:7] dmask:0xf unorm slc a16
|
|
769 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
770 ; GFX9-NEXT: ; return to shader part epilog
|
|
771 ;
|
|
772 ; GFX10-LABEL: load_1d_slc:
|
|
773 ; GFX10: ; %bb.0: ; %main_body
|
|
774 ; GFX10-NEXT: image_load v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D unorm slc a16
|
|
775 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
776 ; GFX10-NEXT: ; return to shader part epilog
|
|
777 main_body:
|
|
778 %s = extractelement <2 x i16> %coords, i32 0
|
|
779 %v = call <4 x float> @llvm.amdgcn.image.load.1d.v4f32.i16(i32 15, i16 %s, <8 x i32> %rsrc, i32 0, i32 2)
|
|
780 ret <4 x float> %v
|
|
781 }
|
|
782
|
|
783 define amdgpu_ps <4 x float> @load_1d_glc_slc(<8 x i32> inreg %rsrc, <2 x i16> %coords) {
|
|
784 ; GFX9-LABEL: load_1d_glc_slc:
|
|
785 ; GFX9: ; %bb.0: ; %main_body
|
|
786 ; GFX9-NEXT: image_load v[0:3], v0, s[0:7] dmask:0xf unorm glc slc a16
|
|
787 ; GFX9-NEXT: s_waitcnt vmcnt(0)
|
|
788 ; GFX9-NEXT: ; return to shader part epilog
|
|
789 ;
|
|
790 ; GFX10-LABEL: load_1d_glc_slc:
|
|
791 ; GFX10: ; %bb.0: ; %main_body
|
|
792 ; GFX10-NEXT: image_load v[0:3], v0, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D unorm glc slc a16
|
|
793 ; GFX10-NEXT: s_waitcnt vmcnt(0)
|
|
794 ; GFX10-NEXT: ; return to shader part epilog
|
|
795 main_body:
|
|
796 %s = extractelement <2 x i16> %coords, i32 0
|
|
797 %v = call <4 x float> @llvm.amdgcn.image.load.1d.v4f32.i16(i32 15, i16 %s, <8 x i32> %rsrc, i32 0, i32 3)
|
|
798 ret <4 x float> %v
|
|
799 }
|
|
800
|
|
801 define amdgpu_ps void @store_1d_glc(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords) {
|
|
802 ; GFX9-LABEL: store_1d_glc:
|
|
803 ; GFX9: ; %bb.0: ; %main_body
|
|
804 ; GFX9-NEXT: image_store v[0:3], v4, s[0:7] dmask:0xf unorm glc a16
|
|
805 ; GFX9-NEXT: s_endpgm
|
|
806 ;
|
|
807 ; GFX10-LABEL: store_1d_glc:
|
|
808 ; GFX10: ; %bb.0: ; %main_body
|
|
809 ; GFX10-NEXT: image_store v[0:3], v4, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D unorm glc a16
|
|
810 ; GFX10-NEXT: s_endpgm
|
|
811 main_body:
|
|
812 %s = extractelement <2 x i16> %coords, i32 0
|
|
813 call void @llvm.amdgcn.image.store.1d.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, <8 x i32> %rsrc, i32 0, i32 1)
|
|
814 ret void
|
|
815 }
|
|
816
|
|
817 define amdgpu_ps void @store_1d_slc(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords) {
|
|
818 ; GFX9-LABEL: store_1d_slc:
|
|
819 ; GFX9: ; %bb.0: ; %main_body
|
|
820 ; GFX9-NEXT: image_store v[0:3], v4, s[0:7] dmask:0xf unorm slc a16
|
|
821 ; GFX9-NEXT: s_endpgm
|
|
822 ;
|
|
823 ; GFX10-LABEL: store_1d_slc:
|
|
824 ; GFX10: ; %bb.0: ; %main_body
|
|
825 ; GFX10-NEXT: image_store v[0:3], v4, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D unorm slc a16
|
|
826 ; GFX10-NEXT: s_endpgm
|
|
827 main_body:
|
|
828 %s = extractelement <2 x i16> %coords, i32 0
|
|
829 call void @llvm.amdgcn.image.store.1d.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, <8 x i32> %rsrc, i32 0, i32 2)
|
|
830 ret void
|
|
831 }
|
|
832
|
|
833 define amdgpu_ps void @store_1d_glc_slc(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords) {
|
|
834 ; GFX9-LABEL: store_1d_glc_slc:
|
|
835 ; GFX9: ; %bb.0: ; %main_body
|
|
836 ; GFX9-NEXT: image_store v[0:3], v4, s[0:7] dmask:0xf unorm glc slc a16
|
|
837 ; GFX9-NEXT: s_endpgm
|
|
838 ;
|
|
839 ; GFX10-LABEL: store_1d_glc_slc:
|
|
840 ; GFX10: ; %bb.0: ; %main_body
|
|
841 ; GFX10-NEXT: image_store v[0:3], v4, s[0:7] dmask:0xf dim:SQ_RSRC_IMG_1D unorm glc slc a16
|
|
842 ; GFX10-NEXT: s_endpgm
|
|
843 main_body:
|
|
844 %s = extractelement <2 x i16> %coords, i32 0
|
|
845 call void @llvm.amdgcn.image.store.1d.v4f32.i16(<4 x float> %vdata, i32 15, i16 %s, <8 x i32> %rsrc, i32 0, i32 3)
|
|
846 ret void
|
|
847 }
|
|
848
|
|
849 define amdgpu_ps <4 x float> @getresinfo_dmask0(<8 x i32> inreg %rsrc, <4 x float> %vdata, <2 x i16> %coords) #0 {
|
|
850 ; GFX9-LABEL: getresinfo_dmask0:
|
|
851 ; GFX9: ; %bb.0: ; %main_body
|
|
852 ; GFX9-NEXT: ; return to shader part epilog
|
|
853 ;
|
|
854 ; GFX10-LABEL: getresinfo_dmask0:
|
|
855 ; GFX10: ; %bb.0: ; %main_body
|
|
856 ; GFX10-NEXT: ; return to shader part epilog
|
|
857 main_body:
|
|
858 %mip = extractelement <2 x i16> %coords, i32 0
|
|
859 %r = call <4 x float> @llvm.amdgcn.image.getresinfo.1d.v4f32.i16(i32 0, i16 %mip, <8 x i32> %rsrc, i32 0, i32 0)
|
|
860 ret <4 x float> %r
|
|
861 }
|
|
862
|
|
863 declare <4 x float> @llvm.amdgcn.image.load.1d.v4f32.i16(i32, i16, <8 x i32>, i32, i32) #1
|
|
864 declare <4 x float> @llvm.amdgcn.image.load.2d.v4f32.i16(i32, i16, i16, <8 x i32>, i32, i32) #1
|
|
865 declare <4 x float> @llvm.amdgcn.image.load.3d.v4f32.i16(i32, i16, i16, i16, <8 x i32>, i32, i32) #1
|
|
866 declare <4 x float> @llvm.amdgcn.image.load.cube.v4f32.i16(i32, i16, i16, i16, <8 x i32>, i32, i32) #1
|
|
867 declare <4 x float> @llvm.amdgcn.image.load.1darray.v4f32.i16(i32, i16, i16, <8 x i32>, i32, i32) #1
|
|
868 declare <4 x float> @llvm.amdgcn.image.load.2darray.v4f32.i16(i32, i16, i16, i16, <8 x i32>, i32, i32) #1
|
|
869 declare <4 x float> @llvm.amdgcn.image.load.2dmsaa.v4f32.i16(i32, i16, i16, i16, <8 x i32>, i32, i32) #1
|
|
870 declare <4 x float> @llvm.amdgcn.image.load.2darraymsaa.v4f32.i16(i32, i16, i16, i16, i16, <8 x i32>, i32, i32) #1
|
|
871
|
|
872 declare <4 x float> @llvm.amdgcn.image.load.mip.1d.v4f32.i16(i32, i16, i16, <8 x i32>, i32, i32) #1
|
|
873 declare <4 x float> @llvm.amdgcn.image.load.mip.2d.v4f32.i16(i32, i16, i16, i16, <8 x i32>, i32, i32) #1
|
|
874 declare <4 x float> @llvm.amdgcn.image.load.mip.3d.v4f32.i16(i32, i16, i16, i16, i16, <8 x i32>, i32, i32) #1
|
|
875 declare <4 x float> @llvm.amdgcn.image.load.mip.cube.v4f32.i16(i32, i16, i16, i16, i16, <8 x i32>, i32, i32) #1
|
|
876 declare <4 x float> @llvm.amdgcn.image.load.mip.1darray.v4f32.i16(i32, i16, i16, i16, <8 x i32>, i32, i32) #1
|
|
877 declare <4 x float> @llvm.amdgcn.image.load.mip.2darray.v4f32.i16(i32, i16, i16, i16, i16, <8 x i32>, i32, i32) #1
|
|
878
|
|
879 declare void @llvm.amdgcn.image.store.1d.v4f32.i16(<4 x float>, i32, i16, <8 x i32>, i32, i32) #0
|
|
880 declare void @llvm.amdgcn.image.store.2d.v4f32.i16(<4 x float>, i32, i16, i16, <8 x i32>, i32, i32) #0
|
|
881 declare void @llvm.amdgcn.image.store.3d.v4f32.i16(<4 x float>, i32, i16, i16, i16, <8 x i32>, i32, i32) #0
|
|
882 declare void @llvm.amdgcn.image.store.cube.v4f32.i16(<4 x float>, i32, i16, i16, i16, <8 x i32>, i32, i32) #0
|
|
883 declare void @llvm.amdgcn.image.store.1darray.v4f32.i16(<4 x float>, i32, i16, i16, <8 x i32>, i32, i32) #0
|
|
884 declare void @llvm.amdgcn.image.store.2darray.v4f32.i16(<4 x float>, i32, i16, i16, i16, <8 x i32>, i32, i32) #0
|
|
885 declare void @llvm.amdgcn.image.store.2dmsaa.v4f32.i16(<4 x float>, i32, i16, i16, i16, <8 x i32>, i32, i32) #0
|
|
886 declare void @llvm.amdgcn.image.store.2darraymsaa.v4f32.i16(<4 x float>, i32, i16, i16, i16, i16, <8 x i32>, i32, i32) #0
|
|
887
|
|
888 declare void @llvm.amdgcn.image.store.mip.1d.v4f32.i16(<4 x float>, i32, i16, i16, <8 x i32>, i32, i32) #0
|
|
889 declare void @llvm.amdgcn.image.store.mip.2d.v4f32.i16(<4 x float>, i32, i16, i16, i16, <8 x i32>, i32, i32) #0
|
|
890 declare void @llvm.amdgcn.image.store.mip.3d.v4f32.i16(<4 x float>, i32, i16, i16, i16, i16, <8 x i32>, i32, i32) #0
|
|
891 declare void @llvm.amdgcn.image.store.mip.cube.v4f32.i16(<4 x float>, i32, i16, i16, i16, i16, <8 x i32>, i32, i32) #0
|
|
892 declare void @llvm.amdgcn.image.store.mip.1darray.v4f32.i16(<4 x float>, i32, i16, i16, i16, <8 x i32>, i32, i32) #0
|
|
893 declare void @llvm.amdgcn.image.store.mip.2darray.v4f32.i16(<4 x float>, i32, i16, i16, i16, i16, <8 x i32>, i32, i32) #0
|
|
894
|
|
895 declare <4 x float> @llvm.amdgcn.image.getresinfo.1d.v4f32.i16(i32, i16, <8 x i32>, i32, i32) #2
|
|
896 declare <4 x float> @llvm.amdgcn.image.getresinfo.2d.v4f32.i16(i32, i16, <8 x i32>, i32, i32) #2
|
|
897 declare <4 x float> @llvm.amdgcn.image.getresinfo.3d.v4f32.i16(i32, i16, <8 x i32>, i32, i32) #2
|
|
898 declare <4 x float> @llvm.amdgcn.image.getresinfo.cube.v4f32.i16(i32, i16, <8 x i32>, i32, i32) #2
|
|
899 declare <4 x float> @llvm.amdgcn.image.getresinfo.1darray.v4f32.i16(i32, i16, <8 x i32>, i32, i32) #2
|
|
900 declare <4 x float> @llvm.amdgcn.image.getresinfo.2darray.v4f32.i16(i32, i16, <8 x i32>, i32, i32) #2
|
|
901 declare <4 x float> @llvm.amdgcn.image.getresinfo.2dmsaa.v4f32.i16(i32, i16, <8 x i32>, i32, i32) #2
|
|
902 declare <4 x float> @llvm.amdgcn.image.getresinfo.2darraymsaa.v4f32.i16(i32, i16, <8 x i32>, i32, i32) #2
|
|
903
|
|
904 declare float @llvm.amdgcn.image.load.1d.f32.i16(i32, i16, <8 x i32>, i32, i32) #1
|
|
905 declare float @llvm.amdgcn.image.load.2d.f32.i16(i32, i16, i16, <8 x i32>, i32, i32) #1
|
|
906 declare <2 x float> @llvm.amdgcn.image.load.1d.v2f32.i16(i32, i16, <8 x i32>, i32, i32) #1
|
|
907 declare void @llvm.amdgcn.image.store.1d.f32.i16(float, i32, i16, <8 x i32>, i32, i32) #0
|
|
908 declare void @llvm.amdgcn.image.store.1d.v2f32.i16(<2 x float>, i32, i16, <8 x i32>, i32, i32) #0
|
|
909
|
|
910 attributes #0 = { nounwind }
|
|
911 attributes #1 = { nounwind readonly }
|
|
912 attributes #2 = { nounwind readnone }
|