; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s
; RUN: llc -march=amdgcn -mcpu=tonga -global-isel -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s

; Intrinsic exercised by the functions in this file: three i32 operands in,
; one i32 result out. Attribute group #0 is attached to the declaration.
declare i32 @llvm.amdgcn.perm(i32, i32, i32) #0
|
|
5
|
|
; Case: all three permute operands are plain (non-inreg) i32 arguments.
; The directive below expects them to show up as v0, v1 and v2, in argument
; order, on the emitted v_perm_b32.
; GCN-LABEL: {{^}}v_perm_b32_v_v_v:
; GCN: v_perm_b32 v{{[0-9]+}}, v0, v1, v2
define amdgpu_ps void @v_perm_b32_v_v_v(
    i32 %src1,
    i32 %src2,
    i32 %src3,
    ptr addrspace(1) %out) #1 {
  ; Pass the three arguments straight through to the intrinsic.
  %permuted = call i32 @llvm.amdgcn.perm(i32 %src1, i32 %src2, i32 %src3) #0
  ; Store the result through %out (presumably so the call is not dropped as
  ; unused -- confirm if this matters for the test).
  store i32 %permuted, ptr addrspace(1) %out
  ret void
}
|
|
13
|
|
; Case: the first two operands are plain i32 arguments and the third is the
; constant 12345. The directive below expects v0 and v1 for the first two
; sources and accepts either a vector or a scalar register for the third.
; GCN-LABEL: {{^}}v_perm_b32_v_v_c:
; GCN: v_perm_b32 v{{[0-9]+}}, v0, v1, {{[vs][0-9]+}}
define amdgpu_ps void @v_perm_b32_v_v_c(
    i32 %src1,
    i32 %src2,
    ptr addrspace(1) %out) #1 {
  ; The third operand is the immediate 12345 rather than an argument.
  %permuted = call i32 @llvm.amdgcn.perm(i32 %src1, i32 %src2, i32 12345) #0
  ; Store the result through %out.
  store i32 %permuted, ptr addrspace(1) %out
  ret void
}
|
|
21
|
|
; Case: the first operand is an inreg argument, the second a plain argument,
; and the third the constant 12345. The directive below expects s0 for the
; first source, v0 for the second, and a vector register for the third.
; GCN-LABEL: {{^}}v_perm_b32_s_v_c:
; GCN: v_perm_b32 v{{[0-9]+}}, s0, v0, v{{[0-9]+}}
define amdgpu_ps void @v_perm_b32_s_v_c(
    i32 inreg %src1,
    i32 %src2,
    ptr addrspace(1) %out) #1 {
  ; %src1 is the inreg operand; the third operand is the immediate 12345.
  %permuted = call i32 @llvm.amdgcn.perm(i32 %src1, i32 %src2, i32 12345) #0
  ; Store the result through %out.
  store i32 %permuted, ptr addrspace(1) %out
  ret void
}
|
|
29
|
|
; Case: both data operands are inreg arguments and the third operand is the
; constant 12345. The directive below expects only the first source to stay
; scalar (s0); the second and third are expected in vector registers.
; NOTE(review): presumably this reflects a limit on scalar operands per
; instruction on this target -- confirm against the target's operand rules.
; GCN-LABEL: {{^}}v_perm_b32_s_s_c:
; GCN: v_perm_b32 v{{[0-9]+}}, s0, v{{[0-9]+}}, v{{[0-9]+}}
define amdgpu_ps void @v_perm_b32_s_s_c(
    i32 inreg %src1,
    i32 inreg %src2,
    ptr addrspace(1) %out) #1 {
  ; Both %src1 and %src2 are inreg; the third operand is the immediate 12345.
  %permuted = call i32 @llvm.amdgcn.perm(i32 %src1, i32 %src2, i32 12345) #0
  ; Store the result through %out.
  store i32 %permuted, ptr addrspace(1) %out
  ret void
}
|
|
37
|
|
; Case: the first operand is a plain argument, the second an inreg argument,
; and the third the constant 1. The directive below expects v0 and s0 for the
; first two sources and the literal 1 written directly as the third operand.
; GCN-LABEL: {{^}}v_perm_b32_v_s_i:
; GCN: v_perm_b32 v{{[0-9]+}}, v0, s0, 1
define amdgpu_ps void @v_perm_b32_v_s_i(
    i32 %src1,
    i32 inreg %src2,
    ptr addrspace(1) %out) #1 {
  ; %src2 is the inreg operand; the third operand is the immediate 1.
  %permuted = call i32 @llvm.amdgcn.perm(i32 %src1, i32 %src2, i32 1) #0
  ; Store the result through %out.
  store i32 %permuted, ptr addrspace(1) %out
  ret void
}
|
|
45
|
|
; Attribute group #0: referenced by the llvm.amdgcn.perm declaration and by
; each call to it.
attributes #0 = { nounwind readnone }
; Attribute group #1: referenced by every test function definition.
attributes #1 = { nounwind }