207
|
1 # RUN: llc -march=amdgcn -mcpu=gfx1010 -run-pass=si-peephole-sdwa -verify-machineinstrs -o - %s | FileCheck -check-prefix=GCN %s
|
|
2
|
|
3 # Check that si-peephole-sdwa does not fold stack object operands (%stack.N) into SDWA instructions.
|
|
4
|
|
5 ---
|
|
# Case src0: the stack object %stack.0 is the first source operand of the
# V_ADD_U32_e64 and the masked value %1 (killed) is the second. The check line
# below expects the add to remain V_ADD_U32_e64 with the same two operands in
# the same order after the pass has run.
# NOTE(review): the AND with 255 presumably makes %1 a byte-select candidate
# for the SDWA peephole, which is what would trigger a conversion - confirm
# against the pass implementation.
6 # GCN-LABEL: name: sdwa_stack_object_src0
|
|
7 # GCN: V_ADD_U32_e64 %stack.0, killed %1
|
|
8 name: sdwa_stack_object_src0
|
|
9 stack:
|
|
10 - { id: 0, type: default, offset: 0, size: 32, alignment: 4, stack-id: default }
|
|
11 body: |
|
|
12 bb.0:
|
|
13 %0:vgpr_32 = IMPLICIT_DEF
|
|
14 %1:vgpr_32 = V_AND_B32_e32 255, %0, implicit $exec
|
|
15 %2:vgpr_32 = V_ADD_U32_e64 %stack.0, killed %1, 0, implicit $exec
|
|
16 S_ENDPGM 0, implicit %2
|
|
17
|
|
18 ...
|
|
19 ---
|
|
# Case src1: same instruction sequence as sdwa_stack_object_src0 but with the
# operands swapped - the masked value %1 (killed) is the first source operand
# of the V_ADD_U32_e64 and the stack object %stack.0 is the second. The check
# line below expects the add to remain V_ADD_U32_e64 with that operand order
# after the pass has run.
# NOTE(review): the AND with 255 presumably makes %1 a byte-select candidate
# for the SDWA peephole - confirm against the pass implementation.
20 name: sdwa_stack_object_src1
|
|
21 # GCN-LABEL: name: sdwa_stack_object_src1
|
|
22 # GCN: V_ADD_U32_e64 killed %1, %stack.0
|
|
23 stack:
|
|
24 - { id: 0, type: default, offset: 0, size: 32, alignment: 4, stack-id: default }
|
|
25 body: |
|
|
26 bb.0:
|
|
27 %0:vgpr_32 = IMPLICIT_DEF
|
|
28 %1:vgpr_32 = V_AND_B32_e32 255, %0, implicit $exec
|
|
29 %2:vgpr_32 = V_ADD_U32_e64 killed %1, %stack.0, 0, implicit $exec
|
|
30 S_ENDPGM 0, implicit %2
|
|
31
|
|
32 ...
|