view llvm/test/CodeGen/AMDGPU/expand-si-indirect.mir @ 223:5f17cb93ff66 llvm-original

LLVM13 (2021/7/18)
author Shinji KONO <kono@ie.u-ryukyu.ac.jp>
date Sun, 18 Jul 2021 22:43:00 +0900
parents 79ff65ed7e25
children
line wrap: on
line source

# RUN: llc -march=amdgcn -mcpu=gfx900 -start-before=twoaddressinstruction %s -o - | FileCheck %s -check-prefix=GCN

# Wait to sxpand SI_INDIRECT sequences that use VGPR indexing until after
# register allocation. We don’t want to reschedule the mode switching or to
# have any instructions inserted within the sequence. The Two-Address
# instruction pass could insert bad copies here if it is expanded too early.

---
# GCN-LABEL: expand_si_indirect
# GCN: s_set_gpr_idx_on
# GCN-NEXT: v_mov_b32_e32
# GCN-NEXT: s_set_gpr_idx_off

# GCN: s_set_gpr_idx_on
# GCN-NEXT: v_mov_b32_e32
# GCN-NOT: v_mov_b32_e32
# GCN-NEXT: s_set_gpr_idx_off

name: expand_si_indirect
tracksRegLiveness: true
body:             |
  bb.0.entry:
    liveins: $sgpr0_sgpr1

    %0:sgpr_64 = COPY killed $sgpr0_sgpr1
    %1:vgpr_32 = V_MOV_B32_e32 0, implicit $exec
    %2:sreg_64_xexec = S_LOAD_DWORDX2_IMM %0(p4), 36, 0
    %3:sreg_32_xm0_xexec = S_LOAD_DWORD_IMM killed %0(p4), 44, 0
    %4:sreg_32 = S_ADD_I32 %3, 1, implicit-def dead $scc
    %5:vgpr_32 = V_MOV_B32_e32 1065353216, implicit $exec
    %6:vgpr_32 = V_MOV_B32_e32 1073741824, implicit $exec
    %7:vgpr_32 = V_MOV_B32_e32 1077936128, implicit $exec
    %8:vgpr_32 = V_MOV_B32_e32 1082130432, implicit $exec
    %9:vgpr_32 = V_MOV_B32_e32 1084227584, implicit $exec
    %10:vgpr_32 = V_MOV_B32_e32 1086324736, implicit $exec
    %11:vgpr_32 = V_MOV_B32_e32 1088421888, implicit $exec
    %12:vgpr_32 = V_MOV_B32_e32 1090519040, implicit $exec
    %13:vgpr_32 = V_MOV_B32_e32 1091567616, implicit $exec
    %14:vgpr_32 = V_MOV_B32_e32 1092616192, implicit $exec
    %15:vgpr_32 = V_MOV_B32_e32 1093664768, implicit $exec
    %16:vgpr_32 = V_MOV_B32_e32 1094713344, implicit $exec
    %17:vgpr_32 = V_MOV_B32_e32 1095761920, implicit $exec
    %18:vgpr_32 = V_MOV_B32_e32 1096810496, implicit $exec
    %19:vgpr_32 = V_MOV_B32_e32 1097859072, implicit $exec
    %20:vgpr_32 = V_MOV_B32_e32 1098907648, implicit $exec
    %21:vreg_512 = REG_SEQUENCE killed %5, %subreg.sub0, killed %6, %subreg.sub1, killed %7, %subreg.sub2, killed %8, %subreg.sub3, killed %9, %subreg.sub4, killed %10, %subreg.sub5, killed %11, %subreg.sub6, killed %12, %subreg.sub7, killed %13, %subreg.sub8, killed %14, %subreg.sub9, killed %15, %subreg.sub10, killed %16, %subreg.sub11, killed %17, %subreg.sub12, killed %18, %subreg.sub13, killed %19, %subreg.sub14, killed %20, %subreg.sub15
    %22:vgpr_32 = V_MOV_B32_e32 1099431936, implicit $exec
    %23:vreg_512 = V_INDIRECT_REG_WRITE_GPR_IDX_B32_V16 killed %21, %22, killed %4, 3, implicit-def $m0, implicit $m0, implicit $exec
    %24:sreg_32 = S_ADD_I32 killed %3, 2, implicit-def dead $scc
    %25:vreg_512 = V_INDIRECT_REG_WRITE_GPR_IDX_B32_V16 %23, killed %22, killed %24, 3, implicit-def $m0, implicit $m0, implicit $exec
    %26:vgpr_32 = COPY %23.sub15
    %27:vgpr_32 = COPY %23.sub14
    %28:vgpr_32 = COPY %23.sub13
    %29:vgpr_32 = COPY %23.sub12
    %30:vreg_128 = REG_SEQUENCE killed %29, %subreg.sub0, killed %28, %subreg.sub1, killed %27, %subreg.sub2, killed %26, %subreg.sub3
    GLOBAL_STORE_DWORDX4_SADDR %1, killed %30, %2, 48, 0, implicit $exec
    %31:vgpr_32 = COPY %23.sub11
    %32:vgpr_32 = COPY %23.sub10
    %33:vgpr_32 = COPY %23.sub9
    %34:vgpr_32 = COPY %23.sub8
    %35:vreg_128 = REG_SEQUENCE killed %34, %subreg.sub0, killed %33, %subreg.sub1, killed %32, %subreg.sub2, killed %31, %subreg.sub3
    GLOBAL_STORE_DWORDX4_SADDR %1, killed %35, %2, 32, 0, implicit $exec
    %36:vgpr_32 = COPY %23.sub7
    %37:vgpr_32 = COPY %23.sub6
    %38:vgpr_32 = COPY %23.sub5
    %39:vgpr_32 = COPY %23.sub4
    %40:vreg_128 = REG_SEQUENCE killed %39, %subreg.sub0, killed %38, %subreg.sub1, killed %37, %subreg.sub2, killed %36, %subreg.sub3
    GLOBAL_STORE_DWORDX4_SADDR %1, killed %40, %2, 16, 0, implicit $exec
    %41:vgpr_32 = COPY %23.sub3
    %42:vgpr_32 = COPY %23.sub2
    %43:vgpr_32 = COPY %23.sub1
    %44:vgpr_32 = COPY killed %23.sub0
    %45:vreg_128 = REG_SEQUENCE killed %44, %subreg.sub0, killed %43, %subreg.sub1, killed %42, %subreg.sub2, killed %41, %subreg.sub3
    GLOBAL_STORE_DWORDX4_SADDR %1, killed %45, %2, 0, 0, implicit $exec
    %46:vgpr_32 = COPY %25.sub15
    %47:vgpr_32 = COPY %25.sub14
    %48:vgpr_32 = COPY %25.sub13
    %49:vgpr_32 = COPY %25.sub12
    %50:vreg_128 = REG_SEQUENCE killed %49, %subreg.sub0, killed %48, %subreg.sub1, killed %47, %subreg.sub2, killed %46, %subreg.sub3
    GLOBAL_STORE_DWORDX4_SADDR %1, killed %50, %2, 112, 0, implicit $exec
    %51:vgpr_32 = COPY %25.sub11
    %52:vgpr_32 = COPY %25.sub10
    %53:vgpr_32 = COPY %25.sub9
    %54:vgpr_32 = COPY %25.sub8
    %55:vreg_128 = REG_SEQUENCE killed %54, %subreg.sub0, killed %53, %subreg.sub1, killed %52, %subreg.sub2, killed %51, %subreg.sub3
    GLOBAL_STORE_DWORDX4_SADDR %1, killed %55, %2, 96, 0, implicit $exec
    %56:vgpr_32 = COPY %25.sub7
    %57:vgpr_32 = COPY %25.sub6
    %58:vgpr_32 = COPY %25.sub5
    %59:vgpr_32 = COPY %25.sub4
    %60:vreg_128 = REG_SEQUENCE killed %59, %subreg.sub0, killed %58, %subreg.sub1, killed %57, %subreg.sub2, killed %56, %subreg.sub3
    GLOBAL_STORE_DWORDX4_SADDR %1, killed %60, %2, 80, 0, implicit $exec
    %61:vgpr_32 = COPY %25.sub3
    %62:vgpr_32 = COPY %25.sub2
    %63:vgpr_32 = COPY %25.sub1
    %64:vgpr_32 = COPY killed %25.sub0
    %65:vreg_128 = REG_SEQUENCE killed %64, %subreg.sub0, killed %63, %subreg.sub1, killed %62, %subreg.sub2, killed %61, %subreg.sub3
    GLOBAL_STORE_DWORDX4_SADDR killed %1, killed %65, killed %2, 64, 0, implicit $exec
    S_ENDPGM 0

...