103 lines
5.5 KiB
YAML
103 lines
5.5 KiB
YAML
# RUN: llc -march=amdgcn -mcpu=gfx900 -start-before=twoaddressinstruction %s -o - | FileCheck %s -check-prefix=GCN
|
||
|
||
# Wait to expand SI_INDIRECT sequences that use VGPR indexing until after
|
||
# register allocation. We don’t want to reschedule the mode switching or to
|
||
# have any instructions inserted within the sequence. The Two-Address
|
||
# instruction pass could insert bad copies here if the sequence is expanded too early.
|
||
|
||
---
|
||
# GCN-LABEL: expand_si_indirect
|
||
# GCN: s_set_gpr_idx_on
|
||
# GCN-NEXT: v_mov_b32_e32
|
||
# GCN-NEXT: s_set_gpr_idx_off
|
||
|
||
# GCN: s_set_gpr_idx_on
|
||
# GCN-NEXT: v_mov_b32_e32
|
||
# GCN-NOT: v_mov_b32_e32
|
||
# GCN-NEXT: s_set_gpr_idx_off
|
||
|
||
# Machine function under test. It consists of a single basic block
# (bb.0.entry) whose only live-in is the 64-bit SGPR pair $sgpr0_sgpr1, and it
# is written with virtual registers and explicit kill flags
# (tracksRegLiveness is enabled).
name: expand_si_indirect
|
||
tracksRegLiveness: true
|
||
body: |
|
||
bb.0.entry:
|
||
liveins: $sgpr0_sgpr1
|
||
|
||
; Set-up for the indirect writes.
;   %0  - copy of the live-in SGPR pair, used as the base of both scalar loads.
;   %1  - VGPR holding 0; used later as an address operand of every store.
;   %2  - 64-bit scalar load from %0 with immediate 36; used later as the
;         scalar address operand of every store.
;   %3  - 32-bit scalar load from %0 with immediate 44; the dynamic index base.
;   %4  - %3 + 1, the index operand of the first indirect write.
; NOTE(review): the immediates 36 and 44 are presumably byte offsets - confirm
; against the S_LOAD_*_IMM operand list for this LLVM revision.
%0:sgpr_64 = COPY killed $sgpr0_sgpr1
|
||
%1:vgpr_32 = V_MOV_B32_e32 0, implicit $exec
|
||
%2:sreg_64_xexec = S_LOAD_DWORDX2_IMM %0(p4), 36, 0, 0
|
||
%3:sreg_32_xm0_xexec = S_LOAD_DWORD_IMM killed %0(p4), 44, 0, 0
|
||
%4:sreg_32 = S_ADD_I32 %3, 1, implicit-def dead $scc
|
||
; %5..%20: sixteen 32-bit constants. Read as IEEE-754 single-precision bit
; patterns, the immediates are 1.0, 2.0, ..., 16.0 in order.
%5:vgpr_32 = V_MOV_B32_e32 1065353216, implicit $exec
|
||
%6:vgpr_32 = V_MOV_B32_e32 1073741824, implicit $exec
|
||
%7:vgpr_32 = V_MOV_B32_e32 1077936128, implicit $exec
|
||
%8:vgpr_32 = V_MOV_B32_e32 1082130432, implicit $exec
|
||
%9:vgpr_32 = V_MOV_B32_e32 1084227584, implicit $exec
|
||
%10:vgpr_32 = V_MOV_B32_e32 1086324736, implicit $exec
|
||
%11:vgpr_32 = V_MOV_B32_e32 1088421888, implicit $exec
|
||
%12:vgpr_32 = V_MOV_B32_e32 1090519040, implicit $exec
|
||
%13:vgpr_32 = V_MOV_B32_e32 1091567616, implicit $exec
|
||
%14:vgpr_32 = V_MOV_B32_e32 1092616192, implicit $exec
|
||
%15:vgpr_32 = V_MOV_B32_e32 1093664768, implicit $exec
|
||
%16:vgpr_32 = V_MOV_B32_e32 1094713344, implicit $exec
|
||
%17:vgpr_32 = V_MOV_B32_e32 1095761920, implicit $exec
|
||
%18:vgpr_32 = V_MOV_B32_e32 1096810496, implicit $exec
|
||
%19:vgpr_32 = V_MOV_B32_e32 1097859072, implicit $exec
|
||
%20:vgpr_32 = V_MOV_B32_e32 1098907648, implicit $exec
|
||
; Pack the sixteen constants into one 512-bit register tuple, %5 in sub0
; through %20 in sub15. Every source is killed here.
%21:vreg_512 = REG_SEQUENCE killed %5, %subreg.sub0, killed %6, %subreg.sub1, killed %7, %subreg.sub2, killed %8, %subreg.sub3, killed %9, %subreg.sub4, killed %10, %subreg.sub5, killed %11, %subreg.sub6, killed %12, %subreg.sub7, killed %13, %subreg.sub8, killed %14, %subreg.sub9, killed %15, %subreg.sub10, killed %16, %subreg.sub11, killed %17, %subreg.sub12, killed %18, %subreg.sub13, killed %19, %subreg.sub14, killed %20, %subreg.sub15
|
||
; %22 is passed to both indirect writes below; its immediate is the
; single-precision bit pattern of 17.0.
%22:vgpr_32 = V_MOV_B32_e32 1099431936, implicit $exec
|
||
; The two indirect-write pseudos this test is about. They are chained: the
; first takes the packed vector %21 and defines %23, the second takes %23 and
; defines %25. %23 is not killed by the second write because it is still read
; by the stores that follow. Both pseudos take %22 and list $m0 as an implicit
; def and implicit use, plus $exec as an implicit use.
; NOTE(review): operands look like (source vector, value to insert, index
; SGPR, subregister selector) - confirm against the pseudo's definition.
; The first write uses index %4 (%3 + 1).
%23:vreg_512 = V_INDIRECT_REG_WRITE_GPR_IDX_B32_V16 killed %21, %22, killed %4, 3, implicit-def $m0, implicit $m0, implicit $exec
|
||
; Index for the second write: %3 + 2. This is the last use of %3.
%24:sreg_32 = S_ADD_I32 killed %3, 2, implicit-def dead $scc
|
||
%25:vreg_512 = V_INDIRECT_REG_WRITE_GPR_IDX_B32_V16 %23, killed %22, killed %24, 3, implicit-def $m0, implicit $m0, implicit $exec
|
||
; Store the result of the first indirect write (%23) as four 128-bit pieces.
; Each group copies four consecutive subregisters of %23 (highest first),
; repacks them into a vreg_128 in ascending order, and stores that with %1 and
; %2 as the address operands. The immediate following %2 is 48, 32, 16 and 0
; for sub12-15, sub8-11, sub4-7 and sub0-3 respectively.
; NOTE(review): that immediate is presumably the byte offset - confirm against
; the GLOBAL_STORE_DWORDX4_SADDR operand list.
%26:vgpr_32 = COPY %23.sub15
|
||
%27:vgpr_32 = COPY %23.sub14
|
||
%28:vgpr_32 = COPY %23.sub13
|
||
%29:vgpr_32 = COPY %23.sub12
|
||
%30:vreg_128 = REG_SEQUENCE killed %29, %subreg.sub0, killed %28, %subreg.sub1, killed %27, %subreg.sub2, killed %26, %subreg.sub3
|
||
GLOBAL_STORE_DWORDX4_SADDR %1, killed %30, %2, 48, 0, 0, 0, implicit $exec
|
||
%31:vgpr_32 = COPY %23.sub11
|
||
%32:vgpr_32 = COPY %23.sub10
|
||
%33:vgpr_32 = COPY %23.sub9
|
||
%34:vgpr_32 = COPY %23.sub8
|
||
%35:vreg_128 = REG_SEQUENCE killed %34, %subreg.sub0, killed %33, %subreg.sub1, killed %32, %subreg.sub2, killed %31, %subreg.sub3
|
||
GLOBAL_STORE_DWORDX4_SADDR %1, killed %35, %2, 32, 0, 0, 0, implicit $exec
|
||
%36:vgpr_32 = COPY %23.sub7
|
||
%37:vgpr_32 = COPY %23.sub6
|
||
%38:vgpr_32 = COPY %23.sub5
|
||
%39:vgpr_32 = COPY %23.sub4
|
||
%40:vreg_128 = REG_SEQUENCE killed %39, %subreg.sub0, killed %38, %subreg.sub1, killed %37, %subreg.sub2, killed %36, %subreg.sub3
|
||
GLOBAL_STORE_DWORDX4_SADDR %1, killed %40, %2, 16, 0, 0, 0, implicit $exec
|
||
%41:vgpr_32 = COPY %23.sub3
|
||
%42:vgpr_32 = COPY %23.sub2
|
||
%43:vgpr_32 = COPY %23.sub1
|
||
; Last read of %23, hence the kill flag on this copy.
%44:vgpr_32 = COPY killed %23.sub0
|
||
%45:vreg_128 = REG_SEQUENCE killed %44, %subreg.sub0, killed %43, %subreg.sub1, killed %42, %subreg.sub2, killed %41, %subreg.sub3
|
||
GLOBAL_STORE_DWORDX4_SADDR %1, killed %45, %2, 0, 0, 0, 0, implicit $exec
|
||
; Store the result of the second indirect write (%25) in the same way as the
; first result: four groups of four subregister copies, each repacked into a
; vreg_128 and stored. The immediate following the %2 operand is 112, 96, 80
; and 64 for sub12-15, sub8-11, sub4-7 and sub0-3 respectively.
; NOTE(review): that immediate is presumably the byte offset - confirm against
; the GLOBAL_STORE_DWORDX4_SADDR operand list.
%46:vgpr_32 = COPY %25.sub15
|
||
%47:vgpr_32 = COPY %25.sub14
|
||
%48:vgpr_32 = COPY %25.sub13
|
||
%49:vgpr_32 = COPY %25.sub12
|
||
%50:vreg_128 = REG_SEQUENCE killed %49, %subreg.sub0, killed %48, %subreg.sub1, killed %47, %subreg.sub2, killed %46, %subreg.sub3
|
||
GLOBAL_STORE_DWORDX4_SADDR %1, killed %50, %2, 112, 0, 0, 0, implicit $exec
|
||
%51:vgpr_32 = COPY %25.sub11
|
||
%52:vgpr_32 = COPY %25.sub10
|
||
%53:vgpr_32 = COPY %25.sub9
|
||
%54:vgpr_32 = COPY %25.sub8
|
||
%55:vreg_128 = REG_SEQUENCE killed %54, %subreg.sub0, killed %53, %subreg.sub1, killed %52, %subreg.sub2, killed %51, %subreg.sub3
|
||
GLOBAL_STORE_DWORDX4_SADDR %1, killed %55, %2, 96, 0, 0, 0, implicit $exec
|
||
%56:vgpr_32 = COPY %25.sub7
|
||
%57:vgpr_32 = COPY %25.sub6
|
||
%58:vgpr_32 = COPY %25.sub5
|
||
%59:vgpr_32 = COPY %25.sub4
|
||
%60:vreg_128 = REG_SEQUENCE killed %59, %subreg.sub0, killed %58, %subreg.sub1, killed %57, %subreg.sub2, killed %56, %subreg.sub3
|
||
GLOBAL_STORE_DWORDX4_SADDR %1, killed %60, %2, 80, 0, 0, 0, implicit $exec
|
||
%61:vgpr_32 = COPY %25.sub3
|
||
%62:vgpr_32 = COPY %25.sub2
|
||
%63:vgpr_32 = COPY %25.sub1
|
||
; Last read of %25, hence the kill flag on this copy.
%64:vgpr_32 = COPY killed %25.sub0
|
||
%65:vreg_128 = REG_SEQUENCE killed %64, %subreg.sub0, killed %63, %subreg.sub1, killed %62, %subreg.sub2, killed %61, %subreg.sub3
|
||
; Final store: also the last use of the address operands %1 and %2.
GLOBAL_STORE_DWORDX4_SADDR killed %1, killed %65, killed %2, 64, 0, 0, 0, implicit $exec
|
||
S_ENDPGM 0
|
||
|
||
...
|
||
|