1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
| # NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
# RUN: llc -march=amdgcn -verify-machineinstrs -run-pass=si-i1-copies %s -o - | FileCheck -check-prefix=GCN %s
---
name: kernel_i1_copy_phi_with_phi_incoming_value
tracksRegLiveness: true
body: |
; GCN-LABEL: name: kernel_i1_copy_phi_with_phi_incoming_value
; GCN: bb.0:
; GCN: successors: %bb.1(0x40000000), %bb.5(0x40000000)
; GCN: liveins: $vgpr0, $sgpr4_sgpr5
; GCN: [[COPY:%[0-9]+]]:sgpr_64(p4) = COPY $sgpr4_sgpr5
; GCN: [[COPY1:%[0-9]+]]:vgpr_32(s32) = COPY $vgpr0
; GCN: [[S_LOAD_DWORD_IMM:%[0-9]+]]:sreg_32_xm0_xexec = S_LOAD_DWORD_IMM [[COPY]](p4), 0, 0, 0 :: (dereferenceable invariant load 4, align 16, addrspace 4)
; GCN: [[COPY2:%[0-9]+]]:sreg_32 = COPY [[S_LOAD_DWORD_IMM]]
; GCN: [[COPY3:%[0-9]+]]:vgpr_32 = COPY [[COPY1]](s32)
; GCN: [[V_CMP_LT_I32_e64_:%[0-9]+]]:sreg_64 = V_CMP_LT_I32_e64 [[COPY1]](s32), [[S_LOAD_DWORD_IMM]], implicit $exec
; GCN: [[S_MOV_B64_:%[0-9]+]]:sreg_64 = S_MOV_B64 0
; GCN: [[SI_IF:%[0-9]+]]:sreg_64 = SI_IF killed [[V_CMP_LT_I32_e64_]], %bb.5, implicit-def dead $exec, implicit-def dead $scc, implicit $exec
; GCN: S_BRANCH %bb.1
; GCN: bb.1:
; GCN: successors: %bb.6(0x80000000)
; GCN: [[S_MOV_B32_:%[0-9]+]]:sreg_32 = S_MOV_B32 16
; GCN: [[V_ADD_U32_e64_:%[0-9]+]]:vgpr_32 = V_ADD_U32_e64 [[COPY3]], killed [[S_MOV_B32_]], 0, implicit $exec
; GCN: [[V_CMP_GE_I32_e64_:%[0-9]+]]:sreg_64 = V_CMP_GE_I32_e64 [[V_ADD_U32_e64_]], [[COPY2]], implicit $exec
; GCN: [[S_MOV_B64_1:%[0-9]+]]:sreg_64 = S_MOV_B64 0
; GCN: [[COPY4:%[0-9]+]]:sreg_64 = COPY [[V_CMP_GE_I32_e64_]]
; GCN: S_BRANCH %bb.6
; GCN: bb.2:
; GCN: successors: %bb.5(0x80000000)
; GCN: [[PHI:%[0-9]+]]:sreg_64 = PHI %15, %bb.6
; GCN: SI_END_CF [[PHI]], implicit-def dead $exec, implicit-def dead $scc, implicit $exec
; GCN: [[S_MOV_B64_2:%[0-9]+]]:sreg_64 = S_MOV_B64 -1
; GCN: [[COPY5:%[0-9]+]]:sreg_64 = COPY $exec
; GCN: S_BRANCH %bb.5
; GCN: bb.3:
; GCN: successors: %bb.4(0x40000000), %bb.7(0x40000000)
; GCN: ATOMIC_FENCE 5, 2
; GCN: S_BARRIER
; GCN: ATOMIC_FENCE 4, 2
; GCN: [[COPY6:%[0-9]+]]:sreg_64 = COPY %18
; GCN: [[SI_IF1:%[0-9]+]]:sreg_64 = SI_IF [[COPY6]], %bb.7, implicit-def dead $exec, implicit-def dead $scc, implicit $exec
; GCN: S_BRANCH %bb.4
; GCN: bb.4:
; GCN: successors: %bb.7(0x80000000)
; GCN: S_BRANCH %bb.7
; GCN: bb.5:
; GCN: successors: %bb.3(0x80000000)
; GCN: [[PHI1:%[0-9]+]]:sreg_64 = PHI [[S_MOV_B64_]], %bb.0, [[COPY5]], %bb.2
; GCN: SI_END_CF [[SI_IF]], implicit-def dead $exec, implicit-def dead $scc, implicit $exec
; GCN: S_BRANCH %bb.3
; GCN: bb.6:
; GCN: successors: %bb.2(0x40000000), %bb.6(0x40000000)
; GCN: [[PHI2:%[0-9]+]]:sreg_64 = PHI [[S_MOV_B64_1]], %bb.1, %15, %bb.6
; GCN: [[COPY7:%[0-9]+]]:sreg_64 = COPY [[COPY4]]
; GCN: [[SI_IF_BREAK:%[0-9]+]]:sreg_64 = SI_IF_BREAK [[COPY7]], [[PHI2]], implicit-def dead $scc
; GCN: SI_LOOP [[SI_IF_BREAK]], %bb.6, implicit-def dead $exec, implicit-def dead $scc, implicit $exec
; GCN: S_BRANCH %bb.2
; GCN: bb.7:
; GCN: SI_END_CF [[SI_IF1]], implicit-def dead $exec, implicit-def dead $scc, implicit $exec
; GCN: S_ENDPGM 0
bb.0:
successors: %bb.1, %bb.5
liveins: $vgpr0, $sgpr4_sgpr5
%1:sgpr_64(p4) = COPY $sgpr4_sgpr5
%2:vgpr_32(s32) = COPY $vgpr0
%3:sreg_32_xm0_xexec = S_LOAD_DWORD_IMM %1:sgpr_64(p4), 0, 0, 0 :: (dereferenceable invariant load 4, align 16, addrspace 4)
%8:sreg_32 = COPY %3:sreg_32_xm0_xexec
%14:vgpr_32 = COPY %2:vgpr_32(s32)
%9:sreg_64 = V_CMP_LT_I32_e64 %2:vgpr_32(s32), %3:sreg_32_xm0_xexec, implicit $exec
%4:sreg_64 = S_MOV_B64 0
%17:vreg_1 = COPY %4:sreg_64, implicit $exec
%16:sreg_64 = SI_IF killed %9:sreg_64, %bb.5, implicit-def dead $exec, implicit-def dead $scc, implicit $exec
S_BRANCH %bb.1
bb.1:
; predecessors: %bb.0
successors: %bb.6
%10:sreg_32 = S_MOV_B32 16
%18:vgpr_32 = V_ADD_U32_e64 %14:vgpr_32, killed %10:sreg_32, 0, implicit $exec
%11:sreg_64 = V_CMP_GE_I32_e64 %18:vgpr_32, %8:sreg_32, implicit $exec
%12:sreg_64 = S_MOV_B64 0
%19:vreg_1 = COPY %11:sreg_64
S_BRANCH %bb.6
bb.2:
; predecessors: %bb.6
successors: %bb.5
%20:sreg_64 = PHI %6:sreg_64, %bb.6
SI_END_CF %20:sreg_64, implicit-def dead $exec, implicit-def dead $scc, implicit $exec
%15:sreg_64 = S_MOV_B64 -1
%21:vreg_1 = COPY %15:sreg_64, implicit $exec
S_BRANCH %bb.5
bb.3:
; predecessors: %bb.5
successors: %bb.4, %bb.7
%22:vreg_1 = PHI %7:vreg_1, %bb.5
ATOMIC_FENCE 5, 2
S_BARRIER
ATOMIC_FENCE 4, 2
%23:sreg_64 = COPY %22:vreg_1
%24:sreg_64 = SI_IF %23:sreg_64, %bb.7, implicit-def dead $exec, implicit-def dead $scc, implicit $exec
S_BRANCH %bb.4
bb.4:
; predecessors: %bb.3
successors: %bb.7
S_BRANCH %bb.7
bb.5:
; predecessors: %bb.0, %bb.2
successors: %bb.3
%7:vreg_1 = PHI %17:vreg_1, %bb.0, %21:vreg_1, %bb.2
SI_END_CF %16:sreg_64, implicit-def dead $exec, implicit-def dead $scc, implicit $exec
S_BRANCH %bb.3
bb.6:
; predecessors: %bb.1, %bb.6
successors: %bb.2, %bb.6
%5:sreg_64 = PHI %12:sreg_64, %bb.1, %6:sreg_64, %bb.6
%13:sreg_64 = COPY %19:vreg_1
%6:sreg_64 = SI_IF_BREAK %13:sreg_64, %5:sreg_64, implicit-def dead $scc
SI_LOOP %6:sreg_64, %bb.6, implicit-def dead $exec, implicit-def dead $scc, implicit $exec
S_BRANCH %bb.2
bb.7:
; predecessors: %bb.3, %bb.4
SI_END_CF %24:sreg_64, implicit-def dead $exec, implicit-def dead $scc, implicit $exec
S_ENDPGM 0
...
|