1 ; RUN: llc -march=amdgcn -mcpu=SI -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=GCN -check-prefix=FUNC %s
2 ; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=VI -check-prefix=GCN -check-prefix=FUNC %s
3 ; RUN: llc -march=r600 -mcpu=cypress -verify-machineinstrs < %s | FileCheck -check-prefix=EG -check-prefix=FUNC %s
5 ; FUNC-LABEL: {{^}}sext_bool_icmp_eq_0:
7 ; GCN: v_cmp_ne_i32_e32 vcc,
8 ; GCN-NEXT: v_cndmask_b32_e64 [[RESULT:v[0-9]+]], 0, 1, vcc
9 ; GCN-NEXT:buffer_store_byte [[RESULT]]
12 ; EG: SETNE_INT * [[CMP:T[0-9]+]].[[CMPCHAN:[XYZW]]], KC0[2].Z, KC0[2].W
13 ; EG: AND_INT T{{[0-9]+.[XYZW]}}, PS, 1
14 define void @sext_bool_icmp_eq_0(i1 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
15 %icmp0 = icmp eq i32 %a, %b
16 %ext = sext i1 %icmp0 to i32
17 %icmp1 = icmp eq i32 %ext, 0
18 store i1 %icmp1, i1 addrspace(1)* %out
22 ; FUNC-LABEL: {{^}}sext_bool_icmp_ne_0:
24 ; GCN: v_cmp_ne_i32_e32 vcc,
25 ; GCN-NEXT: v_cndmask_b32_e64 [[RESULT:v[0-9]+]], 0, 1, vcc
26 ; GCN-NEXT: buffer_store_byte [[RESULT]]
29 ; EG: SETNE_INT * [[CMP:T[0-9]+]].[[CMPCHAN:[XYZW]]], KC0[2].Z, KC0[2].W
30 ; EG: AND_INT T{{[0-9]+.[XYZW]}}, PS, 1
31 define void @sext_bool_icmp_ne_0(i1 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
32 %icmp0 = icmp ne i32 %a, %b
33 %ext = sext i1 %icmp0 to i32
34 %icmp1 = icmp ne i32 %ext, 0
35 store i1 %icmp1, i1 addrspace(1)* %out
39 ; This really folds away to false
40 ; FUNC-LABEL: {{^}}sext_bool_icmp_eq_1:
41 ; GCN: v_cmp_eq_i32_e32 vcc,
42 ; GCN-NEXT: v_cndmask_b32_e64 [[TMP:v[0-9]+]], 0, -1, vcc
43 ; GCN-NEXT: v_cmp_eq_i32_e32 vcc, 1, [[TMP]]{{$}}
44 ; GCN-NEXT: v_cndmask_b32_e64 [[TMP:v[0-9]+]], 0, 1,
45 ; GCN-NEXT: buffer_store_byte [[TMP]]
47 define void @sext_bool_icmp_eq_1(i1 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
48 %icmp0 = icmp eq i32 %a, %b
49 %ext = sext i1 %icmp0 to i32
50 %icmp1 = icmp eq i32 %ext, 1
51 store i1 %icmp1, i1 addrspace(1)* %out
55 ; This really folds away to true
56 ; FUNC-LABEL: {{^}}sext_bool_icmp_ne_1:
57 ; GCN: v_cmp_ne_i32_e32 vcc,
58 ; GCN-NEXT: v_cndmask_b32_e64 [[TMP:v[0-9]+]], 0, -1, vcc
59 ; GCN-NEXT: v_cmp_ne_i32_e32 vcc, 1, [[TMP]]{{$}}
60 ; GCN-NEXT: v_cndmask_b32_e64 [[TMP:v[0-9]+]], 0, 1,
61 ; GCN-NEXT: buffer_store_byte [[TMP]]
63 define void @sext_bool_icmp_ne_1(i1 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
64 %icmp0 = icmp ne i32 %a, %b
65 %ext = sext i1 %icmp0 to i32
66 %icmp1 = icmp ne i32 %ext, 1
67 store i1 %icmp1, i1 addrspace(1)* %out
71 ; FUNC-LABEL: {{^}}zext_bool_icmp_eq_0:
73 ; GCN: v_cmp_ne_i32_e32 vcc,
74 ; GCN-NEXT: v_cndmask_b32_e64 [[RESULT:v[0-9]+]], 0, 1, vcc
75 ; GCN-NEXT: buffer_store_byte [[RESULT]]
77 define void @zext_bool_icmp_eq_0(i1 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
78 %icmp0 = icmp eq i32 %a, %b
79 %ext = zext i1 %icmp0 to i32
80 %icmp1 = icmp eq i32 %ext, 0
81 store i1 %icmp1, i1 addrspace(1)* %out
85 ; FUNC-LABEL: {{^}}zext_bool_icmp_ne_0:
87 ; GCN: v_cmp_ne_i32_e32 vcc,
88 ; GCN-NEXT: v_cndmask_b32_e64 [[RESULT:v[0-9]+]], 0, 1, vcc
89 ; GCN-NEXT: buffer_store_byte [[RESULT]]
91 define void @zext_bool_icmp_ne_0(i1 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
92 %icmp0 = icmp ne i32 %a, %b
93 %ext = zext i1 %icmp0 to i32
94 %icmp1 = icmp ne i32 %ext, 0
95 store i1 %icmp1, i1 addrspace(1)* %out
99 ; FUNC-LABEL: {{^}}zext_bool_icmp_eq_1:
101 ; GCN: v_cmp_eq_i32_e32 vcc,
102 ; GCN-NEXT: v_cndmask_b32_e64 [[RESULT:v[0-9]+]], 0, 1, vcc
103 ; GCN-NEXT: buffer_store_byte [[RESULT]]
105 define void @zext_bool_icmp_eq_1(i1 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
106 %icmp0 = icmp eq i32 %a, %b
107 %ext = zext i1 %icmp0 to i32
108 %icmp1 = icmp eq i32 %ext, 1
109 store i1 %icmp1, i1 addrspace(1)* %out
113 ; FUNC-LABEL: {{^}}zext_bool_icmp_ne_1:
115 ; GCN: v_cmp_eq_i32_e32 vcc,
116 ; GCN-NEXT: v_cndmask_b32_e64 [[RESULT:v[0-9]+]], 0, 1, vcc
117 ; GCN-NEXT: buffer_store_byte [[RESULT]]
118 define void @zext_bool_icmp_ne_1(i1 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
119 %icmp0 = icmp ne i32 %a, %b
120 %ext = zext i1 %icmp0 to i32
121 %icmp1 = icmp ne i32 %ext, 1
122 store i1 %icmp1, i1 addrspace(1)* %out
126 ; FUNC-LABEL: {{^}}sext_bool_icmp_ne_k:
127 ; SI-DAG: s_load_dword [[A:s[0-9]+]], s{{\[[0-9]+:[0-9]+\]}}, 0xb
128 ; SI-DAG: s_load_dword [[B:s[0-9]+]], s{{\[[0-9]+:[0-9]+\]}}, 0xc
129 ; VI-DAG: s_load_dword [[A:s[0-9]+]], s{{\[[0-9]+:[0-9]+\]}}, 0x2c
130 ; VI-DAG: s_load_dword [[B:s[0-9]+]], s{{\[[0-9]+:[0-9]+\]}}, 0x30
131 ; GCN: v_mov_b32_e32 [[VB:v[0-9]+]], [[B]]
132 ; GCN: v_cmp_ne_i32_e32 vcc, 2, [[VB]]{{$}}
133 ; GCN: v_cndmask_b32_e64 [[RESULT:v[0-9]+]], 0, 1, vcc
134 ; GCN: buffer_store_byte
136 define void @sext_bool_icmp_ne_k(i1 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
137 %icmp0 = icmp ne i32 %a, %b
138 %ext = sext i1 %icmp0 to i32
139 %icmp1 = icmp ne i32 %ext, 2
140 store i1 %icmp1, i1 addrspace(1)* %out
144 ; FUNC-LABEL: {{^}}cmp_zext_k_i8max:
145 ; SI: s_load_dword [[VALUE:s[0-9]+]], s{{\[[0-9]+:[0-9]+\]}}, 0xb
146 ; VI: s_load_dword [[VALUE:s[0-9]+]], s{{\[[0-9]+:[0-9]+\]}}, 0x2c
147 ; GCN: s_movk_i32 [[K255:s[0-9]+]], 0xff
148 ; GCN: s_and_b32 [[B:s[0-9]+]], [[VALUE]], [[K255]]
149 ; GCN: v_mov_b32_e32 [[VK255:v[0-9]+]], [[K255]]
150 ; GCN: v_cmp_ne_i32_e32 vcc, [[B]], [[VK255]]
151 ; GCN-NEXT: v_cndmask_b32_e64 [[RESULT:v[0-9]+]], 0, 1, vcc
152 ; GCN: buffer_store_byte [[RESULT]]
154 define void @cmp_zext_k_i8max(i1 addrspace(1)* %out, i8 %b) nounwind {
155 %b.ext = zext i8 %b to i32
156 %icmp0 = icmp ne i32 %b.ext, 255
157 store i1 %icmp0, i1 addrspace(1)* %out
161 ; FUNC-LABEL: {{^}}cmp_sext_k_neg1:
162 ; GCN: buffer_load_sbyte [[B:v[0-9]+]]
163 ; GCN: v_cmp_ne_i32_e32 vcc, -1, [[B]]{{$}}
164 ; GCN-NEXT: v_cndmask_b32_e64 [[RESULT:v[0-9]+]], 0, 1, vcc
165 ; GCN-NEXT: buffer_store_byte [[RESULT]]
167 define void @cmp_sext_k_neg1(i1 addrspace(1)* %out, i8 addrspace(1)* %b.ptr) nounwind {
168 %b = load i8, i8 addrspace(1)* %b.ptr
169 %b.ext = sext i8 %b to i32
170 %icmp0 = icmp ne i32 %b.ext, -1
171 store i1 %icmp0, i1 addrspace(1)* %out
175 ; FUNC-LABEL: {{^}}cmp_sext_k_neg1_i8_sext_arg:
176 ; GCN: s_load_dword [[B:s[0-9]+]]
177 ; GCN: v_cmp_ne_i32_e64 [[CMP:s\[[0-9]+:[0-9]+\]]], -1, [[B]]
178 ; GCN-NEXT: v_cndmask_b32_e64 [[RESULT:v[0-9]+]], 0, 1, [[CMP]]
179 ; GCN-NEXT: buffer_store_byte [[RESULT]]
181 define void @cmp_sext_k_neg1_i8_sext_arg(i1 addrspace(1)* %out, i8 signext %b) nounwind {
182 %b.ext = sext i8 %b to i32
183 %icmp0 = icmp ne i32 %b.ext, -1
184 store i1 %icmp0, i1 addrspace(1)* %out
188 ; FIXME: This ends up doing a buffer_load_ubyte, and and compare to
189 ; 255. Seems to be because of ordering problems when not allowing load widths to be reduced.
190 ; Should do a buffer_load_sbyte and compare with -1
192 ; FUNC-LABEL: {{^}}cmp_sext_k_neg1_i8_arg:
193 ; SI: s_load_dword [[VAL:s[0-9]+]], s[{{[0-9]+:[0-9]+}}], 0xb
194 ; VI: s_load_dword [[VAL:s[0-9]+]], s{{\[[0-9]+:[0-9]+\]}}, 0x2c
195 ; GCN: s_movk_i32 [[K:s[0-9]+]], 0xff
196 ; GCN: s_and_b32 [[B:s[0-9]+]], [[VAL]], [[K]]
197 ; GCN: v_mov_b32_e32 [[VK:v[0-9]+]], [[K]]
198 ; GCN: v_cmp_ne_i32_e32 vcc, [[B]], [[VK]]{{$}}
199 ; GCN-NEXT: v_cndmask_b32_e64 [[RESULT:v[0-9]+]], 0, 1, vcc
200 ; GCN: buffer_store_byte [[RESULT]]
202 define void @cmp_sext_k_neg1_i8_arg(i1 addrspace(1)* %out, i8 %b) nounwind {
203 %b.ext = sext i8 %b to i32
204 %icmp0 = icmp ne i32 %b.ext, -1
205 store i1 %icmp0, i1 addrspace(1)* %out
209 ; FUNC-LABEL: {{^}}cmp_zext_k_neg1:
210 ; GCN: v_mov_b32_e32 [[RESULT:v[0-9]+]], 1{{$}}
211 ; GCN: buffer_store_byte [[RESULT]]
213 define void @cmp_zext_k_neg1(i1 addrspace(1)* %out, i8 %b) nounwind {
214 %b.ext = zext i8 %b to i32
215 %icmp0 = icmp ne i32 %b.ext, -1
216 store i1 %icmp0, i1 addrspace(1)* %out
220 ; FUNC-LABEL: {{^}}zext_bool_icmp_ne_k:
221 ; GCN: v_mov_b32_e32 [[RESULT:v[0-9]+]], 1{{$}}
222 ; GCN: buffer_store_byte [[RESULT]]
224 define void @zext_bool_icmp_ne_k(i1 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
225 %icmp0 = icmp ne i32 %a, %b
226 %ext = zext i1 %icmp0 to i32
227 %icmp1 = icmp ne i32 %ext, 2
228 store i1 %icmp1, i1 addrspace(1)* %out
232 ; FUNC-LABEL: {{^}}zext_bool_icmp_eq_k:
233 ; GCN: v_mov_b32_e32 [[RESULT:v[0-9]+]], 0{{$}}
234 ; GCN: buffer_store_byte [[RESULT]]
236 define void @zext_bool_icmp_eq_k(i1 addrspace(1)* %out, i32 %a, i32 %b) nounwind {
237 %icmp0 = icmp ne i32 %a, %b
238 %ext = zext i1 %icmp0 to i32
239 %icmp1 = icmp eq i32 %ext, 2
240 store i1 %icmp1, i1 addrspace(1)* %out