1 ; Test 32-bit floating-point comparison. The tests assume a z10 implementation
2 ; of select, using conditional branches rather than LOCGR.
4 ; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z10 | FileCheck %s
8 ; Check comparison with registers.
9 define i64 @f1(i64 %a, i64 %b, float %f1, float %f2) {
; Both compare operands are float arguments; the expectation below is the
; register-register compare instruction applied to %f0 and %f2.
11 ; CHECK: cebr %f0, %f2
; Ordered-equal compare whose result picks %a (true) or %b (false).
15 %cond = fcmp oeq float %f1, %f2
16 %res = select i1 %cond, i64 %a, i64 %b
20 ; Check the low end of the CEB range.
21 define i64 @f2(i64 %a, i64 %b, float %f1, float *%ptr) {
; The second operand is loaded straight from %ptr with no offset, so the
; expectation is the memory form of the compare with displacement 0 off %r4.
23 ; CHECK: ceb %f0, 0(%r4)
27 %f2 = load float *%ptr
; Ordered-equal compare of the argument with the loaded value, then select.
28 %cond = fcmp oeq float %f1, %f2
29 %res = select i1 %cond, i64 %a, i64 %b
33 ; Check the high end of the aligned CEB range.
34 define i64 @f3(i64 %a, i64 %b, float %f1, float *%base) {
; Element 1023 of a float array is 1023 * 4 = 4092 bytes past %base; the
; expectation is that this offset is folded into the compare's displacement.
36 ; CHECK: ceb %f0, 4092(%r4)
40 %ptr = getelementptr float *%base, i64 1023
41 %f2 = load float *%ptr
; Ordered-equal compare of the argument with the loaded value, then select.
42 %cond = fcmp oeq float %f1, %f2
43 %res = select i1 %cond, i64 %a, i64 %b
47 ; Check the next word up, which needs separate address logic.
48 ; Other sequences besides this one would be OK.
49 define i64 @f4(i64 %a, i64 %b, float %f1, float *%base) {
; Element 1024 is 4096 bytes past %base. The expectations below are that the
; offset is first added to %r4 and the compare then uses displacement 0.
51 ; CHECK: aghi %r4, 4096
52 ; CHECK: ceb %f0, 0(%r4)
56 %ptr = getelementptr float *%base, i64 1024
57 %f2 = load float *%ptr
; Ordered-equal compare of the argument with the loaded value, then select.
58 %cond = fcmp oeq float %f1, %f2
59 %res = select i1 %cond, i64 %a, i64 %b
63 ; Check negative displacements, which also need separate address logic.
64 define i64 @f5(i64 %a, i64 %b, float %f1, float *%base) {
; The load address is one float (4 bytes) below %base. The visible expectation
; is a compare with displacement 0 off %r4, so the address adjustment is
; presumably done by a separate instruction that is not checked in the lines
; shown here -- NOTE(review): confirm against the full test file.
67 ; CHECK: ceb %f0, 0(%r4)
71 %ptr = getelementptr float *%base, i64 -1
72 %f2 = load float *%ptr
; Ordered-equal compare of the argument with the loaded value, then select.
73 %cond = fcmp oeq float %f1, %f2
74 %res = select i1 %cond, i64 %a, i64 %b
78 ; Check that CEB allows indices.
79 define i64 @f6(i64 %a, i64 %b, float %f1, float *%base, i64 %index) {
; The address is %base + %index floats + 100 floats. The expectations below
; are that the index in %r5 is shifted by 2 into %r1 (matching 4-byte
; elements) and that the compare uses base, index and the constant
; displacement 400 (100 * 4) together.
81 ; CHECK: sllg %r1, %r5, 2
82 ; CHECK: ceb %f0, 400(%r1,%r4)
86 %ptr1 = getelementptr float *%base, i64 %index
87 %ptr2 = getelementptr float *%ptr1, i64 100
88 %f2 = load float *%ptr2
; Ordered-equal compare of the argument with the loaded value, then select.
89 %cond = fcmp oeq float %f1, %f2
90 %res = select i1 %cond, i64 %a, i64 %b
94 ; Check that comparisons of spilled values can use CEB rather than CEBR.
95 define float @f7(float *%ptr0) {
; Eleven floats are loaded before a call to @foo and all of them are used
; after it. The expectations below are that, after the call, at least one
; compare reads its second operand directly from a stack slot at offset 160
; or 164 from %r15 instead of reloading it into a register first.
97 ; CHECK: brasl %r14, foo@PLT
98 ; CHECK: ceb {{%f[0-9]+}}, 16{{[04]}}(%r15)
; Addresses of every second element of the array: indices 2, 4, ..., 20.
100 %ptr1 = getelementptr float *%ptr0, i64 2
101 %ptr2 = getelementptr float *%ptr0, i64 4
102 %ptr3 = getelementptr float *%ptr0, i64 6
103 %ptr4 = getelementptr float *%ptr0, i64 8
104 %ptr5 = getelementptr float *%ptr0, i64 10
105 %ptr6 = getelementptr float *%ptr0, i64 12
106 %ptr7 = getelementptr float *%ptr0, i64 14
107 %ptr8 = getelementptr float *%ptr0, i64 16
108 %ptr9 = getelementptr float *%ptr0, i64 18
109 %ptr10 = getelementptr float *%ptr0, i64 20
; Load all eleven values before the call so that they are live across it.
111 %val0 = load float *%ptr0
112 %val1 = load float *%ptr1
113 %val2 = load float *%ptr2
114 %val3 = load float *%ptr3
115 %val4 = load float *%ptr4
116 %val5 = load float *%ptr5
117 %val6 = load float *%ptr6
118 %val7 = load float *%ptr7
119 %val8 = load float *%ptr8
120 %val9 = load float *%ptr9
121 %val10 = load float *%ptr10
; @foo is not defined or declared in the lines shown here.
123 %ret = call float @foo()
; Compare the call result (first operand) against each preloaded value.
125 %cmp0 = fcmp olt float %ret, %val0
126 %cmp1 = fcmp olt float %ret, %val1
127 %cmp2 = fcmp olt float %ret, %val2
128 %cmp3 = fcmp olt float %ret, %val3
129 %cmp4 = fcmp olt float %ret, %val4
130 %cmp5 = fcmp olt float %ret, %val5
131 %cmp6 = fcmp olt float %ret, %val6
132 %cmp7 = fcmp olt float %ret, %val7
133 %cmp8 = fcmp olt float %ret, %val8
134 %cmp9 = fcmp olt float %ret, %val9
135 %cmp10 = fcmp olt float %ret, %val10
; Chain the selects so that every comparison result feeds the final value:
; each step keeps the previous result when its compare is true and otherwise
; substitutes a distinct constant.
137 %sel0 = select i1 %cmp0, float %ret, float 0.0
138 %sel1 = select i1 %cmp1, float %sel0, float 1.0
139 %sel2 = select i1 %cmp2, float %sel1, float 2.0
140 %sel3 = select i1 %cmp3, float %sel2, float 3.0
141 %sel4 = select i1 %cmp4, float %sel3, float 4.0
142 %sel5 = select i1 %cmp5, float %sel4, float 5.0
143 %sel6 = select i1 %cmp6, float %sel5, float 6.0
144 %sel7 = select i1 %cmp7, float %sel6, float 7.0
145 %sel8 = select i1 %cmp8, float %sel7, float 8.0
146 %sel9 = select i1 %cmp9, float %sel8, float 9.0
147 %sel10 = select i1 %cmp10, float %sel9, float 10.0
152 ; Check comparison with zero.
153 define i64 @f8(i64 %a, i64 %b, float %f) {
; The second operand is the constant 0.0. The expectation is that no separate
; compare instruction is needed: ltebr with %f0 as both operands is expected,
; followed later by the register move lgr %r2, %r3.
155 ; CHECK: ltebr %f0, %f0
157 ; CHECK: lgr %r2, %r3
; Ordered-equal compare of the argument with zero, then select.
159 %cond = fcmp oeq float %f, 0.0
160 %res = select i1 %cond, i64 %a, i64 %b
164 ; Check the comparison can be reversed if that allows CEB to be used, first with oeq.
166 define i64 @f9(i64 %a, i64 %b, float %f2, float *%ptr) {
; The loaded value is the FIRST fcmp operand here, while the expected compare
; has the register argument (%f0) first and the memory operand second, i.e.
; the operands are swapped. oeq is unaffected by the swap, so the branch that
; must immediately follow the compare is still je.
168 ; CHECK: ceb %f0, 0(%r4)
169 ; CHECK-NEXT: je {{\.L.*}}
170 ; CHECK: lgr %r2, %r3
172 %f1 = load float *%ptr
173 %cond = fcmp oeq float %f1, %f2
174 %res = select i1 %cond, i64 %a, i64 %b
179 define i64 @f10(i64 %a, i64 %b, float %f2, float *%ptr) {
; Same shape as the oeq case but with predicate one: the loaded value is the
; first fcmp operand, the expected compare has the register argument first.
; The branch expected directly after the compare is jlh.
181 ; CHECK: ceb %f0, 0(%r4)
182 ; CHECK-NEXT: jlh {{\.L.*}}
183 ; CHECK: lgr %r2, %r3
185 %f1 = load float *%ptr
186 %cond = fcmp one float %f1, %f2
187 %res = select i1 %cond, i64 %a, i64 %b
192 define i64 @f11(i64 %a, i64 %b, float %f2, float *%ptr) {
; Predicate olt with the loaded value as the first fcmp operand. Because the
; expected compare has the register argument first, the condition is tested
; from the other side: the branch expected directly after it is jh.
194 ; CHECK: ceb %f0, 0(%r4)
195 ; CHECK-NEXT: jh {{\.L.*}}
196 ; CHECK: lgr %r2, %r3
198 %f1 = load float *%ptr
199 %cond = fcmp olt float %f1, %f2
200 %res = select i1 %cond, i64 %a, i64 %b
205 define i64 @f12(i64 %a, i64 %b, float %f2, float *%ptr) {
; Predicate ole with the loaded value as the first fcmp operand. With the
; operands swapped in the expected compare, the branch expected directly
; after it is jhe.
207 ; CHECK: ceb %f0, 0(%r4)
208 ; CHECK-NEXT: jhe {{\.L.*}}
209 ; CHECK: lgr %r2, %r3
211 %f1 = load float *%ptr
212 %cond = fcmp ole float %f1, %f2
213 %res = select i1 %cond, i64 %a, i64 %b
218 define i64 @f13(i64 %a, i64 %b, float %f2, float *%ptr) {
; Predicate oge with the loaded value as the first fcmp operand. With the
; operands swapped in the expected compare, the branch expected directly
; after it is jle.
220 ; CHECK: ceb %f0, 0(%r4)
221 ; CHECK-NEXT: jle {{\.L.*}}
222 ; CHECK: lgr %r2, %r3
224 %f1 = load float *%ptr
225 %cond = fcmp oge float %f1, %f2
226 %res = select i1 %cond, i64 %a, i64 %b
231 define i64 @f14(i64 %a, i64 %b, float %f2, float *%ptr) {
; Predicate ogt with the loaded value as the first fcmp operand. With the
; operands swapped in the expected compare, the branch expected directly
; after it is jl.
233 ; CHECK: ceb %f0, 0(%r4)
234 ; CHECK-NEXT: jl {{\.L.*}}
235 ; CHECK: lgr %r2, %r3
237 %f1 = load float *%ptr
238 %cond = fcmp ogt float %f1, %f2
239 %res = select i1 %cond, i64 %a, i64 %b
244 define i64 @f15(i64 %a, i64 %b, float %f2, float *%ptr) {
; Unordered-or-equal predicate (ueq) with the loaded value as the first fcmp
; operand. The expected compare has the register argument first; the branch
; expected directly after it is jnlh.
246 ; CHECK: ceb %f0, 0(%r4)
247 ; CHECK-NEXT: jnlh {{\.L.*}}
248 ; CHECK: lgr %r2, %r3
250 %f1 = load float *%ptr
251 %cond = fcmp ueq float %f1, %f2
252 %res = select i1 %cond, i64 %a, i64 %b
257 define i64 @f16(i64 %a, i64 %b, float %f2, float *%ptr) {
; Unordered-or-not-equal predicate (une) with the loaded value as the first
; fcmp operand. The expected compare has the register argument first; the
; branch expected directly after it is jne.
259 ; CHECK: ceb %f0, 0(%r4)
260 ; CHECK-NEXT: jne {{\.L.*}}
261 ; CHECK: lgr %r2, %r3
263 %f1 = load float *%ptr
264 %cond = fcmp une float %f1, %f2
265 %res = select i1 %cond, i64 %a, i64 %b
270 define i64 @f17(i64 %a, i64 %b, float %f2, float *%ptr) {
; Predicate ult with the loaded value as the first fcmp operand. With the
; operands swapped in the expected compare, the branch expected directly
; after it is jnle.
272 ; CHECK: ceb %f0, 0(%r4)
273 ; CHECK-NEXT: jnle {{\.L.*}}
274 ; CHECK: lgr %r2, %r3
276 %f1 = load float *%ptr
277 %cond = fcmp ult float %f1, %f2
278 %res = select i1 %cond, i64 %a, i64 %b
283 define i64 @f18(i64 %a, i64 %b, float %f2, float *%ptr) {
; Predicate ule with the loaded value as the first fcmp operand. With the
; operands swapped in the expected compare, the branch expected directly
; after it is jnl.
285 ; CHECK: ceb %f0, 0(%r4)
286 ; CHECK-NEXT: jnl {{\.L.*}}
287 ; CHECK: lgr %r2, %r3
289 %f1 = load float *%ptr
290 %cond = fcmp ule float %f1, %f2
291 %res = select i1 %cond, i64 %a, i64 %b
296 define i64 @f19(i64 %a, i64 %b, float %f2, float *%ptr) {
; Predicate uge with the loaded value as the first fcmp operand. With the
; operands swapped in the expected compare, the branch expected directly
; after it is jnh.
298 ; CHECK: ceb %f0, 0(%r4)
299 ; CHECK-NEXT: jnh {{\.L.*}}
300 ; CHECK: lgr %r2, %r3
302 %f1 = load float *%ptr
303 %cond = fcmp uge float %f1, %f2
304 %res = select i1 %cond, i64 %a, i64 %b
309 define i64 @f20(i64 %a, i64 %b, float %f2, float *%ptr) {
; Predicate ugt with the loaded value as the first fcmp operand. With the
; operands swapped in the expected compare, the branch expected directly
; after it is jnhe.
311 ; CHECK: ceb %f0, 0(%r4)
312 ; CHECK-NEXT: jnhe {{\.L.*}}
313 ; CHECK: lgr %r2, %r3
315 %f1 = load float *%ptr
316 %cond = fcmp ugt float %f1, %f2
317 %res = select i1 %cond, i64 %a, i64 %b