1 ; RUN: llc -march=amdgcn -mcpu=SI < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s
2 ; RUN: llc -march=r600 -mcpu=redwood < %s | FileCheck -check-prefix=EG -check-prefix=FUNC %s
4 ; FUNC-LABEL: {{^}}sdiv24_i8:
; Signed division of two i8 values taken from consecutive elements of %in.
; Element 0 is the numerator and element 1 the denominator; the quotient is
; stored to %out. Both operands are only 8 bits wide.
; NOTE(review): presumably meant to exercise the 24-bit division lowering
; hinted at by the function name - the expected-output checks are not visible
; in this view, so confirm against the full test.
14 define void @sdiv24_i8(i8 addrspace(1)* %out, i8 addrspace(1)* %in) {
; Address of element 1 of %in, which holds the denominator.
15 %den_ptr = getelementptr i8 addrspace(1)* %in, i8 1
16 %num = load i8 addrspace(1) * %in
17 %den = load i8 addrspace(1) * %den_ptr
18 %result = sdiv i8 %num, %den
19 store i8 %result, i8 addrspace(1)* %out
23 ; FUNC-LABEL: {{^}}sdiv24_i16:
; Signed division of two i16 values taken from consecutive elements of %in.
; Element 0 is the numerator and element 1 the denominator; the quotient is
; stored to %out. All memory accesses are marked 2-byte aligned.
; NOTE(review): presumably meant to exercise the 24-bit division lowering
; hinted at by the function name - confirm against the full test.
33 define void @sdiv24_i16(i16 addrspace(1)* %out, i16 addrspace(1)* %in) {
; Address of element 1 of %in, which holds the denominator.
34 %den_ptr = getelementptr i16 addrspace(1)* %in, i16 1
35 %num = load i16 addrspace(1) * %in, align 2
36 %den = load i16 addrspace(1) * %den_ptr, align 2
37 %result = sdiv i16 %num, %den
38 store i16 %result, i16 addrspace(1)* %out, align 2
42 ; FUNC-LABEL: {{^}}sdiv24_i32:
; Signed i32 division where both operands are first narrowed to signed 24-bit
; values. Element 0 of %in is the numerator and element 1 the denominator;
; the quotient is stored to %out.
52 define void @sdiv24_i32(i32 addrspace(1)* %out, i32 addrspace(1)* %in) {
; Address of element 1 of %in, which holds the denominator.
53 %den_ptr = getelementptr i32 addrspace(1)* %in, i32 1
54 %num = load i32 addrspace(1) * %in, align 4
55 %den = load i32 addrspace(1) * %den_ptr, align 4
; shl by 8 followed by ashr by 8 sign-extends from bit 23, so each operand
; reaching the sdiv is representable in 24 signed bits.
56 %num.i24.0 = shl i32 %num, 8
57 %den.i24.0 = shl i32 %den, 8
58 %num.i24 = ashr i32 %num.i24.0, 8
59 %den.i24 = ashr i32 %den.i24.0, 8
60 %result = sdiv i32 %num.i24, %den.i24
61 store i32 %result, i32 addrspace(1)* %out, align 4
65 ; FUNC-LABEL: {{^}}sdiv25_i32:
66 ; SI-NOT: v_cvt_f32_i32
; Signed i32 division where both operands are narrowed to signed 25-bit
; values, one bit wider than the 24-bit variant. Element 0 of %in is the
; numerator and element 1 the denominator; the quotient is stored to %out.
; The negative check placed before this function forbids v_cvt_f32_i32 in the
; SI output.
; NOTE(review): presumably because 25-bit operands are too wide for the
; float-based 24-bit division path - confirm against the backend.
71 define void @sdiv25_i32(i32 addrspace(1)* %out, i32 addrspace(1)* %in) {
; Address of element 1 of %in, which holds the denominator.
72 %den_ptr = getelementptr i32 addrspace(1)* %in, i32 1
73 %num = load i32 addrspace(1) * %in, align 4
74 %den = load i32 addrspace(1) * %den_ptr, align 4
; shl by 7 followed by ashr by 7 sign-extends from bit 24, leaving 25
; significant signed bits in each operand.
75 %num.i24.0 = shl i32 %num, 7
76 %den.i24.0 = shl i32 %den, 7
77 %num.i24 = ashr i32 %num.i24.0, 7
78 %den.i24 = ashr i32 %den.i24.0, 7
79 %result = sdiv i32 %num.i24, %den.i24
80 store i32 %result, i32 addrspace(1)* %out, align 4
84 ; FUNC-LABEL: {{^}}test_no_sdiv24_i32_1:
85 ; SI-NOT: v_cvt_f32_i32
; Signed i32 division with mixed operand widths. The numerator is narrowed to
; 24 signed bits but the denominator keeps 25 signed bits. Element 0 of %in is
; the numerator and element 1 the denominator; the quotient is stored to %out.
; The negative check placed before this function forbids v_cvt_f32_i32 in the
; SI output.
; NOTE(review): presumably a single over-wide operand is enough to rule out
; the 24-bit division path - confirm against the backend.
90 define void @test_no_sdiv24_i32_1(i32 addrspace(1)* %out, i32 addrspace(1)* %in) {
; Address of element 1 of %in, which holds the denominator.
91 %den_ptr = getelementptr i32 addrspace(1)* %in, i32 1
92 %num = load i32 addrspace(1) * %in, align 4
93 %den = load i32 addrspace(1) * %den_ptr, align 4
; Numerator uses shift amount 8 (sign-extend from bit 23, 24 bits);
; denominator uses shift amount 7 (sign-extend from bit 24, 25 bits).
94 %num.i24.0 = shl i32 %num, 8
95 %den.i24.0 = shl i32 %den, 7
96 %num.i24 = ashr i32 %num.i24.0, 8
97 %den.i24 = ashr i32 %den.i24.0, 7
98 %result = sdiv i32 %num.i24, %den.i24
99 store i32 %result, i32 addrspace(1)* %out, align 4
103 ; FUNC-LABEL: {{^}}test_no_sdiv24_i32_2:
104 ; SI-NOT: v_cvt_f32_i32
; Signed i32 division with mixed operand widths, the mirror image of
; test_no_sdiv24_i32_1. The numerator keeps 25 signed bits while the
; denominator is narrowed to 24 signed bits. Element 0 of %in is the numerator
; and element 1 the denominator; the quotient is stored to %out.
; The negative check placed before this function forbids v_cvt_f32_i32 in the
; SI output.
109 define void @test_no_sdiv24_i32_2(i32 addrspace(1)* %out, i32 addrspace(1)* %in) {
; Address of element 1 of %in, which holds the denominator.
110 %den_ptr = getelementptr i32 addrspace(1)* %in, i32 1
111 %num = load i32 addrspace(1) * %in, align 4
112 %den = load i32 addrspace(1) * %den_ptr, align 4
; Numerator uses shift amount 7 (sign-extend from bit 24, 25 bits);
; denominator uses shift amount 8 (sign-extend from bit 23, 24 bits).
113 %num.i24.0 = shl i32 %num, 7
114 %den.i24.0 = shl i32 %den, 8
115 %num.i24 = ashr i32 %num.i24.0, 7
116 %den.i24 = ashr i32 %den.i24.0, 8
117 %result = sdiv i32 %num.i24, %den.i24
118 store i32 %result, i32 addrspace(1)* %out, align 4
122 ; FUNC-LABEL: {{^}}srem24_i8:
; Signed remainder of two i8 values taken from consecutive elements of %in.
; Element 0 is the numerator and element 1 the denominator; the remainder is
; stored to %out. Both operands are only 8 bits wide.
; NOTE(review): presumably meant to exercise the 24-bit remainder lowering
; hinted at by the function name - the expected-output checks are not visible
; in this view, so confirm against the full test.
132 define void @srem24_i8(i8 addrspace(1)* %out, i8 addrspace(1)* %in) {
; Address of element 1 of %in, which holds the denominator.
133 %den_ptr = getelementptr i8 addrspace(1)* %in, i8 1
134 %num = load i8 addrspace(1) * %in
135 %den = load i8 addrspace(1) * %den_ptr
136 %result = srem i8 %num, %den
137 store i8 %result, i8 addrspace(1)* %out
141 ; FUNC-LABEL: {{^}}srem24_i16:
; Signed remainder of two i16 values taken from consecutive elements of %in.
; Element 0 is the numerator and element 1 the denominator; the remainder is
; stored to %out. All memory accesses are marked 2-byte aligned.
; NOTE(review): presumably meant to exercise the 24-bit remainder lowering
; hinted at by the function name - confirm against the full test.
151 define void @srem24_i16(i16 addrspace(1)* %out, i16 addrspace(1)* %in) {
; Address of element 1 of %in, which holds the denominator.
152 %den_ptr = getelementptr i16 addrspace(1)* %in, i16 1
153 %num = load i16 addrspace(1) * %in, align 2
154 %den = load i16 addrspace(1) * %den_ptr, align 2
155 %result = srem i16 %num, %den
156 store i16 %result, i16 addrspace(1)* %out, align 2
160 ; FUNC-LABEL: {{^}}srem24_i32:
; Signed i32 remainder where both operands are first narrowed to signed 24-bit
; values. Element 0 of %in is the numerator and element 1 the denominator;
; the remainder is stored to %out.
170 define void @srem24_i32(i32 addrspace(1)* %out, i32 addrspace(1)* %in) {
; Address of element 1 of %in, which holds the denominator.
171 %den_ptr = getelementptr i32 addrspace(1)* %in, i32 1
172 %num = load i32 addrspace(1) * %in, align 4
173 %den = load i32 addrspace(1) * %den_ptr, align 4
; shl by 8 followed by ashr by 8 sign-extends from bit 23, so each operand
; reaching the srem is representable in 24 signed bits.
174 %num.i24.0 = shl i32 %num, 8
175 %den.i24.0 = shl i32 %den, 8
176 %num.i24 = ashr i32 %num.i24.0, 8
177 %den.i24 = ashr i32 %den.i24.0, 8
178 %result = srem i32 %num.i24, %den.i24
179 store i32 %result, i32 addrspace(1)* %out, align 4
183 ; FUNC-LABEL: {{^}}srem25_i32:
184 ; SI-NOT: v_cvt_f32_i32
; Signed i32 remainder where both operands are narrowed to signed 25-bit
; values, one bit wider than the 24-bit variant. Element 0 of %in is the
; numerator and element 1 the denominator; the remainder is stored to %out.
; The negative check placed before this function forbids v_cvt_f32_i32 in the
; SI output.
; NOTE(review): presumably because 25-bit operands are too wide for the
; float-based 24-bit path - confirm against the backend.
189 define void @srem25_i32(i32 addrspace(1)* %out, i32 addrspace(1)* %in) {
; Address of element 1 of %in, which holds the denominator.
190 %den_ptr = getelementptr i32 addrspace(1)* %in, i32 1
191 %num = load i32 addrspace(1) * %in, align 4
192 %den = load i32 addrspace(1) * %den_ptr, align 4
; shl by 7 followed by ashr by 7 sign-extends from bit 24, leaving 25
; significant signed bits in each operand.
193 %num.i24.0 = shl i32 %num, 7
194 %den.i24.0 = shl i32 %den, 7
195 %num.i24 = ashr i32 %num.i24.0, 7
196 %den.i24 = ashr i32 %den.i24.0, 7
197 %result = srem i32 %num.i24, %den.i24
198 store i32 %result, i32 addrspace(1)* %out, align 4
202 ; FUNC-LABEL: {{^}}test_no_srem24_i32_1:
203 ; SI-NOT: v_cvt_f32_i32
; Signed i32 remainder with mixed operand widths. The numerator is narrowed to
; 24 signed bits but the denominator keeps 25 signed bits. Element 0 of %in is
; the numerator and element 1 the denominator; the remainder is stored to
; %out. The negative check placed before this function forbids v_cvt_f32_i32
; in the SI output.
; NOTE(review): presumably a single over-wide operand is enough to rule out
; the 24-bit path - confirm against the backend.
208 define void @test_no_srem24_i32_1(i32 addrspace(1)* %out, i32 addrspace(1)* %in) {
; Address of element 1 of %in, which holds the denominator.
209 %den_ptr = getelementptr i32 addrspace(1)* %in, i32 1
210 %num = load i32 addrspace(1) * %in, align 4
211 %den = load i32 addrspace(1) * %den_ptr, align 4
; Numerator uses shift amount 8 (sign-extend from bit 23, 24 bits);
; denominator uses shift amount 7 (sign-extend from bit 24, 25 bits).
212 %num.i24.0 = shl i32 %num, 8
213 %den.i24.0 = shl i32 %den, 7
214 %num.i24 = ashr i32 %num.i24.0, 8
215 %den.i24 = ashr i32 %den.i24.0, 7
216 %result = srem i32 %num.i24, %den.i24
217 store i32 %result, i32 addrspace(1)* %out, align 4
221 ; FUNC-LABEL: {{^}}test_no_srem24_i32_2:
222 ; SI-NOT: v_cvt_f32_i32
; Signed i32 remainder with mixed operand widths, the mirror image of
; test_no_srem24_i32_1. The numerator keeps 25 signed bits while the
; denominator is narrowed to 24 signed bits. Element 0 of %in is the numerator
; and element 1 the denominator; the remainder is stored to %out.
; The negative check placed before this function forbids v_cvt_f32_i32 in the
; SI output.
227 define void @test_no_srem24_i32_2(i32 addrspace(1)* %out, i32 addrspace(1)* %in) {
; Address of element 1 of %in, which holds the denominator.
228 %den_ptr = getelementptr i32 addrspace(1)* %in, i32 1
229 %num = load i32 addrspace(1) * %in, align 4
230 %den = load i32 addrspace(1) * %den_ptr, align 4
; Numerator uses shift amount 7 (sign-extend from bit 24, 25 bits);
; denominator uses shift amount 8 (sign-extend from bit 23, 24 bits).
231 %num.i24.0 = shl i32 %num, 7
232 %den.i24.0 = shl i32 %den, 8
233 %num.i24 = ashr i32 %num.i24.0, 7
234 %den.i24 = ashr i32 %den.i24.0, 8
235 %result = srem i32 %num.i24, %den.i24
236 store i32 %result, i32 addrspace(1)* %out, align 4