1 ; RUN: llc -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 < %s | FileCheck %s
2 ; RUN: llc -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 -disable-fp-elim < %s | FileCheck -check-prefix=CHECK-FP %s
3 ; RUN: llc -mtriple=powerpc-unknown-linux-gnu -disable-fp-elim < %s | FileCheck -check-prefix=CHECK-32 %s
4 ; RUN: llc -mtriple=powerpc-unknown-linux-gnu -disable-fp-elim -relocation-model=pic < %s | FileCheck -check-prefix=CHECK-32-PIC %s
5 target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-f128:128:128-v128:128:128-n32:64"
6 target triple = "powerpc64-unknown-linux-gnu"
8 %struct.s = type { i32, i32 }
10 declare void @bar(i32*)
12 @barbaz = external global i32
14 define void @goo(%struct.s* byval nocapture readonly %a) {
16 %x = alloca [2 x i32], align 32
17 %a1 = getelementptr inbounds %struct.s* %a, i64 0, i32 0
18 %0 = load i32* %a1, align 4
19 %arrayidx = getelementptr inbounds [2 x i32]* %x, i64 0, i64 0
20 store i32 %0, i32* %arrayidx, align 32
21 %b = getelementptr inbounds %struct.s* %a, i64 0, i32 1
22 %1 = load i32* %b, align 4
23 %2 = load i32* @barbaz, align 4
24 %arrayidx2 = getelementptr inbounds [2 x i32]* %x, i64 0, i64 1
25 store i32 %2, i32* %arrayidx2, align 4
26 call void @bar(i32* %arrayidx)
33 ; CHECK-DAG: rldicl [[REG:[0-9]+]], 1, 0, 59
34 ; CHECK-DAG: std 30, -16(1)
36 ; CHECK-DAG: std 0, 16(1)
37 ; CHECK-DAG: subfic 0, [[REG]], -160
38 ; CHECK: stdux 1, 1, 0
40 ; CHECK: .cfi_offset r30, -16
41 ; CHECK: .cfi_offset lr, 16
43 ; CHECK: std 3, 48(30)
46 ; CHECK-DAG: ld 0, 16(1)
47 ; CHECK-DAG: ld 30, -16(1)
51 ; CHECK-FP-LABEL: @goo
53 ; CHECK-FP-DAG: mflr 0
54 ; CHECK-FP-DAG: rldicl [[REG:[0-9]+]], 1, 0, 59
55 ; CHECK-FP-DAG: std 31, -8(1)
56 ; CHECK-FP-DAG: std 30, -16(1)
57 ; CHECK-FP-DAG: mr 30, 1
58 ; CHECK-FP-DAG: std 0, 16(1)
59 ; CHECK-FP-DAG: subfic 0, [[REG]], -160
60 ; CHECK-FP: stdux 1, 1, 0
62 ; CHECK-FP: .cfi_offset r31, -8
63 ; CHECK-FP: .cfi_offset r30, -16
64 ; CHECK-FP: .cfi_offset lr, 16
68 ; CHECK-FP: std 3, 48(30)
70 ; CHECK-FP: ld 1, 0(1)
71 ; CHECK-FP-DAG: ld 0, 16(1)
72 ; CHECK-FP-DAG: ld 31, -8(1)
73 ; CHECK-FP-DAG: ld 30, -16(1)
74 ; CHECK-FP-DAG: mtlr 0
77 ; CHECK-32-LABEL: @goo
78 ; CHECK-32-DAG: mflr 0
79 ; CHECK-32-DAG: rlwinm [[REG:[0-9]+]], 1, 0, 27, 31
80 ; CHECK-32-DAG: stw 30, -8(1)
81 ; CHECK-32-DAG: mr 30, 1
82 ; CHECK-32-DAG: stw 0, 4(1)
83 ; CHECK-32-DAG: subfic 0, [[REG]], -64
84 ; CHECK-32: stwux 1, 1, 0
86 ; CHECK-32-PIC-LABEL: @goo
87 ; CHECK-32-PIC-DAG: mflr 0
88 ; CHECK-32-PIC-DAG: rlwinm [[REG:[0-9]+]], 1, 0, 27, 31
89 ; CHECK-32-PIC-DAG: stw 29, -12(1)
90 ; CHECK-32-PIC-DAG: mr 29, 1
91 ; CHECK-32-PIC-DAG: stw 0, 4(1)
92 ; CHECK-32-PIC-DAG: subfic 0, [[REG]], -64
93 ; CHECK-32-PIC: stwux 1, 1, 0
95 ; The large-frame-size case.
96 define void @hoo(%struct.s* byval nocapture readonly %a) {
98 %x = alloca [200000 x i32], align 32
99 %a1 = getelementptr inbounds %struct.s* %a, i64 0, i32 0
100 %0 = load i32* %a1, align 4
101 %arrayidx = getelementptr inbounds [200000 x i32]* %x, i64 0, i64 0
102 store i32 %0, i32* %arrayidx, align 32
103 %b = getelementptr inbounds %struct.s* %a, i64 0, i32 1
104 %1 = load i32* %b, align 4
105 %arrayidx2 = getelementptr inbounds [200000 x i32]* %x, i64 0, i64 1
106 store i32 %1, i32* %arrayidx2, align 4
107 call void @bar(i32* %arrayidx)
113 ; CHECK-DAG: lis [[REG1:[0-9]+]], -13
114 ; CHECK-DAG: rldicl [[REG3:[0-9]+]], 1, 0, 59
116 ; CHECK-DAG: ori [[REG2:[0-9]+]], [[REG1]], 51808
117 ; CHECK-DAG: std 30, -16(1)
118 ; CHECK-DAG: mr 30, 1
119 ; CHECK-DAG: std 0, 16(1)
120 ; CHECK-DAG: subfc 0, [[REG3]], [[REG2]]
121 ; CHECK: stdux 1, 1, 0
125 ; CHECK-32-LABEL: @hoo
127 ; CHECK-32-DAG: lis [[REG1:[0-9]+]], -13
128 ; CHECK-32-DAG: rlwinm [[REG3:[0-9]+]], 1, 0, 27, 31
129 ; CHECK-32-DAG: mflr 0
130 ; CHECK-32-DAG: ori [[REG2:[0-9]+]], [[REG1]], 51904
131 ; CHECK-32-DAG: stw 30, -8(1)
132 ; CHECK-32-DAG: mr 30, 1
133 ; CHECK-32-DAG: stw 0, 4(1)
134 ; CHECK-32-DAG: subfc 0, [[REG3]], [[REG2]]
135 ; CHECK-32: stwux 1, 1, 0
139 ; CHECK-32-PIC-LABEL: @hoo
141 ; CHECK-32-PIC-DAG: lis [[REG1:[0-9]+]], -13
142 ; CHECK-32-PIC-DAG: rlwinm [[REG3:[0-9]+]], 1, 0, 27, 31
143 ; CHECK-32-PIC-DAG: mflr 0
144 ; CHECK-32-PIC-DAG: ori [[REG2:[0-9]+]], [[REG1]], 51904
145 ; CHECK-32-PIC-DAG: stw 29, -12(1)
146 ; CHECK-32-PIC-DAG: mr 29, 1
147 ; CHECK-32-PIC-DAG: stw 0, 4(1)
148 ; CHECK-32-PIC-DAG: subfc 0, [[REG3]], [[REG2]]
149 ; CHECK-32: stwux 1, 1, 0
153 ; Make sure that the FP save area is still allocated correctly relative to
154 ; where r30 is saved.
155 define void @loo(%struct.s* byval nocapture readonly %a) {
157 %x = alloca [2 x i32], align 32
158 %a1 = getelementptr inbounds %struct.s* %a, i64 0, i32 0
159 %0 = load i32* %a1, align 4
160 %arrayidx = getelementptr inbounds [2 x i32]* %x, i64 0, i64 0
161 store i32 %0, i32* %arrayidx, align 32
162 %b = getelementptr inbounds %struct.s* %a, i64 0, i32 1
163 %1 = load i32* %b, align 4
164 %arrayidx2 = getelementptr inbounds [2 x i32]* %x, i64 0, i64 1
165 store i32 %1, i32* %arrayidx2, align 4
166 call void @bar(i32* %arrayidx)
167 call void asm sideeffect "", "~{f30}"() nounwind
174 ; CHECK-DAG: rldicl [[REG:[0-9]+]], 1, 0, 59
175 ; CHECK-DAG: std 30, -32(1)
176 ; CHECK-DAG: mr 30, 1
177 ; CHECK-DAG: std 0, 16(1)
178 ; CHECK-DAG: subfic 0, [[REG]], -192
179 ; CHECK: stdux 1, 1, 0
181 ; CHECK: stfd 30, -16(30)
185 ; CHECK-FP-LABEL: @loo
187 ; CHECK-FP-DAG: mflr 0
188 ; CHECK-FP-DAG: rldicl [[REG:[0-9]+]], 1, 0, 59
189 ; CHECK-FP-DAG: std 31, -24(1)
190 ; CHECK-FP-DAG: std 30, -32(1)
191 ; CHECK-FP-DAG: mr 30, 1
192 ; CHECK-FP-DAG: std 0, 16(1)
193 ; CHECK-FP-DAG: subfic 0, [[REG]], -192
194 ; CHECK-FP: stdux 1, 1, 0
196 ; CHECK-FP: stfd 30, -16(30)