1 ; RUN: llc -verify-machineinstrs < %s -mtriple=aarch64-none-linux-gnu -tailcallopt | FileCheck %s
; External fastcc callees used as tail-call targets below. The numeric suffix
; in each name equals the total size in bytes of the i64 parameters that
; follow the leading [8 x i32] parameter (0, 8 or 16).
; NOTE(review): presumably the [8 x i32] is there to use up the integer
; argument registers so the i64s are passed on the stack -- confirm.
3 declare fastcc void @callee_stack0()
4 declare fastcc void @callee_stack8([8 x i32], i64)
5 declare fastcc void @callee_stack16([8 x i32], i64, i64)
; extern_weak callee, referenced only by @caller_weak in this file.
6 declare extern_weak fastcc void @callee_weak()
; Neither caller nor callee takes any arguments. The branch to callee_stack0
; is expected on the line immediately following the function label.
8 define fastcc void @caller_to0_from0() nounwind {
9 ; CHECK-LABEL: caller_to0_from0:
12 tail call fastcc void @callee_stack0()
15 ; CHECK-NEXT: b callee_stack0
; The caller receives one i64 after the [8 x i32]; the callee takes nothing.
; SP is expected to be raised by 16 immediately before the branch.
; NOTE(review): presumably this releases the caller's own incoming argument
; area, which the callee will not use -- confirm.
18 define fastcc void @caller_to0_from8([8 x i32], i64) {
19 ; CHECK-LABEL: caller_to0_from8:
21 tail call fastcc void @callee_stack0()
24 ; CHECK: add sp, sp, #16
25 ; CHECK-NEXT: b callee_stack0
; The caller takes no arguments; the callee takes one i64 after the
; [8 x i32]. After "sub sp, sp, #32", the pre-indexed store to [sp, #16]!
; both writes the value and leaves SP 16 bytes below its value on entry.
28 define fastcc void @caller_to8_from0() {
29 ; CHECK-LABEL: caller_to8_from0:
30 ; CHECK: sub sp, sp, #32
32 ; Key point is that the "42" should go #16 below incoming stack
33 ; pointer (we didn't have arg space to reuse).
34 tail call fastcc void @callee_stack8([8 x i32] undef, i64 42)
37 ; CHECK: str {{x[0-9]+}}, [sp, #16]!
38 ; CHECK-NEXT: b callee_stack8
; Caller and callee each take one i64 after the [8 x i32]. After
; "sub sp, sp, #16", the pre-indexed store to [sp, #16]! writes at the
; address SP had on entry and restores SP to that value before the branch.
41 define fastcc void @caller_to8_from8([8 x i32], i64 %a) {
42 ; CHECK-LABEL: caller_to8_from8:
43 ; CHECK: sub sp, sp, #16
45 ; Key point is that the "42" should be stored at SP on entry, reusing the incoming slot of "%a".
46 tail call fastcc void @callee_stack8([8 x i32] undef, i64 42)
49 ; CHECK: str {{x[0-9]+}}, [sp, #16]!
50 ; CHECK-NEXT: b callee_stack8
; The caller receives one i64 after the [8 x i32]; the callee takes two.
; After "sub sp, sp, #16", the pair is stored at [sp, #16], i.e. starting at
; the address SP had on entry, and SP is then restored before the branch.
53 define fastcc void @caller_to16_from8([8 x i32], i64 %a) {
54 ; CHECK-LABEL: caller_to16_from8:
55 ; CHECK: sub sp, sp, #16
57 ; Important point is that the call reuses the "dead" argument space
58 ; above %a on the stack. If it tries to go below incoming-SP then the
59 ; callee will not deallocate the space, even in fastcc.
60 tail call fastcc void @callee_stack16([8 x i32] undef, i64 42, i64 2)
62 ; CHECK: stp {{x[0-9]+}}, {{x[0-9]+}}, [sp, #16]
63 ; CHECK-NEXT: add sp, sp, #16
64 ; CHECK-NEXT: b callee_stack16
; The caller receives three i64s after the [8 x i32]; the callee takes one.
; After "sub sp, sp, #16", the pre-indexed store to [sp, #32]! writes 16
; bytes above the address SP had on entry and leaves SP pointing there.
69 define fastcc void @caller_to8_from24([8 x i32], i64 %a, i64 %b, i64 %c) {
70 ; CHECK-LABEL: caller_to8_from24:
71 ; CHECK: sub sp, sp, #16
73 ; Key point is that the "42" should go at #16 above SP on entry.
74 tail call fastcc void @callee_stack8([8 x i32] undef, i64 42)
77 ; CHECK: str {{x[0-9]+}}, [sp, #32]!
78 ; CHECK-NEXT: b callee_stack8
; Caller and callee each take two i64s after the [8 x i32], and the call
; passes them in swapped order (%b, %a). The paired load and the paired
; store are expected to use the same address, [sp, #16], with the load
; appearing first.
82 define fastcc void @caller_to16_from16([8 x i32], i64 %a, i64 %b) {
83 ; CHECK-LABEL: caller_to16_from16:
84 ; CHECK: sub sp, sp, #16
86 ; Here we want to make sure that both loads happen before the stores:
87 ; otherwise either %a or %b will be wrongly clobbered.
88 tail call fastcc void @callee_stack16([8 x i32] undef, i64 %b, i64 %a)
91 ; CHECK: ldp {{x[0-9]+}}, {{x[0-9]+}}, [sp, #16]
92 ; CHECK: stp {{x[0-9]+}}, {{x[0-9]+}}, [sp, #16]
93 ; CHECK-NEXT: add sp, sp, #16
94 ; CHECK-NEXT: b callee_stack16
98 ; Weakly-referenced extern functions cannot be tail-called, as AAELF does
99 ; not define the behaviour of branch instructions to undefined weak symbols.
; The call to the extern_weak callee is marked "tail", but a branch-with-link
; (bl) is expected rather than a plain branch.
100 define fastcc void @caller_weak() {
101 ; CHECK-LABEL: caller_weak:
102 ; CHECK: bl callee_weak
; NOTE(review): @callee_weak is declared fastcc, but this call site uses the
; default calling convention. Confirm whether the mismatch is intentional.
103 tail call void @callee_weak()
; The { [2 x float] } returned by the call marked "tail" is not returned
; as-is: its two elements are copied into a { [3 x float] } whose third
; element is the constant 1.0. The constant is expected to be materialised
; in s2.
107 declare { [2 x float] } @get_vec2()
109 define { [3 x float] } @test_add_elem() {
110 ; CHECK-LABEL: test_add_elem:
112 ; CHECK: fmov s2, #1.0
115 %call = tail call { [2 x float] } @get_vec2()
116 %arr = extractvalue { [2 x float] } %call, 0
117 %arr.0 = extractvalue [2 x float] %arr, 0
118 %arr.1 = extractvalue [2 x float] %arr, 1
120 %res.0 = insertvalue { [3 x float] } undef, float %arr.0, 0, 0
121 %res.01 = insertvalue { [3 x float] } %res.0, float %arr.1, 0, 1
122 %res.012 = insertvalue { [3 x float] } %res.01, float 1.000000e+00, 0, 2
123 ret { [3 x float] } %res.012
; Three calls to @get_double fill the three double fields of the returned
; aggregate. Only the last call is marked "tail", and its result is inserted
; at index (1, 1) rather than being returned directly. All three calls are
; expected to be emitted as bl.
126 declare double @get_double()
127 define { double, [2 x double] } @test_mismatched_insert() {
128 ; CHECK-LABEL: test_mismatched_insert:
129 ; CHECK: bl get_double
130 ; CHECK: bl get_double
131 ; CHECK: bl get_double
134 %val0 = call double @get_double()
135 %val1 = call double @get_double()
136 %val2 = tail call double @get_double()
138 %res.0 = insertvalue { double, [2 x double] } undef, double %val0, 0
139 %res.01 = insertvalue { double, [2 x double] } %res.0, double %val1, 1, 0
140 %res.012 = insertvalue { double, [2 x double] } %res.01, double %val2, 1, 1
142 ret { double, [2 x double] } %res.012