0
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
1 ; RUN: llc -verify-machineinstrs < %s -mtriple=aarch64-none-linux-gnu -tailcallopt | FileCheck %s
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
2
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
3 declare fastcc void @callee_stack0()
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
4 declare fastcc void @callee_stack8([8 x i32], i64)
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
5 declare fastcc void @callee_stack16([8 x i32], i64, i64)
|
77
|
6 declare extern_weak fastcc void @callee_weak()
|
0
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
7
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
8 define fastcc void @caller_to0_from0() nounwind {
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
9 ; CHECK-LABEL: caller_to0_from0:
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
10 ; CHECK-NEXT: // BB
|
77
|
11
|
0
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
12 tail call fastcc void @callee_stack0()
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
13 ret void
|
77
|
14
|
0
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
15 ; CHECK-NEXT: b callee_stack0
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
16 }
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
17
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
18 define fastcc void @caller_to0_from8([8 x i32], i64) {
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
19 ; CHECK-LABEL: caller_to0_from8:
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
20
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
21 tail call fastcc void @callee_stack0()
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
22 ret void
|
77
|
23
|
0
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
24 ; CHECK: add sp, sp, #16
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
25 ; CHECK-NEXT: b callee_stack0
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
26 }
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
27
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
28 define fastcc void @caller_to8_from0() {
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
29 ; CHECK-LABEL: caller_to8_from0:
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
30 ; CHECK: sub sp, sp, #32
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
31
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
32 ; Key point is that the "42" should go #16 below incoming stack
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
33 ; pointer (we didn't have arg space to reuse).
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
34 tail call fastcc void @callee_stack8([8 x i32] undef, i64 42)
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
35 ret void
|
77
|
36
|
|
37 ; CHECK: str {{x[0-9]+}}, [sp, #16]!
|
0
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
38 ; CHECK-NEXT: b callee_stack8
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
39 }
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
40
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
41 define fastcc void @caller_to8_from8([8 x i32], i64 %a) {
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
42 ; CHECK-LABEL: caller_to8_from8:
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
43 ; CHECK: sub sp, sp, #16
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
44
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
45 ; Key point is that the outgoing argument should go where "%a" was: at SP on entry.
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
46 tail call fastcc void @callee_stack8([8 x i32] undef, i64 42)
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
47 ret void
|
77
|
48
|
|
49 ; CHECK: str {{x[0-9]+}}, [sp, #16]!
|
0
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
50 ; CHECK-NEXT: b callee_stack8
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
51 }
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
52
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
53 define fastcc void @caller_to16_from8([8 x i32], i64 %a) {
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
54 ; CHECK-LABEL: caller_to16_from8:
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
55 ; CHECK: sub sp, sp, #16
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
56
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
57 ; Important point is that the call reuses the "dead" argument space
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
58 ; above %a on the stack. If it tries to go below incoming-SP then the
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
59 ; callee will not deallocate the space, even in fastcc.
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
60 tail call fastcc void @callee_stack16([8 x i32] undef, i64 42, i64 2)
|
77
|
61
|
95
|
62 ; CHECK: stp {{x[0-9]+}}, {{x[0-9]+}}, [sp, #16]!
|
77
|
63 ; CHECK-NEXT: b callee_stack16
|
0
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
64 ret void
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
65 }
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
66
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
67
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
68 define fastcc void @caller_to8_from24([8 x i32], i64 %a, i64 %b, i64 %c) {
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
69 ; CHECK-LABEL: caller_to8_from24:
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
70 ; CHECK: sub sp, sp, #16
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
71
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
72 ; Key point is that the outgoing argument should go 16 bytes above SP on entry.
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
73 tail call fastcc void @callee_stack8([8 x i32] undef, i64 42)
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
74 ret void
|
77
|
75
|
|
76 ; CHECK: str {{x[0-9]+}}, [sp, #32]!
|
0
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
77 ; CHECK-NEXT: b callee_stack8
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
78 }
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
79
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
80
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
81 define fastcc void @caller_to16_from16([8 x i32], i64 %a, i64 %b) {
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
82 ; CHECK-LABEL: caller_to16_from16:
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
83 ; CHECK: sub sp, sp, #16
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
84
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
85 ; Here we want to make sure that both loads happen before the stores:
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
86 ; otherwise either %a or %b will be wrongly clobbered.
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
87 tail call fastcc void @callee_stack16([8 x i32] undef, i64 %b, i64 %a)
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
88 ret void
|
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
89
|
77
|
90 ; CHECK: ldp {{x[0-9]+}}, {{x[0-9]+}}, [sp, #16]
|
95
|
91 ; CHECK: stp {{x[0-9]+}}, {{x[0-9]+}}, [sp, #16]!
|
77
|
92 ; CHECK-NEXT: b callee_stack16
|
|
93 }
|
|
94
|
0
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
95
|
77
|
96 ; Weakly-referenced extern functions cannot be tail-called, as AAELF does
|
|
97 ; not define the behaviour of branch instructions to undefined weak symbols.
|
|
98 define fastcc void @caller_weak() {
|
|
99 ; CHECK-LABEL: caller_weak:
|
|
100 ; CHECK: bl callee_weak
|
|
101 tail call void @callee_weak()
|
|
102 ret void
|
0
Kaito Tokumori <e105711@ie.u-ryukyu.ac.jp>
parents:
diff
changeset
|
103 }
|
95
|
104
|
|
105 declare { [2 x float] } @get_vec2()
|
|
106
|
|
107 define { [3 x float] } @test_add_elem() {
|
|
108 ; CHECK-LABEL: test_add_elem:
|
|
109 ; CHECK: bl get_vec2
|
|
110 ; CHECK: fmov s2, #1.0
|
|
111 ; CHECK: ret
|
|
112
|
|
113 %call = tail call { [2 x float] } @get_vec2()
|
|
114 %arr = extractvalue { [2 x float] } %call, 0
|
|
115 %arr.0 = extractvalue [2 x float] %arr, 0
|
|
116 %arr.1 = extractvalue [2 x float] %arr, 1
|
|
117
|
|
118 %res.0 = insertvalue { [3 x float] } undef, float %arr.0, 0, 0
|
|
119 %res.01 = insertvalue { [3 x float] } %res.0, float %arr.1, 0, 1
|
|
120 %res.012 = insertvalue { [3 x float] } %res.01, float 1.000000e+00, 0, 2
|
|
121 ret { [3 x float] } %res.012
|
|
122 }
|
|
123
|
|
124 declare double @get_double()
|
|
125 define { double, [2 x double] } @test_mismatched_insert() {
|
|
126 ; CHECK-LABEL: test_mismatched_insert:
|
|
127 ; CHECK: bl get_double
|
|
128 ; CHECK: bl get_double
|
|
129 ; CHECK: bl get_double
|
|
130 ; CHECK: ret
|
|
131
|
|
132 %val0 = call double @get_double()
|
|
133 %val1 = call double @get_double()
|
|
134 %val2 = tail call double @get_double()
|
|
135
|
|
136 %res.0 = insertvalue { double, [2 x double] } undef, double %val0, 0
|
|
137 %res.01 = insertvalue { double, [2 x double] } %res.0, double %val1, 1, 0
|
|
138 %res.012 = insertvalue { double, [2 x double] } %res.01, double %val2, 1, 1
|
|
139
|
|
140 ret { double, [2 x double] } %res.012
|
|
141 }
|