1; RUN: llc < %s -asm-verbose=false -disable-wasm-fallthrough-return-opt | FileCheck %s
2
3target datalayout = "e-m:e-p:32:32-i64:64-n32:64-S128"
4target triple = "wasm32-unknown-unknown"
5
6declare void @ext_func(i64* %ptr)
7declare void @ext_func_i32(i32* %ptr)
8
; Static alloca of one i32 in a noredzone function. The expected output has a
; prologue that loads __stack_pointer, subtracts 16, keeps the result in a
; local (captured as SP) and stores it back; a store of 0 at offset 12 from SP;
; and an epilogue that stores SP + 16 back to __stack_pointer.
9; CHECK-LABEL: alloca32:
10; Check that there is an extra local for the stack pointer.
11; CHECK: .local i32{{$}}
12define void @alloca32() noredzone {
 ; Prologue: decrement the stack pointer by 16 and write it back to memory.
13 ; CHECK: i32.const $push[[L4:.+]]=, 0{{$}}
14 ; CHECK: i32.const $push[[L1:.+]]=, 0{{$}}
15 ; CHECK-NEXT: i32.load $push[[L2:.+]]=, __stack_pointer($pop[[L1]])
16 ; CHECK-NEXT: i32.const $push[[L3:.+]]=, 16
17 ; CHECK-NEXT: i32.sub $push[[L9:.+]]=, $pop[[L2]], $pop[[L3]]
18 ; CHECK-NEXT: tee_local $push[[L8:.+]]=, $[[SP:.+]]=, $pop[[L9]]{{$}}
19 ; CHECK-NEXT: i32.store __stack_pointer($pop[[L4]]), $pop[[L8]]{{$}}
20 %retval = alloca i32
 ; The store to %retval is expected at offset 12 from the SP local.
21 ; CHECK: i32.const $push[[L0:.+]]=, 0
22 ; CHECK: i32.store 12($[[SP]]), $pop[[L0]]
23 store i32 0, i32* %retval
 ; Epilogue: add the 16 bytes back and store the result to __stack_pointer.
24 ; CHECK: i32.const $push[[L6:.+]]=, 0
25 ; CHECK-NEXT: i32.const $push[[L5:.+]]=, 16
26 ; CHECK-NEXT: i32.add $push[[L7:.+]]=, $[[SP]], $pop[[L5]]
27 ; CHECK-NEXT: i32.store __stack_pointer($pop[[L6]]), $pop[[L7]]
28 ret void
29}
30
; Two static allocas (an i32 and a double) in a function that is NOT marked
; noredzone. From the first i32.const through the final return every expected
; line is chained to the previous one, and none of them stores to
; __stack_pointer: the decremented value only lives in a local (captured as SP).
; NOTE(review): presumably this is the red-zone case where the frame fits
; without updating the in-memory stack pointer -- confirm against the backend.
31; CHECK-LABEL: alloca3264:
32; CHECK: .local i32{{$}}
33define void @alloca3264() {
34 ; CHECK: i32.const $push[[L2:.+]]=, 0{{$}}
35 ; CHECK-NEXT: i32.load $push[[L3:.+]]=, __stack_pointer($pop[[L2]])
36 ; CHECK-NEXT: i32.const $push[[L4:.+]]=, 16
37 ; CHECK-NEXT: i32.sub $push[[L6:.+]]=, $pop[[L3]], $pop[[L4]]
38 ; CHECK-NEXT: tee_local $push[[L5:.+]]=, $[[SP:.+]]=, $pop[[L6]]
39 %r1 = alloca i32
40 %r2 = alloca double
 ; The i32 store to %r1 is expected at offset 12, consuming the tee'd value.
41 ; CHECK-NEXT: i32.const $push[[L0:.+]]=, 0
42 ; CHECK-NEXT: i32.store 12($pop[[L5]]), $pop[[L0]]
43 store i32 0, i32* %r1
 ; The store of double 0.0 to %r2 is expected as an i64 store of 0 at offset 0.
44 ; CHECK-NEXT: i64.const $push[[L1:.+]]=, 0
45 ; CHECK-NEXT: i64.store 0($[[SP]]), $pop[[L1]]
46 store double 0.0, double* %r2
47 ; CHECK-NEXT: return
48 ret void
49}
50
; Static alloca of a [33 x i32] array. The expected output has a prologue that
; subtracts 144 from __stack_pointer, keeps the result in a local (captured as
; SP) and stores it back; two stores of 1 into the array, one through an
; explicit SP + 24 address and one with offset 12 folded into the store; and an
; epilogue that stores SP + 144 back to __stack_pointer.
51; CHECK-LABEL: allocarray:
52; CHECK: .local i32{{$}}
53define void @allocarray() {
54 ; CHECK: i32.const $push[[L6:.+]]=, 0{{$}}
55 ; CHECK: i32.const $push[[L3:.+]]=, 0{{$}}
56 ; CHECK-NEXT: i32.load $push[[L4:.+]]=, __stack_pointer($pop[[L3]])
57 ; CHECK-NEXT: i32.const $push[[L5:.+]]=, 144{{$}}
58 ; CHECK-NEXT: i32.sub $push[[L12:.+]]=, $pop[[L4]], $pop[[L5]]
 ; Capture the stack-pointer local here so the SP uses below refer to this
 ; function's local rather than to a value left over from an earlier function.
59 ; CHECK-NEXT: tee_local $push[[L11:.+]]=, $[[SP:.+]]=, $pop[[L12]]
60 ; CHECK-NEXT: i32.store __stack_pointer($pop[[L6]]), $pop[[L11]]
61 %r = alloca [33 x i32]
62
63 ; CHECK:      i32.const $push{{.+}}=, 24
64 ; CHECK-NEXT: i32.add $push[[L3:.+]]=, $[[SP]], $pop{{.+}}
65 ; CHECK-NEXT: i32.const $push[[L1:.+]]=, 1{{$}}
66 ; CHECK-NEXT: i32.store 0($pop[[L3]]), $pop[[L1]]{{$}}
67 ; CHECK-NEXT: i32.const $push[[L10:.+]]=, 1{{$}}
68 ; CHECK-NEXT: i32.store 12(${{.+}}), $pop[[L10]]{{$}}
69 %p = getelementptr [33 x i32], [33 x i32]* %r, i32 0, i32 0
70 store i32 1, i32* %p
71 %p2 = getelementptr [33 x i32], [33 x i32]* %r, i32 0, i32 3
72 store i32 1, i32* %p2
73
 ; Epilogue: restore the stack pointer by adding the 144 bytes back.
74 ; CHECK: i32.const $push[[L9:.+]]=, 0{{$}}
75 ; CHECK-NEXT: i32.const $push[[L7:.+]]=, 144
76 ; CHECK-NEXT: i32.add $push[[L8:.+]]=, $[[SP]], $pop[[L7]]
77 ; CHECK-NEXT: i32.store __stack_pointer($pop[[L9]]), $pop[[L8]]
78 ret void
79}
80
; Uses of static alloca addresses as plain values rather than as the address
; operand of a load or store: two are passed to @ext_func and one is stored
; through the %addr argument. The frame is expected to be 48 bytes, with the
; alloca addresses materialised as SP + 8, SP itself, and SP + 16.
; The label pattern ends in ':' like every other label in this file, so it
; anchors on the function's label line and not on another mention of the name.
81; CHECK-LABEL: non_mem_use:
82define void @non_mem_use(i8** %addr) {
83 ; CHECK: i32.const $push[[L2:.+]]=, 48
84 ; CHECK-NEXT: i32.sub $push[[L12:.+]]=, {{.+}}, $pop[[L2]]
85 ; CHECK-NEXT: tee_local $push[[L11:.+]]=, $[[SP:.+]]=, $pop[[L12]]
86 ; CHECK-NEXT: i32.store {{.+}}, $pop[[L11]]
87 %buf = alloca [27 x i8], align 16
88 %r = alloca i64
89 %r2 = alloca i64
90 ; %r is at SP+8
91 ; CHECK: i32.const $push[[OFF:.+]]=, 8
92 ; CHECK-NEXT: i32.add $push[[ARG1:.+]]=, $[[SP]], $pop[[OFF]]
93 ; CHECK-NEXT: call ext_func@FUNCTION, $pop[[ARG1]]
94 call void @ext_func(i64* %r)
95 ; %r2 is at SP+0, no add needed
96 ; CHECK-NEXT: call ext_func@FUNCTION, $[[SP]]
97 call void @ext_func(i64* %r2)
98 ; Use as a value, but in a store
99 ; %buf is at SP+16
100 ; CHECK: i32.const $push[[OFF:.+]]=, 16
101 ; CHECK-NEXT: i32.add $push[[VAL:.+]]=, $[[SP]], $pop[[OFF]]
102 ; CHECK-NEXT: i32.store 0($0), $pop[[VAL]]
103 %gep = getelementptr inbounds [27 x i8], [27 x i8]* %buf, i32 0, i32 0
104 store i8* %gep, i8** %addr
105 ret void
106}
107
; Static alloca of a [5 x i32] array indexed with inbounds GEPs. The expected
; frame is 32 bytes, and both element stores are expected with their offsets
; (24 and 12) folded directly into the i32.store instructions. The two store
; assertions are order-independent with respect to each other. A call to
; @ext_func follows, and the epilogue stores the local + 32 back to
; __stack_pointer.
108; CHECK-LABEL: allocarray_inbounds:
109; CHECK: .local i32{{$}}
110define void @allocarray_inbounds() {
111 ; CHECK: i32.const $push[[L5:.+]]=, 0{{$}}
112 ; CHECK: i32.const $push[[L2:.+]]=, 0{{$}}
113 ; CHECK-NEXT: i32.load $push[[L3:.+]]=, __stack_pointer($pop[[L2]])
114 ; CHECK-NEXT: i32.const $push[[L4:.+]]=, 32{{$}}
115 ; CHECK-NEXT: i32.sub $push[[L11:.+]]=, $pop[[L3]], $pop[[L4]]
116 ; CHECK-NEXT: tee_local $push[[L10:.+]]=, $[[SP:.+]]=, $pop[[L11]]
117 ; CHECK-NEXT: i32.store __stack_pointer($pop[[L5]]), $pop[[L10]]{{$}}
118 %r = alloca [5 x i32]
119 ; CHECK: i32.const $push[[L3:.+]]=, 1
120 ; CHECK-DAG: i32.store 24(${{.+}}), $pop[[L3]]
121 %p = getelementptr inbounds [5 x i32], [5 x i32]* %r, i32 0, i32 0
122 store i32 1, i32* %p
123 ; This store should have both the GEP and the FI folded into it.
124 ; CHECK-DAG: i32.store 12(${{.+}}), $pop
125 %p2 = getelementptr inbounds [5 x i32], [5 x i32]* %r, i32 0, i32 3
126 store i32 1, i32* %p2
127 call void @ext_func(i64* null);
128 ; CHECK: call ext_func
 ; Epilogue: restore the stack pointer by adding the 32 bytes back.
129 ; CHECK: i32.const $push[[L6:.+]]=, 0{{$}}
130 ; CHECK-NEXT: i32.const $push[[L5:.+]]=, 32{{$}}
131 ; CHECK-NEXT: i32.add $push[[L7:.+]]=, ${{.+}}, $pop[[L5]]
132 ; CHECK-NEXT: i32.store __stack_pointer($pop[[L6]]), $pop[[L7]]
133 ret void
134}
135
; Dynamically sized alloca (element count taken from %alloc) whose address is
; passed to an external function. The expected output loads __stack_pointer
; into a local, subtracts from it, writes the new value back to
; __stack_pointer before the call, and writes __stack_pointer again before
; returning.
136; CHECK-LABEL: dynamic_alloca:
137define void @dynamic_alloca(i32 %alloc) {
138 ; CHECK: i32.const $push[[L7:.+]]=, 0{{$}}
139 ; CHECK: i32.const $push[[L1:.+]]=, 0{{$}}
140 ; CHECK-NEXT: i32.load $push[[L13:.+]]=, __stack_pointer($pop[[L1]])
141 ; CHECK-NEXT: tee_local $push[[L12:.+]]=, [[SP:.+]], $pop[[L13]]{{$}}
142 ; Target independent codegen bumps the stack pointer.
143 ; CHECK: i32.sub
144 ; Check that SP is written back to memory after decrement
145 ; CHECK: i32.store __stack_pointer($pop{{.+}}),
146 %r = alloca i32, i32 %alloc
147 ; Target-independent codegen also calculates the store addr
148 ; CHECK: call ext_func_i32@FUNCTION
149 call void @ext_func_i32(i32* %r)
 ; Epilogue: __stack_pointer is written again before the function returns.
150 ; CHECK: i32.const $push[[L3:.+]]=, 0{{$}}
151 ; CHECK: i32.store __stack_pointer($pop[[L3]]), $pop{{.+}}
152 ret void
153}
154
; Dynamically sized alloca in a function that is NOT marked noredzone and makes
; no calls. The expected output loads __stack_pointer into a local, copies it
; to a second local (captured as FP), subtracts the dynamic size, and stores 0
; through the resulting address. Everything from the subtraction to the return
; is chained line by line, and none of those lines stores to __stack_pointer.
155; CHECK-LABEL: dynamic_alloca_redzone:
156define void @dynamic_alloca_redzone(i32 %alloc) {
157 ; CHECK: i32.const $push[[L8:.+]]=, 0{{$}}
 ; The load pops the constant pushed on the line above, so it refers to L8
 ; captured there instead of a value left over from a previous function.
158 ; CHECK-NEXT: i32.load $push[[L13:.+]]=, __stack_pointer($pop[[L8]])
159 ; CHECK-NEXT: tee_local $push[[L12:.+]]=, [[SP:.+]], $pop[[L13]]{{$}}
160 ; CHECK-NEXT: copy_local [[FP:.+]]=, $pop[[L12]]{{$}}
161 ; Target independent codegen bumps the stack pointer
162 ; CHECK: i32.sub
163 %r = alloca i32, i32 %alloc
164 ; CHECK-NEXT: tee_local       $push[[L8:.+]]=, $0=, $pop
165 ; CHECK-NEXT: copy_local      $drop=, $pop[[L8]]{{$}}
166 ; CHECK-NEXT: i32.const       $push[[L6:.+]]=, 0{{$}}
167 ; CHECK-NEXT: i32.store       0($0), $pop[[L6]]{{$}}
168 store i32 0, i32* %r
169 ; CHECK-NEXT: return
170 ret void
171}
172
; Mixes one static alloca with two dynamically sized allocas in a noredzone
; function. The assertions verify that the static slot is addressed through a
; frame-pointer local (captured as FP) that is never reassigned, that each
; dynamic alloca gets its own local, that earlier addresses stay valid after
; each later stack-pointer change, and that the epilogue restores
; __stack_pointer from FP + 16. All stores are volatile.
173; CHECK-LABEL: dynamic_static_alloca:
174define void @dynamic_static_alloca(i32 %alloc) noredzone {
175 ; Decrement SP in the prolog by the static amount and writeback to memory.
176 ; CHECK: i32.const $push[[L13:.+]]=, 0{{$}}
177 ; CHECK: i32.const $push[[L10:.+]]=, 0{{$}}
178 ; CHECK-NEXT: i32.load $push[[L11:.+]]=, __stack_pointer($pop[[L10]])
179 ; CHECK-NEXT: i32.const $push[[L12:.+]]=, 16
180 ; CHECK-NEXT: i32.sub $push[[L23:.+]]=, $pop[[L11]], $pop[[L12]]
181 ; CHECK-NEXT: tee_local $push[[L22:.+]]=, $[[SP:.+]]=, $pop[[L23]]
182 ; CHECK-NEXT: i32.store __stack_pointer($pop{{.+}}), $pop[[L22]]
183
184 ; Alloc and write to a static alloca
185 ; CHECK: copy_local $push[[L21:.+]]=, $[[SP]]
186 ; CHECK-NEXT: tee_local $push[[pushedFP:.+]]=, $[[FP:.+]]=, $pop[[L21]]
187 ; CHECK-NEXT: i32.const $push[[L0:.+]]=, 101
188 ; CHECK-NEXT: i32.store [[static_offset:.+]]($pop[[pushedFP]]), $pop[[L0]]
189 %static = alloca i32
190 store volatile i32 101, i32* %static
191
192 ; Decrement SP in the body by the dynamic amount.
193 ; CHECK: i32.sub
194 ; CHECK: tee_local $push{{.+}}=, $[[dynamic_local:.+]]=, $pop{{.+}}
195 ; CHECK: i32.store __stack_pointer
196 %dynamic = alloca i32, i32 %alloc
197
198 ; Ensure we don't modify the frame pointer after assigning it.
199 ; CHECK-NOT: $[[FP]]=
200
201 ; Ensure the static address doesn't change after modifying the stack pointer.
202 ; CHECK: i32.const $push[[L7:.+]]=, 102
203 ; CHECK-NEXT: i32.store [[static_offset]]($[[FP]]), $pop[[L7]]
204 ; CHECK-NEXT: i32.const $push[[L8:.+]]=, 103
205 ; CHECK-NEXT: i32.store 0($[[dynamic_local]]), $pop[[L8]]
206 store volatile i32 102, i32* %static
207 store volatile i32 103, i32* %dynamic
208
209 ; Decrement SP in the body by the dynamic amount.
210 ; CHECK: i32.sub
211 ; CHECK: tee_local $push{{.+}}=, $[[dynamic2_local:.+]]=, $pop{{.+}}
212 %dynamic.2 = alloca i32, i32 %alloc
213
214 ; CHECK-NOT: $[[FP]]=
215
216 ; Ensure neither the static nor dynamic address changes after the second
217 ; modification of the stack pointer.
218 ; CHECK: i32.const $push[[L9:.+]]=, 104
219 ; CHECK-NEXT: i32.store [[static_offset]]($[[FP]]), $pop[[L9]]
220 ; CHECK-NEXT: i32.const $push[[L10:.+]]=, 105
221 ; CHECK-NEXT: i32.store 0($[[dynamic_local]]), $pop[[L10]]
222 ; CHECK-NEXT: i32.const $push[[L11:.+]]=, 106
223 ; CHECK-NEXT: i32.store 0($[[dynamic2_local]]), $pop[[L11]]
224 store volatile i32 104, i32* %static
225 store volatile i32 105, i32* %dynamic
226 store volatile i32 106, i32* %dynamic.2
227
228 ; Writeback to memory.
229 ; CHECK: i32.const $push[[L17:.+]]=, 16
230 ; CHECK-NEXT: i32.add $push[[L18:.+]]=, $[[FP]], $pop[[L17]]
231 ; CHECK-NEXT: i32.store __stack_pointer($pop{{.+}}), $pop[[L18]]
232 ret void
233}
234
235declare i8* @llvm.stacksave()
236declare void @llvm.stackrestore(i8*)
237
; Exercises @llvm.stacksave and @llvm.stackrestore around a dynamically sized
; alloca. The value loaded from __stack_pointer is expected to be copied into
; a dedicated local (captured as STACK) that is not reassigned afterwards, and
; the restore is expected to store that same local back to __stack_pointer.
238; CHECK-LABEL: llvm_stack_builtins:
239define void @llvm_stack_builtins(i32 %alloc) noredzone {
240 ; CHECK: i32.load $push[[L11:.+]]=, __stack_pointer($pop{{.+}})
241 ; CHECK-NEXT: tee_local $push[[L10:.+]]=, ${{.+}}=, $pop[[L11]]
242 ; CHECK-NEXT: copy_local $[[STACK:.+]]=, $pop[[L10]]
243 %stack = call i8* @llvm.stacksave()
244
245 ; Ensure we don't reassign the stacksave local
246 ; CHECK-NOT: $[[STACK]]=
247 %dynamic = alloca i32, i32 %alloc
248
 ; The restore writes the saved value back to __stack_pointer.
249 ; CHECK: i32.store __stack_pointer($pop{{.+}}), $[[STACK]]
250 call void @llvm.stackrestore(i8* %stack)
251
252 ret void
253}
254
255; Not actually using the alloca'd variables exposed an issue with register
256; stackification, where copying the stack pointer into the frame pointer was
257; moved after the stack pointer was updated for the dynamic alloca.
; The assertions below therefore require the copy into the frame-pointer local
; (captured as FP) to directly follow the load of __stack_pointer, forbid any
; later reassignment of FP, and require the final store to __stack_pointer to
; use FP.
258; CHECK-LABEL: dynamic_alloca_nouse:
259define void @dynamic_alloca_nouse(i32 %alloc) noredzone {
260 ; CHECK: i32.load $push[[L11:.+]]=, __stack_pointer($pop{{.+}})
261 ; CHECK-NEXT: tee_local $push[[L10:.+]]=, ${{.+}}=, $pop[[L11]]
262 ; CHECK-NEXT: copy_local $[[FP:.+]]=, $pop[[L10]]
263 %dynamic = alloca i32, i32 %alloc
264
 ; FP must not be assigned again between the copy above and the epilogue store.
265 ; CHECK-NOT: $[[FP]]=,
266
267 ; CHECK: i32.store __stack_pointer($pop{{.+}}), $[[FP]]
268 ret void
269}
270
271; The use of the alloca in a phi causes a CopyToReg DAG node to be generated,
272; which has to have special handling because CopyToReg can't have a FI operand
; The expected output computes the alloca address explicitly (the decremented
; stack pointer plus 12), copies it into a local (captured as COPY), and the
; store in the loop body then goes through that local with offset 0.
273; CHECK-LABEL: copytoreg_fi:
274define void @copytoreg_fi(i1 %cond, i32* %b) {
275entry:
276 ; CHECK: i32.const $push[[L1:.+]]=, 16
277 ; CHECK-NEXT: i32.sub $push[[L3:.+]]=, {{.+}}, $pop[[L1]]
278 %addr = alloca i32
279 ; CHECK: i32.const $push[[OFF:.+]]=, 12
280 ; CHECK-NEXT: i32.add $push[[ADDR:.+]]=, $pop[[L3]], $pop[[OFF]]
281 ; CHECK-NEXT: copy_local [[COPY:.+]]=, $pop[[ADDR]]
282 br label %body
283body:
 ; %a is the alloca address on entry from %entry and %b on the back edge.
284 %a = phi i32* [%addr, %entry], [%b, %body]
285 store i32 1, i32* %a
286 ; CHECK: i32.store 0([[COPY]]),
287 br i1 %cond, label %body, label %exit
288exit:
289 ret void
290}
291
292declare void @use_i8_star(i8*)
293declare i8* @llvm.frameaddress(i32)
294
295; Test __builtin_frame_address(0).
; The expected output loads __stack_pointer, copies it into a local (captured
; as FP), passes that value to use_i8_star, and afterwards stores FP back to
; __stack_pointer. Every expected line directly follows the previous one.
296; CHECK-LABEL: frameaddress_0:
297; CHECK: i32.const $push[[L0:.+]]=, 0{{$}}
298; CHECK-NEXT: i32.load $push[[L3:.+]]=, __stack_pointer($pop[[L0]])
299; CHECK-NEXT: copy_local $push[[L4:.+]]=, $pop[[L3]]{{$}}
300; CHECK-NEXT: tee_local $push[[L2:.+]]=, $[[FP:.+]]=, $pop[[L4]]{{$}}
301; CHECK-NEXT: call use_i8_star@FUNCTION, $pop[[L2]]
302; CHECK-NEXT: i32.const $push[[L1:.+]]=, 0{{$}}
303; CHECK-NEXT: i32.store __stack_pointer($pop[[L1]]), $[[FP]]
304define void @frameaddress_0() {
305  %t = call i8* @llvm.frameaddress(i32 0)
306  call void @use_i8_star(i8* %t)
307  ret void
308}
309
310; Test __builtin_frame_address(1).
; The expected output passes the constant 0 to use_i8_star and returns. The
; first expected line must directly follow the function label, so no stack
; pointer code may precede it.
311
312; CHECK-LABEL: frameaddress_1:
313; CHECK-NEXT: i32.const $push0=, 0{{$}}
314; CHECK-NEXT: call use_i8_star@FUNCTION, $pop0{{$}}
315; CHECK-NEXT: return{{$}}
316define void @frameaddress_1() {
317  %t = call i8* @llvm.frameaddress(i32 1)
318  call void @use_i8_star(i8* %t)
319  ret void
320}
321
322; Test a stack address passed to an inline asm.
; The address of an i8 alloca is given to the asm as an "r" operand. The
; expected output mentions __stack_pointer before the asm block, and the asm
; body "# %0" is expected to print as a '%' followed by a decimal number.
323; CHECK-LABEL: inline_asm:
324; CHECK:       __stack_pointer
325; CHECK:       #APP
326; CHECK-NEXT:  # %{{[0-9]+}}{{$}}
327; CHECK-NEXT:  #NO_APP
328define void @inline_asm() {
329  %tmp = alloca i8
330  call void asm sideeffect "# %0", "r"(i8* %tmp)
331  ret void
332}
333
334; TODO: test over-aligned alloca
335