; RUN: llc < %s -asm-verbose=false -disable-wasm-fallthrough-return-opt | FileCheck %s

; Exercises how allocas are lowered for the wasm32 target in this file: the
; expected output reads and writes the __stack_pointer symbol, keeps the
; adjusted value in a local, and addresses stack objects relative to it.
;
; Every function below binds the FileCheck variables it uses, so no pattern
; depends on a value captured while matching an earlier function.

target datalayout = "e-m:e-p:32:32-i64:64-n32:64-S128"
target triple = "wasm32-unknown-unknown"

declare void @ext_func(i64* %ptr)
declare void @ext_func_i32(i32* %ptr)

; A single i32 alloca in a noredzone function: the prolog subtracts 16 from
; the loaded stack pointer and stores it back; the epilog adds 16 and stores
; it back again.
; CHECK-LABEL: alloca32:
; Check that there is an extra local for the stack pointer.
; CHECK: .local i32{{$}}
define void @alloca32() noredzone {
 ; CHECK: i32.const $push[[L4:.+]]=, 0{{$}}
 ; CHECK: i32.const $push[[L1:.+]]=, 0{{$}}
 ; CHECK-NEXT: i32.load $push[[L2:.+]]=, __stack_pointer($pop[[L1]])
 ; CHECK-NEXT: i32.const $push[[L3:.+]]=, 16
 ; CHECK-NEXT: i32.sub $push[[L9:.+]]=, $pop[[L2]], $pop[[L3]]
 ; CHECK-NEXT: tee_local $push[[L8:.+]]=, $[[SP:.+]]=, $pop[[L9]]{{$}}
 ; CHECK-NEXT: i32.store __stack_pointer($pop[[L4]]), $pop[[L8]]{{$}}
 %retval = alloca i32
 ; CHECK: i32.const $push[[L0:.+]]=, 0
 ; CHECK: i32.store 12($[[SP]]), $pop[[L0]]
 store i32 0, i32* %retval
 ; CHECK: i32.const $push[[L6:.+]]=, 0
 ; CHECK-NEXT: i32.const $push[[L5:.+]]=, 16
 ; CHECK-NEXT: i32.add $push[[L7:.+]]=, $[[SP]], $pop[[L5]]
 ; CHECK-NEXT: i32.store __stack_pointer($pop[[L6]]), $pop[[L7]]
 ret void
}

; An i32 and a double alloca without the noredzone attribute: the expected
; sequence computes SP-16 and stores through it, but the chain of consecutive
; matches up to the return contains no store to __stack_pointer.
; CHECK-LABEL: alloca3264:
; CHECK: .local i32{{$}}
define void @alloca3264() {
 ; CHECK: i32.const $push[[L2:.+]]=, 0{{$}}
 ; CHECK-NEXT: i32.load $push[[L3:.+]]=, __stack_pointer($pop[[L2]])
 ; CHECK-NEXT: i32.const $push[[L4:.+]]=, 16
 ; CHECK-NEXT: i32.sub $push[[L6:.+]]=, $pop[[L3]], $pop[[L4]]
 ; CHECK-NEXT: tee_local $push[[L5:.+]]=, $[[SP:.+]]=, $pop[[L6]]
 %r1 = alloca i32
 %r2 = alloca double
 ; CHECK-NEXT: i32.const $push[[L0:.+]]=, 0
 ; CHECK-NEXT: i32.store 12($pop[[L5]]), $pop[[L0]]
 store i32 0, i32* %r1
 ; CHECK-NEXT: i64.const $push[[L1:.+]]=, 0
 ; CHECK-NEXT: i64.store 0($[[SP]]), $pop[[L1]]
 store double 0.0, double* %r2
 ; CHECK-NEXT: return
 ret void
}

; A [33 x i32] array alloca: a 144-byte frame is expected, with stores to
; elements 0 and 3 of the array.
; CHECK-LABEL: allocarray:
; CHECK: .local i32{{$}}
define void @allocarray() {
 ; CHECK: i32.const $push[[L6:.+]]=, 0{{$}}
 ; CHECK: i32.const $push[[L3:.+]]=, 0{{$}}
 ; CHECK-NEXT: i32.load $push[[L4:.+]]=, __stack_pointer($pop[[L3]])
 ; CHECK-NEXT: i32.const $push[[L5:.+]]=, 144{{$}}
 ; CHECK-NEXT: i32.sub $push[[L12:.+]]=, $pop[[L4]], $pop[[L5]]
 ; SP is bound here so the uses below refer to this function's own local.
 ; CHECK-NEXT: tee_local $push[[L11:.+]]=, $[[SP:.+]]=, $pop[[L12]]
 ; CHECK-NEXT: i32.store __stack_pointer($pop[[L6]]), $pop[[L11]]
 %r = alloca [33 x i32]

 ; CHECK: i32.const $push{{.+}}=, 24
 ; CHECK-NEXT: i32.add $push[[L3:.+]]=, $[[SP]], $pop{{.+}}
 ; CHECK-NEXT: i32.const $push[[L1:.+]]=, 1{{$}}
 ; CHECK-NEXT: i32.store 0($pop[[L3]]), $pop[[L1]]{{$}}
 ; CHECK-NEXT: i32.const $push[[L10:.+]]=, 1{{$}}
 ; CHECK-NEXT: i32.store 12(${{.+}}), $pop[[L10]]{{$}}
 %p = getelementptr [33 x i32], [33 x i32]* %r, i32 0, i32 0
 store i32 1, i32* %p
 %p2 = getelementptr [33 x i32], [33 x i32]* %r, i32 0, i32 3
 store i32 1, i32* %p2

 ; CHECK: i32.const $push[[L9:.+]]=, 0{{$}}
 ; CHECK-NEXT: i32.const $push[[L7:.+]]=, 144
 ; CHECK-NEXT: i32.add $push[[L8:.+]]=, $[[SP]], $pop[[L7]]
 ; CHECK-NEXT: i32.store __stack_pointer($pop[[L9]]), $pop[[L8]]
 ret void
}

; Alloca addresses used as plain values: passed as call arguments and stored
; through the incoming pointer argument.
; CHECK-LABEL: non_mem_use:
define void @non_mem_use(i8** %addr) {
 ; CHECK: i32.const $push[[L2:.+]]=, 48
 ; CHECK-NEXT: i32.sub $push[[L12:.+]]=, {{.+}}, $pop[[L2]]
 ; CHECK-NEXT: tee_local $push[[L11:.+]]=, $[[SP:.+]]=, $pop[[L12]]
 ; CHECK-NEXT: i32.store {{.+}}, $pop[[L11]]
 %buf = alloca [27 x i8], align 16
 %r = alloca i64
 %r2 = alloca i64
 ; %r is at SP+8
 ; CHECK: i32.const $push[[OFF:.+]]=, 8
 ; CHECK-NEXT: i32.add $push[[ARG1:.+]]=, $[[SP]], $pop[[OFF]]
 ; CHECK-NEXT: call ext_func@FUNCTION, $pop[[ARG1]]
 call void @ext_func(i64* %r)
 ; %r2 is at SP+0, no add needed
 ; CHECK-NEXT: call ext_func@FUNCTION, $[[SP]]
 call void @ext_func(i64* %r2)
 ; Use as a value, but in a store
 ; %buf is at SP+16
 ; CHECK: i32.const $push[[OFF:.+]]=, 16
 ; CHECK-NEXT: i32.add $push[[VAL:.+]]=, $[[SP]], $pop[[OFF]]
 ; CHECK-NEXT: i32.store 0($0), $pop[[VAL]]
 %gep = getelementptr inbounds [27 x i8], [27 x i8]* %buf, i32 0, i32 0
 store i8* %gep, i8** %addr
 ret void
}

; Same shape as the array test above but with inbounds GEPs on a [5 x i32]
; array and a call before the epilog.
; CHECK-LABEL: allocarray_inbounds:
; CHECK: .local i32{{$}}
define void @allocarray_inbounds() {
 ; CHECK: i32.const $push[[L5:.+]]=, 0{{$}}
 ; CHECK: i32.const $push[[L2:.+]]=, 0{{$}}
 ; CHECK-NEXT: i32.load $push[[L3:.+]]=, __stack_pointer($pop[[L2]])
 ; CHECK-NEXT: i32.const $push[[L4:.+]]=, 32{{$}}
 ; CHECK-NEXT: i32.sub $push[[L11:.+]]=, $pop[[L3]], $pop[[L4]]
 ; CHECK-NEXT: tee_local $push[[L10:.+]]=, $[[SP:.+]]=, $pop[[L11]]
 ; CHECK-NEXT: i32.store __stack_pointer($pop[[L5]]), $pop[[L10]]{{$}}
 %r = alloca [5 x i32]
 ; CHECK: i32.const $push[[L3:.+]]=, 1
 ; CHECK-DAG: i32.store 24(${{.+}}), $pop[[L3]]
 %p = getelementptr inbounds [5 x i32], [5 x i32]* %r, i32 0, i32 0
 store i32 1, i32* %p
 ; This store should have both the GEP and the FI folded into it.
 ; CHECK-DAG: i32.store 12(${{.+}}), $pop
 %p2 = getelementptr inbounds [5 x i32], [5 x i32]* %r, i32 0, i32 3
 store i32 1, i32* %p2
 call void @ext_func(i64* null)
 ; CHECK: call ext_func
 ; CHECK: i32.const $push[[L6:.+]]=, 0{{$}}
 ; CHECK-NEXT: i32.const $push[[L5:.+]]=, 32{{$}}
 ; CHECK-NEXT: i32.add $push[[L7:.+]]=, ${{.+}}, $pop[[L5]]
 ; CHECK-NEXT: i32.store __stack_pointer($pop[[L6]]), $pop[[L7]]
 ret void
}

; A dynamically sized alloca whose address is passed to a call.
; CHECK-LABEL: dynamic_alloca:
define void @dynamic_alloca(i32 %alloc) {
 ; CHECK: i32.const $push[[L7:.+]]=, 0{{$}}
 ; CHECK: i32.const $push[[L1:.+]]=, 0{{$}}
 ; CHECK-NEXT: i32.load $push[[L13:.+]]=, __stack_pointer($pop[[L1]])
 ; CHECK-NEXT: tee_local $push[[L12:.+]]=, [[SP:.+]], $pop[[L13]]{{$}}
 ; Target independent codegen bumps the stack pointer.
 ; CHECK: i32.sub
 ; Check that SP is written back to memory after decrement
 ; CHECK: i32.store __stack_pointer($pop{{.+}}),
 %r = alloca i32, i32 %alloc
 ; Target-independent codegen also calculates the store addr
 ; CHECK: call ext_func_i32@FUNCTION
 call void @ext_func_i32(i32* %r)
 ; CHECK: i32.const $push[[L3:.+]]=, 0{{$}}
 ; CHECK: i32.store __stack_pointer($pop[[L3]]), $pop{{.+}}
 ret void
}

; A dynamically sized alloca that is only stored to; the function makes no
; calls and has no noredzone attribute.
; CHECK-LABEL: dynamic_alloca_redzone:
define void @dynamic_alloca_redzone(i32 %alloc) {
 ; The constant pushed here is the address operand popped by the load on the
 ; next line, so both lines share one variable.
 ; CHECK: i32.const $push[[L1:.+]]=, 0{{$}}
 ; CHECK-NEXT: i32.load $push[[L13:.+]]=, __stack_pointer($pop[[L1]])
 ; CHECK-NEXT: tee_local $push[[L12:.+]]=, [[SP:.+]], $pop[[L13]]{{$}}
 ; CHECK-NEXT: copy_local [[FP:.+]]=, $pop[[L12]]{{$}}
 ; Target independent codegen bumps the stack pointer
 ; CHECK: i32.sub
 %r = alloca i32, i32 %alloc
 ; CHECK-NEXT: tee_local $push[[L8:.+]]=, $0=, $pop
 ; CHECK-NEXT: copy_local $drop=, $pop[[L8]]{{$}}
 ; CHECK-NEXT: i32.const $push[[L6:.+]]=, 0{{$}}
 ; CHECK-NEXT: i32.store 0($0), $pop[[L6]]{{$}}
 store i32 0, i32* %r
 ; CHECK-NEXT: return
 ret void
}

; One static alloca followed by two dynamic allocas; the addresses of the
; earlier objects must stay valid after each later stack adjustment.
; CHECK-LABEL: dynamic_static_alloca:
define void @dynamic_static_alloca(i32 %alloc) noredzone {
 ; Decrement SP in the prolog by the static amount and writeback to memory.
 ; CHECK: i32.const $push[[L13:.+]]=, 0{{$}}
 ; CHECK: i32.const $push[[L10:.+]]=, 0{{$}}
 ; CHECK-NEXT: i32.load $push[[L11:.+]]=, __stack_pointer($pop[[L10]])
 ; CHECK-NEXT: i32.const $push[[L12:.+]]=, 16
 ; CHECK-NEXT: i32.sub $push[[L23:.+]]=, $pop[[L11]], $pop[[L12]]
 ; CHECK-NEXT: tee_local $push[[L22:.+]]=, $[[SP:.+]]=, $pop[[L23]]
 ; CHECK-NEXT: i32.store __stack_pointer($pop{{.+}}), $pop[[L22]]

 ; Alloc and write to a static alloca
 ; CHECK: copy_local $push[[L21:.+]]=, $[[SP]]
 ; CHECK-NEXT: tee_local $push[[pushedFP:.+]]=, $[[FP:.+]]=, $pop[[L21]]
 ; CHECK-NEXT: i32.const $push[[L0:.+]]=, 101
 ; CHECK-NEXT: i32.store [[static_offset:.+]]($pop[[pushedFP]]), $pop[[L0]]
 %static = alloca i32
 store volatile i32 101, i32* %static

 ; Decrement SP in the body by the dynamic amount.
 ; CHECK: i32.sub
 ; CHECK: tee_local $push{{.+}}=, $[[dynamic_local:.+]]=, $pop{{.+}}
 ; CHECK: i32.store __stack_pointer
 %dynamic = alloca i32, i32 %alloc

 ; Ensure we don't modify the frame pointer after assigning it.
 ; CHECK-NOT: $[[FP]]=

 ; Ensure the static address doesn't change after modifying the stack pointer.
 ; CHECK: i32.const $push[[L7:.+]]=, 102
 ; CHECK-NEXT: i32.store [[static_offset]]($[[FP]]), $pop[[L7]]
 ; CHECK-NEXT: i32.const $push[[L8:.+]]=, 103
 ; CHECK-NEXT: i32.store 0($[[dynamic_local]]), $pop[[L8]]
 store volatile i32 102, i32* %static
 store volatile i32 103, i32* %dynamic

 ; Decrement SP in the body by the dynamic amount.
 ; CHECK: i32.sub
 ; CHECK: tee_local $push{{.+}}=, $[[dynamic2_local:.+]]=, $pop{{.+}}
 %dynamic.2 = alloca i32, i32 %alloc

 ; CHECK-NOT: $[[FP]]=

 ; Ensure neither the static nor dynamic address changes after the second
 ; modification of the stack pointer.
 ; CHECK: i32.const $push[[L9:.+]]=, 104
 ; CHECK-NEXT: i32.store [[static_offset]]($[[FP]]), $pop[[L9]]
 ; CHECK-NEXT: i32.const $push[[L10:.+]]=, 105
 ; CHECK-NEXT: i32.store 0($[[dynamic_local]]), $pop[[L10]]
 ; CHECK-NEXT: i32.const $push[[L11:.+]]=, 106
 ; CHECK-NEXT: i32.store 0($[[dynamic2_local]]), $pop[[L11]]
 store volatile i32 104, i32* %static
 store volatile i32 105, i32* %dynamic
 store volatile i32 106, i32* %dynamic.2

 ; Writeback to memory.
 ; CHECK: i32.const $push[[L17:.+]]=, 16
 ; CHECK-NEXT: i32.add $push[[L18:.+]]=, $[[FP]], $pop[[L17]]
 ; CHECK-NEXT: i32.store __stack_pointer($pop{{.+}}), $pop[[L18]]
 ret void
}

declare i8* @llvm.stacksave()
declare void @llvm.stackrestore(i8*)

; llvm.stacksave / llvm.stackrestore around a dynamic alloca: the saved value
; is the one written back to __stack_pointer.
; CHECK-LABEL: llvm_stack_builtins:
define void @llvm_stack_builtins(i32 %alloc) noredzone {
 ; CHECK: i32.load $push[[L11:.+]]=, __stack_pointer($pop{{.+}})
 ; CHECK-NEXT: tee_local $push[[L10:.+]]=, ${{.+}}=, $pop[[L11]]
 ; CHECK-NEXT: copy_local $[[STACK:.+]]=, $pop[[L10]]
 %stack = call i8* @llvm.stacksave()

 ; Ensure we don't reassign the stacksave local
 ; CHECK-NOT: $[[STACK]]=
 %dynamic = alloca i32, i32 %alloc

 ; CHECK: i32.store __stack_pointer($pop{{.+}}), $[[STACK]]
 call void @llvm.stackrestore(i8* %stack)

 ret void
}

; Not actually using the alloca'd variables exposed an issue with register
; stackification, where copying the stack pointer into the frame pointer was
; moved after the stack pointer was updated for the dynamic alloca.
; CHECK-LABEL: dynamic_alloca_nouse:
define void @dynamic_alloca_nouse(i32 %alloc) noredzone {
 ; CHECK: i32.load $push[[L11:.+]]=, __stack_pointer($pop{{.+}})
 ; CHECK-NEXT: tee_local $push[[L10:.+]]=, ${{.+}}=, $pop[[L11]]
 ; CHECK-NEXT: copy_local $[[FP:.+]]=, $pop[[L10]]
 %dynamic = alloca i32, i32 %alloc

 ; CHECK-NOT: $[[FP]]=,

 ; CHECK: i32.store __stack_pointer($pop{{.+}}), $[[FP]]
 ret void
}

; The use of the alloca in a phi causes a CopyToReg DAG node to be generated,
; which has to have special handling because CopyToReg can't have a FI operand
; CHECK-LABEL: copytoreg_fi:
define void @copytoreg_fi(i1 %cond, i32* %b) {
entry:
 ; CHECK: i32.const $push[[L1:.+]]=, 16
 ; CHECK-NEXT: i32.sub $push[[L3:.+]]=, {{.+}}, $pop[[L1]]
 %addr = alloca i32
 ; CHECK: i32.const $push[[OFF:.+]]=, 12
 ; CHECK-NEXT: i32.add $push[[ADDR:.+]]=, $pop[[L3]], $pop[[OFF]]
 ; CHECK-NEXT: copy_local [[COPY:.+]]=, $pop[[ADDR]]
 br label %body
body:
 %a = phi i32* [%addr, %entry], [%b, %body]
 store i32 1, i32* %a
 ; CHECK: i32.store 0([[COPY]]),
 br i1 %cond, label %body, label %exit
exit:
 ret void
}

declare void @use_i8_star(i8*)
declare i8* @llvm.frameaddress(i32)

; Test __builtin_frame_address(0).
; CHECK-LABEL: frameaddress_0:
; CHECK: i32.const $push[[L0:.+]]=, 0{{$}}
; CHECK-NEXT: i32.load $push[[L3:.+]]=, __stack_pointer($pop[[L0]])
; CHECK-NEXT: copy_local $push[[L4:.+]]=, $pop[[L3]]{{$}}
; CHECK-NEXT: tee_local $push[[L2:.+]]=, $[[FP:.+]]=, $pop[[L4]]{{$}}
; CHECK-NEXT: call use_i8_star@FUNCTION, $pop[[L2]]
; CHECK-NEXT: i32.const $push[[L1:.+]]=, 0{{$}}
; CHECK-NEXT: i32.store __stack_pointer($pop[[L1]]), $[[FP]]
define void @frameaddress_0() {
 %t = call i8* @llvm.frameaddress(i32 0)
 call void @use_i8_star(i8* %t)
 ret void
}

; Test __builtin_frame_address(1).

; CHECK-LABEL: frameaddress_1:
; CHECK-NEXT: i32.const $push0=, 0{{$}}
; CHECK-NEXT: call use_i8_star@FUNCTION, $pop0{{$}}
; CHECK-NEXT: return{{$}}
define void @frameaddress_1() {
 %t = call i8* @llvm.frameaddress(i32 1)
 call void @use_i8_star(i8* %t)
 ret void
}

; Test a stack address passed to an inline asm.
; CHECK-LABEL: inline_asm:
; CHECK: __stack_pointer
; CHECK: #APP
; CHECK-NEXT: # %{{[0-9]+}}{{$}}
; CHECK-NEXT: #NO_APP
define void @inline_asm() {
 %tmp = alloca i8
 call void asm sideeffect "# %0", "r"(i8* %tmp)
 ret void
}

; TODO: test over-aligned alloca