; RUN: llc -mtriple=thumbv7-apple-none-macho < %s | FileCheck %s
; RUN: llc -mtriple=thumbv6m-apple-none-macho -disable-fp-elim < %s | FileCheck %s --check-prefix=CHECK-T1
; RUN: llc -mtriple=thumbv7-apple-darwin-ios -disable-fp-elim < %s | FileCheck %s --check-prefix=CHECK-IOS
; RUN: llc -mtriple=thumbv7--linux-gnueabi -disable-fp-elim < %s | FileCheck %s --check-prefix=CHECK-LINUX

; Every function below is marked minsize and allocates a small local buffer.
; The directives verify whether the stack adjustment for that buffer is folded
; into the register lists of push/pop (or vpush/vpop) instead of being emitted
; as a separate "sub sp"/"add sp".

declare void @bar(i8*)

%bigVec = type [2 x double]

@var = global %bigVec zeroinitializer

; 16 bytes of locals: the expected push/pop lists carry four extra registers
; and no explicit sp arithmetic is allowed in between.
define void @check_simple() minsize {
; CHECK-LABEL: check_simple:
; CHECK: push {r3, r4, r5, r6, r7, lr}
; CHECK-NOT: sub sp, sp,
; ...
; CHECK-NOT: add sp, sp,
; CHECK: pop {r0, r1, r2, r3, r7, pc}

; CHECK-T1-LABEL: check_simple:
; CHECK-T1: push {r3, r4, r5, r6, r7, lr}
; CHECK-T1: add r7, sp, #16
; CHECK-T1-NOT: sub sp, sp,
; ...
; CHECK-T1-NOT: add sp, sp,
; CHECK-T1: pop {r0, r1, r2, r3, r7, pc}

  ; iOS always has a frame pointer and messing with the push affects
  ; how it's set in the prologue. Make sure we get that right.
  ; NOTE(review): the final pop list is assumed to match the other two runs
  ; (scratch registers r0-r3 instead of callee-saved ones); confirm against
  ; the llc output for the iOS triple.
; CHECK-IOS-LABEL: check_simple:
; CHECK-IOS: push {r3, r4, r5, r6, r7, lr}
; CHECK-IOS-NOT: sub sp,
; CHECK-IOS: add r7, sp, #16
; CHECK-IOS-NOT: sub sp,
; ...
; CHECK-IOS-NOT: add sp,
; CHECK-IOS: pop {r0, r1, r2, r3, r7, pc}

  %var = alloca i8, i32 16
  call void @bar(i8* %var)
  ret void
}

; 64 bytes of locals: here the directives expect an explicit sub/add of sp
; around the body, with only r7 and lr in the push/pop lists.
define void @check_simple_too_big() minsize {
; CHECK-LABEL: check_simple_too_big:
; CHECK: push {r7, lr}
; CHECK: sub sp,
; ...
; CHECK: add sp,
; CHECK: pop {r7, pc}
  %var = alloca i8, i32 64
  call void @bar(i8* %var)
  ret void
}

; The inline asm clobbers d8 and d9, so they have to be saved. On the default
; run the 16 bytes of locals are expected to show up as two extra D registers
; (d6, d7) in the vpush/vpop lists.
define void @check_vfp_fold() minsize {
; CHECK-LABEL: check_vfp_fold:
; CHECK: push {r[[GLOBREG:[0-9]+]], lr}
; CHECK: vpush {d6, d7, d8, d9}
; CHECK-NOT: sub sp,
; ...
; CHECK-NOT: add sp,
; CHECK: vpop {d6, d7, d8, d9}
; CHECK: pop {r[[GLOBREG]], pc}

  ; iOS uses aligned NEON stores here, which is convenient since we
  ; want to make sure that works too.
; CHECK-IOS-LABEL: check_vfp_fold:
; CHECK-IOS: push {r4, r7, lr}
; CHECK-IOS: sub.w r4, sp, #16
; CHECK-IOS: bfc r4, #0, #4
; CHECK-IOS: mov sp, r4
; CHECK-IOS: vst1.64 {d8, d9}, [r4:128]
; CHECK-IOS: sub sp, #16
; ...
; CHECK-IOS: add r4, sp, #16
; CHECK-IOS: vld1.64 {d8, d9}, [r4:128]
; CHECK-IOS: mov sp, r4
; CHECK-IOS: pop {r4, r7, pc}

  %var = alloca i8, i32 16

  call void asm "", "r,~{d8},~{d9}"(i8* %var)
  call void @bar(i8* %var)

  ret void
}

; This function should use just enough space that the "add sp, sp, ..." could be
; folded in except that doing so would clobber the value being returned.
define i64 @check_no_return_clobber() minsize {
; CHECK-LABEL: check_no_return_clobber:
; CHECK: push {r1, r2, r3, r4, r5, r6, r7, lr}
; CHECK-NOT: sub sp,
; ...
; CHECK: add sp, #24
; CHECK: pop {r7, pc}

  ; Just to keep iOS FileCheck within previous function:
; CHECK-IOS-LABEL: check_no_return_clobber:

  %var = alloca i8, i32 20
  call void @bar(i8* %var)
  ret i64 0
}

; VFP variant of the case above: the prologue is expected to fold the 64 bytes
; of locals into the vpush list, while the epilogue keeps an explicit
; "add sp, #64" and only restores d8/d9 (presumably so that the double being
; returned is not overwritten by a widened vpop).
define arm_aapcs_vfpcc double @check_vfp_no_return_clobber() minsize {
; CHECK-LABEL: check_vfp_no_return_clobber:
; CHECK: push {r[[GLOBREG:[0-9]+]], lr}
; CHECK: vpush {d0, d1, d2, d3, d4, d5, d6, d7, d8, d9}
; CHECK-NOT: sub sp,
; ...
; CHECK: add sp, #64
; CHECK: vpop {d8, d9}
; CHECK: pop {r[[GLOBREG]], pc}

  %var = alloca i8, i32 64

  %tmp = load %bigVec, %bigVec* @var
  call void @bar(i8* %var)
  store %bigVec %tmp, %bigVec* @var

  ret double 1.0
}

@dbl = global double 0.0

; PR18136: there was a bug determining where the first eligible pop in a
; basic-block was when the entire block was epilogue code.
define void @test_fold_point(i1 %tst) minsize {
; CHECK-LABEL: test_fold_point:

  ; Important to check for beginning of basic block, because if it gets
  ; if-converted the test is probably no longer checking what it should.
; CHECK: {{LBB[0-9]+_2}}:
; CHECK-NEXT: vpop {d7, d8}
; CHECK-NEXT: pop {r4, pc}

  ; With a guaranteed frame-pointer, we want to make sure that its offset in the
  ; push block is correct, even if a few registers have been tacked onto a later
  ; vpush (PR18160).
; CHECK-IOS-LABEL: test_fold_point:
; CHECK-IOS: push {r4, r7, lr}
; CHECK-IOS-NEXT: add r7, sp, #4
; CHECK-IOS-NEXT: vpush {d7, d8}

  ; We want some memory so there's a stack adjustment to fold...
  %var = alloca i8, i32 8

  ; We want a long-lived floating register so that a callee-saved dN is used and
  ; there's both a vpop and a pop.
  %live_val = load double, double* @dbl
  br i1 %tst, label %true, label %end
true:
  call void @bar(i8* %var)
  store double %live_val, double* @dbl
  br label %end
end:
  ; We want the epilogue to be the only thing in a basic block so that we hit
  ; the correct edge-case (first inst in block is correct one to adjust).
  ret void
}

; Variadic function: both runs below expect a separate 16-byte sp adjustment
; outside the push/pop pair, with the 8 bytes of locals appearing as extra
; registers in the push/pop lists, and a return through bx rather than a pop
; into pc.
define void @test_varsize(...) minsize {
; CHECK-T1-LABEL: test_varsize:
; CHECK-T1: sub sp, #16
; CHECK-T1: push {r5, r6, r7, lr}
; ...
; CHECK-T1: pop {r2, r3, r7}
; CHECK-T1: pop {[[POP_REG:r[0-3]]]}
; CHECK-T1: add sp, #16
; CHECK-T1: bx [[POP_REG]]

; CHECK-LABEL: test_varsize:
; CHECK: sub sp, #16
; CHECK: push {r5, r6, r7, lr}
; ...
; CHECK: pop.w {r2, r3, r7, lr}
; CHECK: add sp, #16
; CHECK: bx lr

  %var = alloca i8, i32 8
  call void @llvm.va_start(i8* %var)
  call void @bar(i8* %var)
  ret void
}

%"MyClass" = type { i8*, i32, i32, float, float, float, [2 x i8], i32, i32* }

declare float @foo()

declare void @bar3()

declare %"MyClass"* @bar2(%"MyClass"* returned, i16*, i32, float, float, i32, i32, i1 zeroext, i1 zeroext, i32)

; Linux-only directives: the prologue is expected to fold the stack space into
; the vpush list (d0-d7 in addition to d8), while the epilogue keeps an explicit
; "add sp" and only restores d8. The float result of @foo is live across the
; conditional call to @bar3 and is the value returned.
define fastcc float @check_vfp_no_return_clobber2(i16* %r, i16* %chars, i32 %length, i1 zeroext %flag) minsize {
entry:
; CHECK-LINUX-LABEL: check_vfp_no_return_clobber2:
; CHECK-LINUX: vpush {d0, d1, d2, d3, d4, d5, d6, d7, d8}
; CHECK-LINUX-NOT: sub sp,
; ...
; CHECK-LINUX: add sp
; CHECK-LINUX: vpop {d8}
  %run = alloca %"MyClass", align 4
  %call = call %"MyClass"* @bar2(%"MyClass"* %run, i16* %chars, i32 %length, float 0.000000e+00, float 0.000000e+00, i32 1, i32 1, i1 zeroext false, i1 zeroext true, i32 3)
  %call1 = call float @foo()
  %cmp = icmp eq %"MyClass"* %run, null
  br i1 %cmp, label %exit, label %if.then

if.then:                                          ; preds = %entry
  call void @bar3()
  br label %exit

exit:                                             ; preds = %if.then, %entry
  ret float %call1
}

declare void @llvm.va_start(i8*) nounwind