1; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2; RUN: opt -S -memcpyopt < %s -enable-memcpyopt-memoryssa=0 | FileCheck %s --check-prefixes=CHECK,NO_MSSA
3; RUN: opt -S -memcpyopt < %s -enable-memcpyopt-memoryssa=1 -verify-memoryssa | FileCheck %s --check-prefixes=CHECK,MSSA
4
5; PR40118: BasicAA didn't realize that stackrestore ends the lifetime of
6; unescaped dynamic allocas, such as those that might come from inalloca.
7
; Module-level target configuration. The datalayout string declares 32-bit
; pointers (p:32:32) and the triple names an i686 Windows/MSVC target.
8source_filename = "t.cpp"
9target datalayout = "e-m:x-p:32:32-i64:64-f80:32-n8:16:32-a:0:32-S32"
10target triple = "i686-unknown-windows-msvc19.14.26433"
11
; 9-byte constant that both test functions copy into their dynamic alloca with
; the first memcpy.
12@str = internal constant [9 x i8] c"abcdxxxxx"
13
14
15; Test that we can propagate memcpy through an unescaped dynamic alloca across
16; a call to @external.
17
; Positive case: no stackrestore sits between the two copies. The sequence is
;   @str -> %p (9 bytes), store to %p[9], %p -> %tmp (10 bytes),
;   call @external(), %tmp -> %heap (9 bytes).
; The autogenerated assertions below expect the final copy into the malloc'd
; buffer to read from %p instead of %tmp, i.e. the copy is forwarded across
; the call to @external.
18define i32 @test_norestore(i32 %n) {
19; CHECK-LABEL: @test_norestore(
20; CHECK-NEXT:    [[TMPMEM:%.*]] = alloca [10 x i8], align 4
21; CHECK-NEXT:    [[TMP:%.*]] = getelementptr inbounds [10 x i8], [10 x i8]* [[TMPMEM]], i32 0, i32 0
22; CHECK-NEXT:    [[P:%.*]] = alloca i8, i32 [[N:%.*]], align 4
23; CHECK-NEXT:    call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[P]], i8* align 1 getelementptr inbounds ([9 x i8], [9 x i8]* @str, i32 0, i32 0), i32 9, i1 false)
24; CHECK-NEXT:    [[P10:%.*]] = getelementptr inbounds i8, i8* [[P]], i32 9
25; CHECK-NEXT:    store i8 0, i8* [[P10]], align 1
26; CHECK-NEXT:    call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[TMP]], i8* [[P]], i32 10, i1 false)
27; CHECK-NEXT:    call void @external()
28; CHECK-NEXT:    [[HEAP:%.*]] = call i8* @malloc(i32 9)
29; CHECK-NEXT:    call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[HEAP]], i8* [[P]], i32 9, i1 false)
30; CHECK-NEXT:    call void @useit(i8* [[HEAP]])
31; CHECK-NEXT:    ret i32 0
32;
  ; Fixed-size 10-byte temporary; %tmp is an i8* to its first byte.
33  %tmpmem = alloca [10 x i8], align 4
34  %tmp = getelementptr inbounds [10 x i8], [10 x i8]* %tmpmem, i32 0, i32 0
35
36  ; Make a dynamic alloca, initialize it.
  ; NOTE(review): the size is the runtime value %n, yet offsets 0..9 are written
  ; below; the test presumably assumes %n >= 10 - confirm if this matters.
37  %p = alloca i8, i32 %n, align 4
38  call void @llvm.memcpy.p0i8.p0i8.i32(i8* %p, i8* align 1 getelementptr inbounds ([9 x i8], [9 x i8]* @str, i32 0, i32 0), i32 9, i1 false)
39
40  ; This extra byte exists to prevent memcpyopt from propagating @str.
41  %p10 = getelementptr inbounds i8, i8* %p, i32 9
42  store i8 0, i8* %p10
43
  ; Copy all 10 bytes of %p into %tmp, then make an opaque call. %p is never
  ; passed to @external (the call takes no arguments).
44  call void @llvm.memcpy.p0i8.p0i8.i32(i8* %tmp, i8* %p, i32 10, i1 false)
45  call void @external()
  ; Copy the first 9 bytes of %tmp to fresh heap memory. This is the copy whose
  ; source operand is expected to be rewritten to %p in the output.
46  %heap = call i8* @malloc(i32 9)
47  call void @llvm.memcpy.p0i8.p0i8.i32(i8* %heap, i8* %tmp, i32 9, i1 false)
48  call void @useit(i8* %heap)
49  ret i32 0
50}
51
52; Do not propagate memcpy from %p across the stackrestore.
53
; Negative case: same copy chain as @test_norestore, but the intermediate
; buffer is an inalloca alloca created after @llvm.stacksave, and
; @llvm.stackrestore is called between the two copies. The autogenerated
; assertions below expect the final copy into the malloc'd buffer to keep
; reading from %tmp, i.e. nothing is forwarded from %p across the restore.
54define i32 @test_stackrestore() {
55; CHECK-LABEL: @test_stackrestore(
56; CHECK-NEXT:    [[TMPMEM:%.*]] = alloca [10 x i8], align 4
57; CHECK-NEXT:    [[TMP:%.*]] = getelementptr inbounds [10 x i8], [10 x i8]* [[TMPMEM]], i32 0, i32 0
58; CHECK-NEXT:    [[INALLOCA_SAVE:%.*]] = tail call i8* @llvm.stacksave()
59; CHECK-NEXT:    [[ARGMEM:%.*]] = alloca inalloca [10 x i8], align 4
60; CHECK-NEXT:    [[P:%.*]] = getelementptr inbounds [10 x i8], [10 x i8]* [[ARGMEM]], i32 0, i32 0
61; CHECK-NEXT:    call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[P]], i8* align 1 getelementptr inbounds ([9 x i8], [9 x i8]* @str, i32 0, i32 0), i32 9, i1 false)
62; CHECK-NEXT:    [[P10:%.*]] = getelementptr inbounds [10 x i8], [10 x i8]* [[ARGMEM]], i32 0, i32 9
63; CHECK-NEXT:    store i8 0, i8* [[P10]], align 1
64; CHECK-NEXT:    call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[TMP]], i8* [[P]], i32 10, i1 false)
65; CHECK-NEXT:    call void @llvm.stackrestore(i8* [[INALLOCA_SAVE]])
66; CHECK-NEXT:    [[HEAP:%.*]] = call i8* @malloc(i32 9)
67; CHECK-NEXT:    call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[HEAP]], i8* [[TMP]], i32 9, i1 false)
68; CHECK-NEXT:    call void @useit(i8* [[HEAP]])
69; CHECK-NEXT:    ret i32 0
70;
  ; %tmpmem is allocated before the stacksave; %argmem is allocated after it.
71  %tmpmem = alloca [10 x i8], align 4
72  %tmp = getelementptr inbounds [10 x i8], [10 x i8]* %tmpmem, i32 0, i32 0
73  %inalloca.save = tail call i8* @llvm.stacksave()
74  %argmem = alloca inalloca [10 x i8], align 4
75  %p = getelementptr inbounds [10 x i8], [10 x i8]* %argmem, i32 0, i32 0
76  call void @llvm.memcpy.p0i8.p0i8.i32(i8* %p, i8* align 1 getelementptr inbounds ([9 x i8], [9 x i8]* @str, i32 0, i32 0), i32 9, i1 false)
77
78  ; This extra byte exists to prevent memcpyopt from propagating @str.
79  %p10 = getelementptr inbounds [10 x i8], [10 x i8]* %argmem, i32 0, i32 9
80  store i8 0, i8* %p10
81
  ; Save the 10 bytes into %tmp, then restore the stack to the point saved
  ; before %argmem was allocated. Per the PR40118 note at the top of this file,
  ; the restore ends the lifetime of %argmem, so %p must not be read afterwards.
82  call void @llvm.memcpy.p0i8.p0i8.i32(i8* %tmp, i8* %p, i32 10, i1 false)
83  call void @llvm.stackrestore(i8* %inalloca.save)
  ; This copy must keep %tmp as its source in the output.
84  %heap = call i8* @malloc(i32 9)
85  call void @llvm.memcpy.p0i8.p0i8.i32(i8* %heap, i8* %tmp, i32 9, i1 false)
86  call void @useit(i8* %heap)
87  ret i32 0
88}
89
; Declarations for the intrinsics and external functions called by the tests.
; memcpy variant with i8* destination and source and an i32 length; both
; pointer parameters are marked nocapture.
90declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture writeonly, i8* nocapture readonly, i32, i1)
; Stack save/restore pair used by @test_stackrestore around its inalloca.
91declare i8* @llvm.stacksave()
92declare void @llvm.stackrestore(i8*)
; Destination buffer for the final copy in each test, and the consumer that
; receives that heap pointer.
93declare i8* @malloc(i32)
94declare void @useit(i8*)
; Call with no arguments and no declared attributes, placed between the two
; copies in @test_norestore.
95declare void @external()
96