; Test input for the alignment-from-assumptions transformation. Each function
; below states an alignment fact about a pointer through @llvm.assume, then
; performs a memory operation written with `align 4`; the FileCheck directives
; inside each function give the `align` value expected in opt's output.
; The two lit run lines below invoke opt once with the
; `-alignment-from-assumptions` flag and once with the `-passes=` spelling, and
; match both outputs against the same directives in this file.
1target datalayout = "e-i64:64-f80:128-n8:16:32:64-S128"
2; RUN: opt < %s -alignment-from-assumptions -S | FileCheck %s
3; RUN: opt < %s -passes=alignment-from-assumptions -S | FileCheck %s
4
; Simplest case: the assumption says the low five bits of %a's address are
; zero (mask 31), i.e. the address is a multiple of 32. The load reads straight
; from %a and is written with `align 4`; the expected output has `align 32`.
5define i32 @foo(i32* nocapture %a) nounwind uwtable readonly {
6entry:
  ; (address & 31) == 0 is the condition handed to @llvm.assume.
7  %ptrint = ptrtoint i32* %a to i64
8  %maskedptr = and i64 %ptrint, 31
9  %maskcond = icmp eq i64 %maskedptr, 0
10  tail call void @llvm.assume(i1 %maskcond)
  ; The access whose alignment is expected to be raised.
11  %0 = load i32, i32* %a, align 4
12  ret i32 %0
13
14; CHECK-LABEL: @foo
15; CHECK: load i32, i32* {{[^,]+}}, align 32
16; CHECK: ret i32
17}
18
; Assumption with a constant offset: (address of %a + 24) is a multiple of 32,
; so the address of %a is congruent to 8 modulo 32. The load reads i32 element
; 2 (%a + 8 bytes), which is congruent to 16 modulo 32, so the expected output
; raises the load to `align 16` rather than 32.
19define i32 @foo2(i32* nocapture %a) nounwind uwtable readonly {
20entry:
21  %ptrint = ptrtoint i32* %a to i64
  ; The offset is applied to the integer address before masking.
22  %offsetptr = add i64 %ptrint, 24
23  %maskedptr = and i64 %offsetptr, 31
24  %maskcond = icmp eq i64 %maskedptr, 0
25  tail call void @llvm.assume(i1 %maskcond)
  ; Element index 2 of i32 = byte offset 8 from %a.
26  %arrayidx = getelementptr inbounds i32, i32* %a, i64 2
27  %0 = load i32, i32* %arrayidx, align 4
28  ret i32 %0
29
30; CHECK-LABEL: @foo2
31; CHECK: load i32, i32* {{[^,]+}}, align 16
32; CHECK: ret i32
33}
34
; Offset assumption combined with a negative index: (address of %a + 28) is a
; multiple of 32, so the address of %a is congruent to 4 modulo 32. The load
; reads i32 element -1 (%a - 4 bytes), which lands exactly on a multiple of 32,
; so the expected output raises the load to `align 32`.
35define i32 @foo2a(i32* nocapture %a) nounwind uwtable readonly {
36entry:
37  %ptrint = ptrtoint i32* %a to i64
38  %offsetptr = add i64 %ptrint, 28
39  %maskedptr = and i64 %offsetptr, 31
40  %maskcond = icmp eq i64 %maskedptr, 0
41  tail call void @llvm.assume(i1 %maskcond)
  ; Element index -1 of i32 = byte offset -4 from %a.
42  %arrayidx = getelementptr inbounds i32, i32* %a, i64 -1
43  %0 = load i32, i32* %arrayidx, align 4
44  ret i32 %0
45
46; CHECK-LABEL: @foo2a
47; CHECK: load i32, i32* {{[^,]+}}, align 32
48; CHECK: ret i32
49}
50
; Instruction-for-instruction the same as @foo under a different name: %a is
; assumed to be a multiple of 32 and the direct `align 4` load from %a is
; expected to come out as `align 32`.
51define i32 @goo(i32* nocapture %a) nounwind uwtable readonly {
52entry:
53  %ptrint = ptrtoint i32* %a to i64
54  %maskedptr = and i64 %ptrint, 31
55  %maskcond = icmp eq i64 %maskedptr, 0
56  tail call void @llvm.assume(i1 %maskcond)
57  %0 = load i32, i32* %a, align 4
58  ret i32 %0
59
60; CHECK-LABEL: @goo
61; CHECK: load i32, i32* {{[^,]+}}, align 32
62; CHECK: ret i32
63}
64
; Loop case: %a is assumed to be a multiple of 32 in the entry block, and the
; loop loads %a[i] for an index that starts at 0 and advances by 8 i32
; elements (32 bytes) per iteration. Every loaded address is therefore a
; multiple of 32, and the expected output has the in-loop load at `align 32`.
; The loaded values are summed and the sum is returned.
65define i32 @hoo(i32* nocapture %a) nounwind uwtable readonly {
66entry:
67  %ptrint = ptrtoint i32* %a to i64
68  %maskedptr = and i64 %ptrint, 31
69  %maskcond = icmp eq i64 %maskedptr, 0
70  tail call void @llvm.assume(i1 %maskcond)
71  br label %for.body
72
73for.body:                                         ; preds = %entry, %for.body
  ; %indvars.iv is the element index, %r.06 the running sum.
74  %indvars.iv = phi i64 [ 0, %entry ], [ %indvars.iv.next, %for.body ]
75  %r.06 = phi i32 [ 0, %entry ], [ %add, %for.body ]
76  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
77  %0 = load i32, i32* %arrayidx, align 4
78  %add = add nsw i32 %0, %r.06
  ; Step of 8 elements * 4 bytes = 32 bytes between consecutive accesses.
79  %indvars.iv.next = add i64 %indvars.iv, 8
  ; The exit test is a signed compare of the index truncated to 32 bits.
80  %1 = trunc i64 %indvars.iv.next to i32
81  %cmp = icmp slt i32 %1, 2048
82  br i1 %cmp, label %for.body, label %for.end
83
84for.end:                                          ; preds = %for.body
85  %add.lcssa = phi i32 [ %add, %for.body ]
86  ret i32 %add.lcssa
87
88; CHECK-LABEL: @hoo
89; CHECK: load i32, i32* %arrayidx, align 32
90; CHECK: ret i32 %add.lcssa
91}
92
93; test D66575
94; def hoo2(a, id, num):
95;   for i0 in range(id*64, 4096, num*64):
96;     for i1 in range(0, 4096, 32):
97;       for i2 in range(0, 4096, 32):
98;         load(a, i0+i1+i2+32)
; Triple loop nest whose load index is the sum of three induction variables
; plus a constant. %a is assumed to be a multiple of 32. The outer index starts
; at %id << 6 and steps by %num << 6; the two inner indices start at 0 and step
; by 32; the constant added is 32. Each term is thus a multiple of 32 i32
; elements (128 bytes), and the expected output has the load at `align 32`.
; The loaded value %x is not used and the function returns void.
99define void @hoo2(i32* nocapture %a, i64 %id, i64 %num) nounwind uwtable readonly {
100entry:
101  %ptrint = ptrtoint i32* %a to i64
102  %maskedptr = and i64 %ptrint, 31
103  %maskcond = icmp eq i64 %maskedptr, 0
104  tail call void @llvm.assume(i1 %maskcond)
  ; Start value and stride of the outermost loop, both scaled by 64.
105  %id.mul = shl nsw i64 %id, 6
106  %num.mul = shl nsw i64 %num, 6
107  br label %for0.body
108
109for0.body:
110  %i0 = phi i64 [ %id.mul, %entry ], [ %i0.next, %for0.end ]
111  br label %for1.body
112
113for1.body:
114  %i1 = phi i64 [ 0, %for0.body ], [ %i1.next, %for1.end ]
115  br label %for2.body
116
117for2.body:
118  %i2 = phi i64 [ 0, %for1.body ], [ %i2.next, %for2.body ]
119
  ; Element index = i0 + i1 + i2 + 32.
120  %t1 = add nuw nsw i64 %i0, %i1
121  %t2 = add nuw nsw i64 %t1, %i2
122  %t3 = add nuw nsw i64 %t2, 32
123  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %t3
124  %x = load i32, i32* %arrayidx, align 4
125
  ; Innermost loop latch: advance i2 by 32 while it stays below 4096.
126  %i2.next = add nuw nsw i64 %i2, 32
127  %cmp2 = icmp ult i64 %i2.next, 4096
128  br i1 %cmp2, label %for2.body, label %for1.end
129
130for1.end:
  ; Middle loop latch: advance i1 by 32 while it stays below 4096.
131  %i1.next = add nuw nsw i64 %i1, 32
132  %cmp1 = icmp ult i64 %i1.next, 4096
133  br i1 %cmp1, label %for1.body, label %for0.end
134
135for0.end:
  ; Outer loop latch: advance i0 by %num << 6 while it stays below 4096.
136  %i0.next = add nuw nsw i64 %i0, %num.mul
137  %cmp0 = icmp ult i64 %i0.next, 4096
138  br i1 %cmp0, label %for0.body, label %return
139
140return:
141  ret void
142
143; CHECK-LABEL: @hoo2
144; CHECK: load i32, i32* %arrayidx, align 32
145; CHECK: ret void
146}
147
; Loop with a non-zero start: %a is assumed to be a multiple of 32, and the
; index starts at element 4 (16 bytes) and advances by 8 elements (32 bytes).
; Every loaded address is congruent to 16 modulo 32, so the expected output
; raises the load to `align 16` only.
148define i32 @joo(i32* nocapture %a) nounwind uwtable readonly {
149entry:
150  %ptrint = ptrtoint i32* %a to i64
151  %maskedptr = and i64 %ptrint, 31
152  %maskcond = icmp eq i64 %maskedptr, 0
153  tail call void @llvm.assume(i1 %maskcond)
154  br label %for.body
155
156for.body:                                         ; preds = %entry, %for.body
  ; Initial index 4: the first access is 16 bytes past %a.
157  %indvars.iv = phi i64 [ 4, %entry ], [ %indvars.iv.next, %for.body ]
158  %r.06 = phi i32 [ 0, %entry ], [ %add, %for.body ]
159  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
160  %0 = load i32, i32* %arrayidx, align 4
161  %add = add nsw i32 %0, %r.06
162  %indvars.iv.next = add i64 %indvars.iv, 8
163  %1 = trunc i64 %indvars.iv.next to i32
164  %cmp = icmp slt i32 %1, 2048
165  br i1 %cmp, label %for.body, label %for.end
166
167for.end:                                          ; preds = %for.body
168  %add.lcssa = phi i32 [ %add, %for.body ]
169  ret i32 %add.lcssa
170
171; CHECK-LABEL: @joo
172; CHECK: load i32, i32* %arrayidx, align 16
173; CHECK: ret i32 %add.lcssa
174}
175
; Loop with a smaller stride: %a is assumed to be a multiple of 32, and the
; index starts at 0 but advances by 4 elements (16 bytes). The loaded
; addresses are multiples of 16 but not all multiples of 32, so the expected
; output raises the load to `align 16`.
176define i32 @koo(i32* nocapture %a) nounwind uwtable readonly {
177entry:
178  %ptrint = ptrtoint i32* %a to i64
179  %maskedptr = and i64 %ptrint, 31
180  %maskcond = icmp eq i64 %maskedptr, 0
181  tail call void @llvm.assume(i1 %maskcond)
182  br label %for.body
183
184for.body:                                         ; preds = %entry, %for.body
185  %indvars.iv = phi i64 [ 0, %entry ], [ %indvars.iv.next, %for.body ]
186  %r.06 = phi i32 [ 0, %entry ], [ %add, %for.body ]
187  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
188  %0 = load i32, i32* %arrayidx, align 4
189  %add = add nsw i32 %0, %r.06
  ; Step of 4 elements * 4 bytes = 16 bytes between consecutive accesses.
190  %indvars.iv.next = add i64 %indvars.iv, 4
191  %1 = trunc i64 %indvars.iv.next to i32
192  %cmp = icmp slt i32 %1, 2048
193  br i1 %cmp, label %for.body, label %for.end
194
195for.end:                                          ; preds = %for.body
196  %add.lcssa = phi i32 [ %add, %for.body ]
197  ret i32 %add.lcssa
198
199; CHECK-LABEL: @koo
200; CHECK: load i32, i32* %arrayidx, align 16
201; CHECK: ret i32 %add.lcssa
202}
203
; Same 16-byte stride as @koo but with a negative start: the index begins at
; element -4 (16 bytes before %a) and advances by 4 elements. With %a assumed
; to be a multiple of 32, every loaded address is a multiple of 16, and the
; expected output raises the load to `align 16`.
204define i32 @koo2(i32* nocapture %a) nounwind uwtable readonly {
205entry:
206  %ptrint = ptrtoint i32* %a to i64
207  %maskedptr = and i64 %ptrint, 31
208  %maskcond = icmp eq i64 %maskedptr, 0
209  tail call void @llvm.assume(i1 %maskcond)
210  br label %for.body
211
212for.body:                                         ; preds = %entry, %for.body
  ; Initial index -4: the first access is 16 bytes before %a.
213  %indvars.iv = phi i64 [ -4, %entry ], [ %indvars.iv.next, %for.body ]
214  %r.06 = phi i32 [ 0, %entry ], [ %add, %for.body ]
215  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
216  %0 = load i32, i32* %arrayidx, align 4
217  %add = add nsw i32 %0, %r.06
218  %indvars.iv.next = add i64 %indvars.iv, 4
219  %1 = trunc i64 %indvars.iv.next to i32
220  %cmp = icmp slt i32 %1, 2048
221  br i1 %cmp, label %for.body, label %for.end
222
223for.end:                                          ; preds = %for.body
224  %add.lcssa = phi i32 [ %add, %for.body ]
225  ret i32 %add.lcssa
226
227; CHECK-LABEL: @koo2
228; CHECK: load i32, i32* %arrayidx, align 16
229; CHECK: ret i32 %add.lcssa
230}
231
; Intrinsic case (memset): %a is assumed to be a multiple of 32, then 64 bytes
; starting at %a are set to zero through a memset call whose destination is
; written with `align 4`. The expected output has the destination at
; `align 32`. Unlike the load tests, this function is not marked readonly.
; The return value is undef.
232define i32 @moo(i32* nocapture %a) nounwind uwtable {
233entry:
234  %ptrint = ptrtoint i32* %a to i64
235  %maskedptr = and i64 %ptrint, 31
236  %maskcond = icmp eq i64 %maskedptr, 0
237  tail call void @llvm.assume(i1 %maskcond)
  ; The intrinsic takes an i8*, so %a is bitcast first.
238  %0 = bitcast i32* %a to i8*
239  tail call void @llvm.memset.p0i8.i64(i8* align 4 %0, i8 0, i64 64, i1 false)
240  ret i32 undef
241
242; CHECK-LABEL: @moo
243; CHECK: @llvm.memset.p0i8.i64(i8* align 32 %0, i8 0, i64 64, i1 false)
244; CHECK: ret i32 undef
245}
246
; Intrinsic case (memcpy) with two independent assumptions: %a is assumed to
; be a multiple of 32 (mask 31) and %b a multiple of 128 (mask 127). 64 bytes
; are copied from %b to %a with both pointers written as `align 4`; the
; expected output has the destination at `align 32` and the source at
; `align 128`. The return value is undef.
247define i32 @moo2(i32* nocapture %a, i32* nocapture %b) nounwind uwtable {
248entry:
  ; Assumption on the destination pointer %a.
249  %ptrint = ptrtoint i32* %a to i64
250  %maskedptr = and i64 %ptrint, 31
251  %maskcond = icmp eq i64 %maskedptr, 0
252  tail call void @llvm.assume(i1 %maskcond)
  ; Assumption on the source pointer %b.
253  %ptrint1 = ptrtoint i32* %b to i64
254  %maskedptr3 = and i64 %ptrint1, 127
255  %maskcond4 = icmp eq i64 %maskedptr3, 0
256  tail call void @llvm.assume(i1 %maskcond4)
257  %0 = bitcast i32* %a to i8*
258  %1 = bitcast i32* %b to i8*
259  tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 4 %0, i8* align 4 %1, i64 64, i1 false)
260  ret i32 undef
261
262; CHECK-LABEL: @moo2
263; CHECK: @llvm.memcpy.p0i8.p0i8.i64(i8* align 32 %0, i8* align 128 %1, i64 64, i1 false)
264; CHECK: ret i32 undef
265}
266
; Declarations of the intrinsics called by the functions in this file:
; @llvm.assume receives each alignment condition, and the memset/memcpy
; intrinsics are the calls whose pointer `align` values @moo and @moo2 expect
; to be raised.
267declare void @llvm.assume(i1) nounwind
268
269declare void @llvm.memset.p0i8.i64(i8* nocapture, i8, i64, i1) nounwind
270declare void @llvm.memcpy.p0i8.p0i8.i64(i8* nocapture, i8* nocapture, i64, i1) nounwind
271
272