1 // NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py UTC_ARGS: --function-signature --include-generated-funcs
2 // RUN: %clang_cc1 -no-opaque-pointers -fopenmp-enable-irbuilder -verify -fopenmp -fopenmp-version=45 -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s
3 // expected-no-diagnostics
4 
5 #ifndef HEADER
6 #define HEADER
7 
8 // CHECK-LABEL: define {{.*}}@workshareloop_unsigned_static_chunked(
9 // CHECK-NEXT:  [[ENTRY:.*]]:
10 // CHECK-NEXT:    %[[A_ADDR:.+]] = alloca float*, align 8
11 // CHECK-NEXT:    %[[B_ADDR:.+]] = alloca float*, align 8
12 // CHECK-NEXT:    %[[C_ADDR:.+]] = alloca float*, align 8
13 // CHECK-NEXT:    %[[D_ADDR:.+]] = alloca float*, align 8
14 // CHECK-NEXT:    %[[I:.+]] = alloca i32, align 4
15 // CHECK-NEXT:    %[[AGG_CAPTURED:.+]] = alloca %struct.anon, align 8
16 // CHECK-NEXT:    %[[AGG_CAPTURED1:.+]] = alloca %struct.anon.0, align 4
17 // CHECK-NEXT:    %[[DOTCOUNT_ADDR:.+]] = alloca i32, align 4
18 // CHECK-NEXT:    %[[P_LASTITER:.+]] = alloca i32, align 4
19 // CHECK-NEXT:    %[[P_LOWERBOUND:.+]] = alloca i32, align 4
20 // CHECK-NEXT:    %[[P_UPPERBOUND:.+]] = alloca i32, align 4
21 // CHECK-NEXT:    %[[P_STRIDE:.+]] = alloca i32, align 4
22 // CHECK-NEXT:    store float* %[[A:.+]], float** %[[A_ADDR]], align 8
23 // CHECK-NEXT:    store float* %[[B:.+]], float** %[[B_ADDR]], align 8
24 // CHECK-NEXT:    store float* %[[C:.+]], float** %[[C_ADDR]], align 8
25 // CHECK-NEXT:    store float* %[[D:.+]], float** %[[D_ADDR]], align 8
26 // CHECK-NEXT:    store i32 33, i32* %[[I]], align 4
27 // CHECK-NEXT:    %[[TMP0:.+]] = getelementptr inbounds %struct.anon, %struct.anon* %[[AGG_CAPTURED]], i32 0, i32 0
28 // CHECK-NEXT:    store i32* %[[I]], i32** %[[TMP0]], align 8
29 // CHECK-NEXT:    %[[TMP1:.+]] = getelementptr inbounds %struct.anon.0, %struct.anon.0* %[[AGG_CAPTURED1]], i32 0, i32 0
30 // CHECK-NEXT:    %[[TMP2:.+]] = load i32, i32* %[[I]], align 4
31 // CHECK-NEXT:    store i32 %[[TMP2]], i32* %[[TMP1]], align 4
32 // CHECK-NEXT:    call void @__captured_stmt(i32* %[[DOTCOUNT_ADDR]], %struct.anon* %[[AGG_CAPTURED]])
33 // CHECK-NEXT:    %[[DOTCOUNT:.+]] = load i32, i32* %[[DOTCOUNT_ADDR]], align 4
34 // CHECK-NEXT:    br label %[[OMP_LOOP_PREHEADER:.+]]
35 // CHECK-EMPTY:
36 // CHECK-NEXT:  [[OMP_LOOP_PREHEADER]]:
37 // CHECK-NEXT:    store i32 0, i32* %[[P_LOWERBOUND]], align 4
38 // CHECK-NEXT:    %[[TMP3:.+]] = sub i32 %[[DOTCOUNT]], 1
39 // CHECK-NEXT:    store i32 %[[TMP3]], i32* %[[P_UPPERBOUND]], align 4
40 // CHECK-NEXT:    store i32 1, i32* %[[P_STRIDE]], align 4
41 // CHECK-NEXT:    %[[OMP_GLOBAL_THREAD_NUM:.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @1)
42 // CHECK-NEXT:    call void @__kmpc_for_static_init_4u(%struct.ident_t* @1, i32 %[[OMP_GLOBAL_THREAD_NUM]], i32 33, i32* %[[P_LASTITER]], i32* %[[P_LOWERBOUND]], i32* %[[P_UPPERBOUND]], i32* %[[P_STRIDE]], i32 1, i32 5)
43 // CHECK-NEXT:    %[[OMP_FIRSTCHUNK_LB:.+]] = load i32, i32* %[[P_LOWERBOUND]], align 4
44 // CHECK-NEXT:    %[[OMP_FIRSTCHUNK_UB:.+]] = load i32, i32* %[[P_UPPERBOUND]], align 4
45 // CHECK-NEXT:    %[[TMP4:.+]] = add i32 %[[OMP_FIRSTCHUNK_UB]], 1
46 // CHECK-NEXT:    %[[OMP_CHUNK_RANGE:.+]] = sub i32 %[[TMP4]], %[[OMP_FIRSTCHUNK_LB]]
47 // CHECK-NEXT:    %[[OMP_DISPATCH_STRIDE:.+]] = load i32, i32* %[[P_STRIDE]], align 4
48 // CHECK-NEXT:    %[[TMP5:.+]] = sub nuw i32 %[[DOTCOUNT]], %[[OMP_FIRSTCHUNK_LB]]
49 // CHECK-NEXT:    %[[TMP6:.+]] = icmp ule i32 %[[DOTCOUNT]], %[[OMP_FIRSTCHUNK_LB]]
50 // CHECK-NEXT:    %[[TMP7:.+]] = sub i32 %[[TMP5]], 1
51 // CHECK-NEXT:    %[[TMP8:.+]] = udiv i32 %[[TMP7]], %[[OMP_DISPATCH_STRIDE]]
52 // CHECK-NEXT:    %[[TMP9:.+]] = add i32 %[[TMP8]], 1
53 // CHECK-NEXT:    %[[TMP10:.+]] = icmp ule i32 %[[TMP5]], %[[OMP_DISPATCH_STRIDE]]
54 // CHECK-NEXT:    %[[TMP11:.+]] = select i1 %[[TMP10]], i32 1, i32 %[[TMP9]]
55 // CHECK-NEXT:    %[[OMP_DISPATCH_TRIPCOUNT:.+]] = select i1 %[[TMP6]], i32 0, i32 %[[TMP11]]
56 // CHECK-NEXT:    br label %[[OMP_DISPATCH_PREHEADER:.+]]
57 // CHECK-EMPTY:
58 // CHECK-NEXT:  [[OMP_DISPATCH_PREHEADER]]:
59 // CHECK-NEXT:    br label %[[OMP_DISPATCH_HEADER:.+]]
60 // CHECK-EMPTY:
61 // CHECK-NEXT:  [[OMP_DISPATCH_HEADER]]:
62 // CHECK-NEXT:    %[[OMP_DISPATCH_IV:.+]] = phi i32 [ 0, %[[OMP_DISPATCH_PREHEADER]] ], [ %[[OMP_DISPATCH_NEXT:.+]], %[[OMP_DISPATCH_INC:.+]] ]
63 // CHECK-NEXT:    br label %[[OMP_DISPATCH_COND:.+]]
64 // CHECK-EMPTY:
65 // CHECK-NEXT:  [[OMP_DISPATCH_COND]]:
66 // CHECK-NEXT:    %[[OMP_DISPATCH_CMP:.+]] = icmp ult i32 %[[OMP_DISPATCH_IV]], %[[OMP_DISPATCH_TRIPCOUNT]]
67 // CHECK-NEXT:    br i1 %[[OMP_DISPATCH_CMP]], label %[[OMP_DISPATCH_BODY:.+]], label %[[OMP_DISPATCH_EXIT:.+]]
68 // CHECK-EMPTY:
69 // CHECK-NEXT:  [[OMP_DISPATCH_BODY]]:
70 // CHECK-NEXT:    %[[TMP12:.+]] = mul i32 %[[OMP_DISPATCH_IV]], %[[OMP_DISPATCH_STRIDE]]
71 // CHECK-NEXT:    %[[TMP13:.+]] = add i32 %[[TMP12]], %[[OMP_FIRSTCHUNK_LB]]
72 // CHECK-NEXT:    br label %[[OMP_LOOP_PREHEADER9:.+]]
73 // CHECK-EMPTY:
74 // CHECK-NEXT:  [[OMP_DISPATCH_INC]]:
75 // CHECK-NEXT:    %[[OMP_DISPATCH_NEXT]] = add nuw i32 %[[OMP_DISPATCH_IV]], 1
76 // CHECK-NEXT:    br label %[[OMP_DISPATCH_HEADER]]
77 // CHECK-EMPTY:
78 // CHECK-NEXT:  [[OMP_DISPATCH_EXIT]]:
79 // CHECK-NEXT:    call void @__kmpc_for_static_fini(%struct.ident_t* @1, i32 %[[OMP_GLOBAL_THREAD_NUM]])
80 // CHECK-NEXT:    %[[OMP_GLOBAL_THREAD_NUM10:.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @1)
81 // CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @2, i32 %[[OMP_GLOBAL_THREAD_NUM10]])
82 // CHECK-NEXT:    br label %[[OMP_DISPATCH_AFTER:.+]]
83 // CHECK-EMPTY:
84 // CHECK-NEXT:  [[OMP_DISPATCH_AFTER]]:
85 // CHECK-NEXT:    br label %[[OMP_LOOP_AFTER:.+]]
86 // CHECK-EMPTY:
87 // CHECK-NEXT:  [[OMP_LOOP_PREHEADER9]]:
88 // CHECK-NEXT:    %[[TMP14:.+]] = add i32 %[[TMP13]], %[[OMP_CHUNK_RANGE]]
89 // CHECK-NEXT:    %[[OMP_CHUNK_IS_LAST:.+]] = icmp uge i32 %[[TMP14]], %[[DOTCOUNT]]
90 // CHECK-NEXT:    %[[TMP15:.+]] = sub i32 %[[DOTCOUNT]], %[[TMP13]]
91 // CHECK-NEXT:    %[[OMP_CHUNK_TRIPCOUNT:.+]] = select i1 %[[OMP_CHUNK_IS_LAST]], i32 %[[TMP15]], i32 %[[OMP_CHUNK_RANGE]]
92 // CHECK-NEXT:    br label %[[OMP_LOOP_HEADER:.+]]
93 // CHECK-EMPTY:
94 // CHECK-NEXT:  [[OMP_LOOP_HEADER]]:
95 // CHECK-NEXT:    %[[OMP_LOOP_IV:.+]] = phi i32 [ 0, %[[OMP_LOOP_PREHEADER9]] ], [ %[[OMP_LOOP_NEXT:.+]], %[[OMP_LOOP_INC:.+]] ]
96 // CHECK-NEXT:    br label %[[OMP_LOOP_COND:.+]]
97 // CHECK-EMPTY:
98 // CHECK-NEXT:  [[OMP_LOOP_COND]]:
99 // CHECK-NEXT:    %[[OMP_LOOP_CMP:.+]] = icmp ult i32 %[[OMP_LOOP_IV]], %[[OMP_CHUNK_TRIPCOUNT]]
100 // CHECK-NEXT:    br i1 %[[OMP_LOOP_CMP]], label %[[OMP_LOOP_BODY:.+]], label %[[OMP_LOOP_EXIT:.+]]
101 // CHECK-EMPTY:
102 // CHECK-NEXT:  [[OMP_LOOP_BODY]]:
103 // CHECK-NEXT:    %[[TMP16:.+]] = add i32 %[[OMP_LOOP_IV]], %[[TMP13]]
104 // CHECK-NEXT:    call void @__captured_stmt.1(i32* %[[I]], i32 %[[TMP16]], %struct.anon.0* %[[AGG_CAPTURED1]])
105 // CHECK-NEXT:    %[[TMP17:.+]] = load float*, float** %[[B_ADDR]], align 8
106 // CHECK-NEXT:    %[[TMP18:.+]] = load i32, i32* %[[I]], align 4
107 // CHECK-NEXT:    %[[IDXPROM:.+]] = zext i32 %[[TMP18]] to i64
108 // CHECK-NEXT:    %[[ARRAYIDX:.+]] = getelementptr inbounds float, float* %[[TMP17]], i64 %[[IDXPROM]]
109 // CHECK-NEXT:    %[[TMP19:.+]] = load float, float* %[[ARRAYIDX]], align 4
110 // CHECK-NEXT:    %[[TMP20:.+]] = load float*, float** %[[C_ADDR]], align 8
111 // CHECK-NEXT:    %[[TMP21:.+]] = load i32, i32* %[[I]], align 4
112 // CHECK-NEXT:    %[[IDXPROM2:.+]] = zext i32 %[[TMP21]] to i64
113 // CHECK-NEXT:    %[[ARRAYIDX3:.+]] = getelementptr inbounds float, float* %[[TMP20]], i64 %[[IDXPROM2]]
114 // CHECK-NEXT:    %[[TMP22:.+]] = load float, float* %[[ARRAYIDX3]], align 4
115 // CHECK-NEXT:    %[[MUL:.+]] = fmul float %[[TMP19]], %[[TMP22]]
116 // CHECK-NEXT:    %[[TMP23:.+]] = load float*, float** %[[D_ADDR]], align 8
117 // CHECK-NEXT:    %[[TMP24:.+]] = load i32, i32* %[[I]], align 4
118 // CHECK-NEXT:    %[[IDXPROM4:.+]] = zext i32 %[[TMP24]] to i64
119 // CHECK-NEXT:    %[[ARRAYIDX5:.+]] = getelementptr inbounds float, float* %[[TMP23]], i64 %[[IDXPROM4]]
120 // CHECK-NEXT:    %[[TMP25:.+]] = load float, float* %[[ARRAYIDX5]], align 4
121 // CHECK-NEXT:    %[[MUL6:.+]] = fmul float %[[MUL]], %[[TMP25]]
122 // CHECK-NEXT:    %[[TMP26:.+]] = load float*, float** %[[A_ADDR]], align 8
123 // CHECK-NEXT:    %[[TMP27:.+]] = load i32, i32* %[[I]], align 4
124 // CHECK-NEXT:    %[[IDXPROM7:.+]] = zext i32 %[[TMP27]] to i64
125 // CHECK-NEXT:    %[[ARRAYIDX8:.+]] = getelementptr inbounds float, float* %[[TMP26]], i64 %[[IDXPROM7]]
126 // CHECK-NEXT:    store float %[[MUL6]], float* %[[ARRAYIDX8]], align 4
127 // CHECK-NEXT:    br label %[[OMP_LOOP_INC]]
128 // CHECK-EMPTY:
129 // CHECK-NEXT:  [[OMP_LOOP_INC]]:
130 // CHECK-NEXT:    %[[OMP_LOOP_NEXT]] = add nuw i32 %[[OMP_LOOP_IV]], 1
131 // CHECK-NEXT:    br label %[[OMP_LOOP_HEADER]]
132 // CHECK-EMPTY:
133 // CHECK-NEXT:  [[OMP_LOOP_EXIT]]:
134 // CHECK-NEXT:    br label %[[OMP_DISPATCH_INC]]
135 // CHECK-EMPTY:
136 // CHECK-NEXT:  [[OMP_LOOP_AFTER]]:
137 // CHECK-NEXT:    ret void
138 // CHECK-NEXT:  }
139 
workshareloop_unsigned_static_chunked(float * a,float * b,float * c,float * d)140 extern "C" void workshareloop_unsigned_static_chunked(float *a, float *b, float *c, float *d) {
141 #pragma omp for schedule(static, 5)
142   for (unsigned i = 33; i < 32000000; i += 7) {
143     a[i] = b[i] * c[i] * d[i];
144   }
145 }
146 
147 #endif // HEADER
148 
149 // CHECK-LABEL: define {{.*}}@__captured_stmt(
150 // CHECK-NEXT:  [[ENTRY:.*]]:
151 // CHECK-NEXT:    %[[DISTANCE_ADDR:.+]] = alloca i32*, align 8
152 // CHECK-NEXT:    %[[__CONTEXT_ADDR:.+]] = alloca %struct.anon*, align 8
153 // CHECK-NEXT:    %[[DOTSTART:.+]] = alloca i32, align 4
154 // CHECK-NEXT:    %[[DOTSTOP:.+]] = alloca i32, align 4
155 // CHECK-NEXT:    %[[DOTSTEP:.+]] = alloca i32, align 4
156 // CHECK-NEXT:    store i32* %[[DISTANCE:.+]], i32** %[[DISTANCE_ADDR]], align 8
157 // CHECK-NEXT:    store %struct.anon* %[[__CONTEXT:.+]], %struct.anon** %[[__CONTEXT_ADDR]], align 8
158 // CHECK-NEXT:    %[[TMP0:.+]] = load %struct.anon*, %struct.anon** %[[__CONTEXT_ADDR]], align 8
159 // CHECK-NEXT:    %[[TMP1:.+]] = getelementptr inbounds %struct.anon, %struct.anon* %[[TMP0]], i32 0, i32 0
160 // CHECK-NEXT:    %[[TMP2:.+]] = load i32*, i32** %[[TMP1]], align 8
161 // CHECK-NEXT:    %[[TMP3:.+]] = load i32, i32* %[[TMP2]], align 4
162 // CHECK-NEXT:    store i32 %[[TMP3]], i32* %[[DOTSTART]], align 4
163 // CHECK-NEXT:    store i32 32000000, i32* %[[DOTSTOP]], align 4
164 // CHECK-NEXT:    store i32 7, i32* %[[DOTSTEP]], align 4
165 // CHECK-NEXT:    %[[TMP4:.+]] = load i32, i32* %[[DOTSTART]], align 4
166 // CHECK-NEXT:    %[[TMP5:.+]] = load i32, i32* %[[DOTSTOP]], align 4
167 // CHECK-NEXT:    %[[CMP:.+]] = icmp ult i32 %[[TMP4]], %[[TMP5]]
168 // CHECK-NEXT:    br i1 %[[CMP]], label %[[COND_TRUE:.+]], label %[[COND_FALSE:.+]]
169 // CHECK-EMPTY:
170 // CHECK-NEXT:  [[COND_TRUE]]:
171 // CHECK-NEXT:    %[[TMP6:.+]] = load i32, i32* %[[DOTSTOP]], align 4
172 // CHECK-NEXT:    %[[TMP7:.+]] = load i32, i32* %[[DOTSTART]], align 4
173 // CHECK-NEXT:    %[[SUB:.+]] = sub i32 %[[TMP6]], %[[TMP7]]
174 // CHECK-NEXT:    %[[TMP8:.+]] = load i32, i32* %[[DOTSTEP]], align 4
175 // CHECK-NEXT:    %[[SUB1:.+]] = sub i32 %[[TMP8]], 1
176 // CHECK-NEXT:    %[[ADD:.+]] = add i32 %[[SUB]], %[[SUB1]]
177 // CHECK-NEXT:    %[[TMP9:.+]] = load i32, i32* %[[DOTSTEP]], align 4
178 // CHECK-NEXT:    %[[DIV:.+]] = udiv i32 %[[ADD]], %[[TMP9]]
179 // CHECK-NEXT:    br label %[[COND_END:.+]]
180 // CHECK-EMPTY:
181 // CHECK-NEXT:  [[COND_FALSE]]:
182 // CHECK-NEXT:    br label %[[COND_END]]
183 // CHECK-EMPTY:
184 // CHECK-NEXT:  [[COND_END]]:
185 // CHECK-NEXT:    %[[COND:.+]] = phi i32 [ %[[DIV]], %[[COND_TRUE]] ], [ 0, %[[COND_FALSE]] ]
186 // CHECK-NEXT:    %[[TMP10:.+]] = load i32*, i32** %[[DISTANCE_ADDR]], align 8
187 // CHECK-NEXT:    store i32 %[[COND]], i32* %[[TMP10]], align 4
188 // CHECK-NEXT:    ret void
189 // CHECK-NEXT:  }
190 
191 
192 // CHECK-LABEL: define {{.*}}@__captured_stmt.1(
193 // CHECK-NEXT:  [[ENTRY:.*]]:
194 // CHECK-NEXT:    %[[LOOPVAR_ADDR:.+]] = alloca i32*, align 8
195 // CHECK-NEXT:    %[[LOGICAL_ADDR:.+]] = alloca i32, align 4
196 // CHECK-NEXT:    %[[__CONTEXT_ADDR:.+]] = alloca %struct.anon.0*, align 8
197 // CHECK-NEXT:    store i32* %[[LOOPVAR:.+]], i32** %[[LOOPVAR_ADDR]], align 8
198 // CHECK-NEXT:    store i32 %[[LOGICAL:.+]], i32* %[[LOGICAL_ADDR]], align 4
199 // CHECK-NEXT:    store %struct.anon.0* %[[__CONTEXT:.+]], %struct.anon.0** %[[__CONTEXT_ADDR]], align 8
200 // CHECK-NEXT:    %[[TMP0:.+]] = load %struct.anon.0*, %struct.anon.0** %[[__CONTEXT_ADDR]], align 8
201 // CHECK-NEXT:    %[[TMP1:.+]] = getelementptr inbounds %struct.anon.0, %struct.anon.0* %[[TMP0]], i32 0, i32 0
202 // CHECK-NEXT:    %[[TMP2:.+]] = load i32, i32* %[[TMP1]], align 4
203 // CHECK-NEXT:    %[[TMP3:.+]] = load i32, i32* %[[LOGICAL_ADDR]], align 4
204 // CHECK-NEXT:    %[[MUL:.+]] = mul i32 7, %[[TMP3]]
205 // CHECK-NEXT:    %[[ADD:.+]] = add i32 %[[TMP2]], %[[MUL]]
206 // CHECK-NEXT:    %[[TMP4:.+]] = load i32*, i32** %[[LOOPVAR_ADDR]], align 8
207 // CHECK-NEXT:    store i32 %[[ADD]], i32* %[[TMP4]], align 4
208 // CHECK-NEXT:    ret void
209 // CHECK-NEXT:  }
210 
211 
212 // CHECK: ![[META0:[0-9]+]] = !{i32 1, !"wchar_size", i32 4}
213 // CHECK: ![[META1:[0-9]+]] = !{i32 7, !"openmp", i32 45}
214 // CHECK: ![[META2:[0-9]+]] =
215