1*1ec469cfSAlexey Bataev // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=50 -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s
2*1ec469cfSAlexey Bataev // RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s
3*1ec469cfSAlexey Bataev // RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s
4*1ec469cfSAlexey Bataev 
5*1ec469cfSAlexey Bataev // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=50 -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s
6*1ec469cfSAlexey Bataev // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s
7*1ec469cfSAlexey Bataev // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY0 %s
8*1ec469cfSAlexey Bataev // SIMD-ONLY0-NOT: {{__kmpc|__tgt}}
9*1ec469cfSAlexey Bataev // expected-no-diagnostics
10*1ec469cfSAlexey Bataev #ifndef HEADER
11*1ec469cfSAlexey Bataev #define HEADER
12*1ec469cfSAlexey Bataev 
13*1ec469cfSAlexey Bataev void foo();
14*1ec469cfSAlexey Bataev void bar();
15*1ec469cfSAlexey Bataev 
16*1ec469cfSAlexey Bataev // CHECK: define void @{{.*}}baz{{.*}}(i32 %n)
17*1ec469cfSAlexey Bataev void baz(int n) {
18*1ec469cfSAlexey Bataev   static float a[10];
19*1ec469cfSAlexey Bataev   static double b;
20*1ec469cfSAlexey Bataev 
21*1ec469cfSAlexey Bataev   // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(
22*1ec469cfSAlexey Bataev   // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(
23*1ec469cfSAlexey Bataev 
24*1ec469cfSAlexey Bataev   // CHECK: call i8* @llvm.stacksave()
25*1ec469cfSAlexey Bataev   // CHECK: [[A_BUF_SIZE:%.+]] = mul nuw i64 10, [[NUM_ELEMS:%[^,]+]]
26*1ec469cfSAlexey Bataev 
27*1ec469cfSAlexey Bataev   // float a_buffer[10][n];
28*1ec469cfSAlexey Bataev   // CHECK: [[A_BUF:%.+]] = alloca float, i64 [[A_BUF_SIZE]],
29*1ec469cfSAlexey Bataev 
30*1ec469cfSAlexey Bataev   // double b_buffer[10];
31*1ec469cfSAlexey Bataev   // CHECK: [[B_BUF:%.+]] = alloca double, i64 10,
32*1ec469cfSAlexey Bataev #pragma omp parallel for reduction(inscan, +:a[:n], b)
33*1ec469cfSAlexey Bataev   for (int i = 0; i < 10; ++i) {
34*1ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_init_4(
35*1ec469cfSAlexey Bataev     // CHECK: call i8* @llvm.stacksave()
36*1ec469cfSAlexey Bataev     // CHECK: store float 0.000000e+00, float* %
37*1ec469cfSAlexey Bataev     // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]],
38*1ec469cfSAlexey Bataev     // CHECK: br label %[[DISPATCH:[^,]+]]
39*1ec469cfSAlexey Bataev     // CHECK: [[INPUT_PHASE:.+]]:
40*1ec469cfSAlexey Bataev     // CHECK: call void @{{.+}}foo{{.+}}()
41*1ec469cfSAlexey Bataev 
42*1ec469cfSAlexey Bataev     // a_buffer[i][0..n] = a_priv[[0..n];
43*1ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]],
44*1ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64
45*1ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]]
46*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
47*1ec469cfSAlexey Bataev     // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0
48*1ec469cfSAlexey Bataev     // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4
49*1ec469cfSAlexey Bataev     // CHECK: [[DEST:%.+]] = bitcast float* [[A_BUF_IDX]] to i8*
50*1ec469cfSAlexey Bataev     // CHECK: [[SRC:%.+]] = bitcast float* [[A_PRIV]] to i8*
51*1ec469cfSAlexey Bataev     // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false)
52*1ec469cfSAlexey Bataev 
53*1ec469cfSAlexey Bataev     // b_buffer[i] = b_priv;
54*1ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]]
55*1ec469cfSAlexey Bataev     // CHECK: [[B_PRIV:%.+]] = load double, double* [[B_PRIV_ADDR]],
56*1ec469cfSAlexey Bataev     // CHECK: store double [[B_PRIV]], double* [[B_BUF_IDX]],
57*1ec469cfSAlexey Bataev     // CHECK: br label %[[LOOP_CONTINUE:.+]]
58*1ec469cfSAlexey Bataev 
59*1ec469cfSAlexey Bataev     // CHECK: [[DISPATCH]]:
60*1ec469cfSAlexey Bataev     // CHECK: br label %[[INPUT_PHASE]]
61*1ec469cfSAlexey Bataev     // CHECK: [[LOOP_CONTINUE]]:
62*1ec469cfSAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8* %
63*1ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_fini(
64*1ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_barrier(
65*1ec469cfSAlexey Bataev     foo();
66*1ec469cfSAlexey Bataev #pragma omp scan inclusive(a[:n], b)
67*1ec469cfSAlexey Bataev     // CHECK: [[LOG2_10:%.+]] = call double @llvm.log2.f64(double 1.000000e+01)
68*1ec469cfSAlexey Bataev     // CHECK: [[CEIL_LOG2_10:%.+]] = call double @llvm.ceil.f64(double [[LOG2_10]])
69*1ec469cfSAlexey Bataev     // CHECK: [[CEIL_LOG2_10_INT:%.+]] = fptoui double [[CEIL_LOG2_10]] to i32
70*1ec469cfSAlexey Bataev     // CHECK: br label %[[OUTER_BODY:[^,]+]]
71*1ec469cfSAlexey Bataev     // CHECK: [[OUTER_BODY]]:
72*1ec469cfSAlexey Bataev     // CHECK: [[K:%.+]] = phi i32 [ 0, %{{.+}} ], [ [[K_NEXT:%.+]], %{{.+}} ]
73*1ec469cfSAlexey Bataev     // CHECK: [[K2POW:%.+]] = phi i64 [ 1, %{{.+}} ], [ [[K2POW_NEXT:%.+]], %{{.+}} ]
74*1ec469cfSAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp uge i64 9, [[K2POW]]
75*1ec469cfSAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[INNER_BODY:[^,]+]], label %[[INNER_EXIT:[^,]+]]
76*1ec469cfSAlexey Bataev     // CHECK: [[INNER_BODY]]:
77*1ec469cfSAlexey Bataev     // CHECK: [[I:%.+]] = phi i64 [ 9, %[[OUTER_BODY]] ], [ [[I_PREV:%.+]], %{{.+}} ]
78*1ec469cfSAlexey Bataev 
79*1ec469cfSAlexey Bataev     // a_buffer[i] += a_buffer[i-pow(2, k)];
80*1ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[I]], [[NUM_ELEMS]]
81*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
82*1ec469cfSAlexey Bataev     // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]]
83*1ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[IDX_SUB_K2POW]], [[NUM_ELEMS]]
84*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
85*1ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[I]]
86*1ec469cfSAlexey Bataev     // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]]
87*1ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[IDX_SUB_K2POW]]
88*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_END:%.+]] = getelementptr float, float* [[A_BUF_IDX]], i64 [[NUM_ELEMS]]
89*1ec469cfSAlexey Bataev     // CHECK: [[ISEMPTY:%.+]] = icmp eq float* [[A_BUF_IDX]], [[A_BUF_END]]
90*1ec469cfSAlexey Bataev     // CHECK: br i1 [[ISEMPTY]], label %[[RED_DONE:[^,]+]], label %[[RED_BODY:[^,]+]]
91*1ec469cfSAlexey Bataev     // CHECK: [[RED_BODY]]:
92*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_ELEM:%.+]] = phi float* [ [[A_BUF_IDX_SUB_K2POW]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_SUB_K2POW_NEXT:%.+]], %[[RED_BODY]] ]
93*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_ELEM:%.+]] = phi float* [ [[A_BUF_IDX]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_NEXT:%.+]], %[[RED_BODY]] ]
94*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_VAL:%.+]] = load float, float* [[A_BUF_IDX_ELEM]],
95*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_VAL:%.+]] = load float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]],
96*1ec469cfSAlexey Bataev     // CHECK: [[RED:%.+]] = fadd float [[A_BUF_IDX_VAL]], [[A_BUF_IDX_SUB_K2POW_VAL]]
97*1ec469cfSAlexey Bataev     // CHECK: store float [[RED]], float* [[A_BUF_IDX_ELEM]],
98*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_NEXT]] = getelementptr float, float* [[A_BUF_IDX_ELEM]], i32 1
99*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_NEXT]] = getelementptr float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]], i32 1
100*1ec469cfSAlexey Bataev     // CHECK: [[DONE:%.+]] = icmp eq float* [[A_BUF_IDX_NEXT]], [[A_BUF_END]]
101*1ec469cfSAlexey Bataev     // CHECK: br i1 [[DONE]], label %[[RED_DONE]], label %[[RED_BODY]]
102*1ec469cfSAlexey Bataev     // CHECK: [[RED_DONE]]:
103*1ec469cfSAlexey Bataev 
104*1ec469cfSAlexey Bataev     // b_buffer[i] += b_buffer[i-pow(2, k)];
105*1ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]],
106*1ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_SUB_K2POW_VAL:%.+]] = load double, double* [[B_BUF_IDX_SUB_K2POW]],
107*1ec469cfSAlexey Bataev     // CHECK: [[RED:%.+]] = fadd double [[B_BUF_IDX_VAL]], [[B_BUF_IDX_SUB_K2POW_VAL]]
108*1ec469cfSAlexey Bataev     // CHECK: store double [[RED]], double* [[B_BUF_IDX]],
109*1ec469cfSAlexey Bataev 
110*1ec469cfSAlexey Bataev     // --i;
111*1ec469cfSAlexey Bataev     // CHECK: [[I_PREV:%.+]] = sub nuw i64 [[I]], 1
112*1ec469cfSAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp uge i64 [[I_PREV]], [[K2POW]]
113*1ec469cfSAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[INNER_BODY]], label %[[INNER_EXIT]]
114*1ec469cfSAlexey Bataev     // CHECK: [[INNER_EXIT]]:
115*1ec469cfSAlexey Bataev 
116*1ec469cfSAlexey Bataev     // ++k;
117*1ec469cfSAlexey Bataev     // CHECK: [[K_NEXT]] = add nuw i32 [[K]], 1
118*1ec469cfSAlexey Bataev     // k2pow <<= 1;
119*1ec469cfSAlexey Bataev     // CHECK: [[K2POW_NEXT]] = shl nuw i64 [[K2POW]], 1
120*1ec469cfSAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp ne i32 [[K_NEXT]], [[CEIL_LOG2_10_INT]]
121*1ec469cfSAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[OUTER_BODY]], label %[[OUTER_EXIT:[^,]+]]
122*1ec469cfSAlexey Bataev     // CHECK: [[OUTER_EXIT]]:
123*1ec469cfSAlexey Bataev     bar();
124*1ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_init_4(
125*1ec469cfSAlexey Bataev     // CHECK: call i8* @llvm.stacksave()
126*1ec469cfSAlexey Bataev     // CHECK: store float 0.000000e+00, float* %
127*1ec469cfSAlexey Bataev     // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]],
128*1ec469cfSAlexey Bataev     // CHECK: br label %[[DISPATCH:[^,]+]]
129*1ec469cfSAlexey Bataev 
130*1ec469cfSAlexey Bataev     // Skip the before scan body.
131*1ec469cfSAlexey Bataev     // CHECK: call void @{{.+}}foo{{.+}}()
132*1ec469cfSAlexey Bataev 
133*1ec469cfSAlexey Bataev     // CHECK: [[EXIT_INSCAN:[^,]+]]:
134*1ec469cfSAlexey Bataev     // CHECK: br label %[[LOOP_CONTINUE:[^,]+]]
135*1ec469cfSAlexey Bataev 
136*1ec469cfSAlexey Bataev     // CHECK: [[DISPATCH]]:
137*1ec469cfSAlexey Bataev     // a_priv[[0..n] = a_buffer[i][0..n];
138*1ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]],
139*1ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64
140*1ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]]
141*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
142*1ec469cfSAlexey Bataev     // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0
143*1ec469cfSAlexey Bataev     // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4
144*1ec469cfSAlexey Bataev     // CHECK: [[DEST:%.+]] = bitcast float* [[A_PRIV]] to i8*
145*1ec469cfSAlexey Bataev     // CHECK: [[SRC:%.+]] = bitcast float* [[A_BUF_IDX]] to i8*
146*1ec469cfSAlexey Bataev     // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false)
147*1ec469cfSAlexey Bataev 
148*1ec469cfSAlexey Bataev     // b_priv = b_buffer[i];
149*1ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]]
150*1ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]],
151*1ec469cfSAlexey Bataev     // CHECK: store double [[B_BUF_IDX_VAL]], double* [[B_PRIV_ADDR]],
152*1ec469cfSAlexey Bataev     // CHECK: br label %[[SCAN_PHASE:[^,]+]]
153*1ec469cfSAlexey Bataev 
154*1ec469cfSAlexey Bataev     // CHECK: [[SCAN_PHASE]]:
155*1ec469cfSAlexey Bataev     // CHECK: call void @{{.+}}bar{{.+}}()
156*1ec469cfSAlexey Bataev     // CHECK: br label %[[EXIT_INSCAN]]
157*1ec469cfSAlexey Bataev 
158*1ec469cfSAlexey Bataev     // CHECK: [[LOOP_CONTINUE]]:
159*1ec469cfSAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8* %
160*1ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_fini(
161*1ec469cfSAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8*
162*1ec469cfSAlexey Bataev   }
163*1ec469cfSAlexey Bataev 
164*1ec469cfSAlexey Bataev   // CHECK: call i8* @llvm.stacksave()
165*1ec469cfSAlexey Bataev   // CHECK: [[A_BUF_SIZE:%.+]] = mul nuw i64 10, [[NUM_ELEMS:%[^,]+]]
166*1ec469cfSAlexey Bataev 
167*1ec469cfSAlexey Bataev   // float a_buffer[10][n];
168*1ec469cfSAlexey Bataev   // CHECK: [[A_BUF:%.+]] = alloca float, i64 [[A_BUF_SIZE]],
169*1ec469cfSAlexey Bataev 
170*1ec469cfSAlexey Bataev   // double b_buffer[10];
171*1ec469cfSAlexey Bataev   // CHECK: [[B_BUF:%.+]] = alloca double, i64 10,
172*1ec469cfSAlexey Bataev #pragma omp parallel for reduction(inscan, +:a[:n], b)
173*1ec469cfSAlexey Bataev   for (int i = 0; i < 10; ++i) {
174*1ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_init_4(
175*1ec469cfSAlexey Bataev     // CHECK: call i8* @llvm.stacksave()
176*1ec469cfSAlexey Bataev     // CHECK: store float 0.000000e+00, float* %
177*1ec469cfSAlexey Bataev     // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]],
178*1ec469cfSAlexey Bataev     // CHECK: br label %[[DISPATCH:[^,]+]]
179*1ec469cfSAlexey Bataev 
180*1ec469cfSAlexey Bataev     // Skip the before scan body.
181*1ec469cfSAlexey Bataev     // CHECK: call void @{{.+}}foo{{.+}}()
182*1ec469cfSAlexey Bataev 
183*1ec469cfSAlexey Bataev     // CHECK: [[EXIT_INSCAN:[^,]+]]:
184*1ec469cfSAlexey Bataev 
185*1ec469cfSAlexey Bataev     // a_buffer[i][0..n] = a_priv[[0..n];
186*1ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]],
187*1ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64
188*1ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]]
189*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
190*1ec469cfSAlexey Bataev     // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0
191*1ec469cfSAlexey Bataev     // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4
192*1ec469cfSAlexey Bataev     // CHECK: [[DEST:%.+]] = bitcast float* [[A_BUF_IDX]] to i8*
193*1ec469cfSAlexey Bataev     // CHECK: [[SRC:%.+]] = bitcast float* [[A_PRIV]] to i8*
194*1ec469cfSAlexey Bataev     // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false)
195*1ec469cfSAlexey Bataev 
196*1ec469cfSAlexey Bataev     // b_buffer[i] = b_priv;
197*1ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]]
198*1ec469cfSAlexey Bataev     // CHECK: [[B_PRIV:%.+]] = load double, double* [[B_PRIV_ADDR]],
199*1ec469cfSAlexey Bataev     // CHECK: store double [[B_PRIV]], double* [[B_BUF_IDX]],
200*1ec469cfSAlexey Bataev     // CHECK: br label %[[LOOP_CONTINUE:[^,]+]]
201*1ec469cfSAlexey Bataev 
202*1ec469cfSAlexey Bataev     // CHECK: [[DISPATCH]]:
203*1ec469cfSAlexey Bataev     // CHECK: br label %[[INPUT_PHASE:[^,]+]]
204*1ec469cfSAlexey Bataev 
205*1ec469cfSAlexey Bataev     // CHECK: [[INPUT_PHASE]]:
206*1ec469cfSAlexey Bataev     // CHECK: call void @{{.+}}bar{{.+}}()
207*1ec469cfSAlexey Bataev     // CHECK: br label %[[EXIT_INSCAN]]
208*1ec469cfSAlexey Bataev 
209*1ec469cfSAlexey Bataev     // CHECK: [[LOOP_CONTINUE]]:
210*1ec469cfSAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8* %
211*1ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_fini(
212*1ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_barrier(
213*1ec469cfSAlexey Bataev     foo();
214*1ec469cfSAlexey Bataev #pragma omp scan exclusive(a[:n], b)
215*1ec469cfSAlexey Bataev     // CHECK: [[LOG2_10:%.+]] = call double @llvm.log2.f64(double 1.000000e+01)
216*1ec469cfSAlexey Bataev     // CHECK: [[CEIL_LOG2_10:%.+]] = call double @llvm.ceil.f64(double [[LOG2_10]])
217*1ec469cfSAlexey Bataev     // CHECK: [[CEIL_LOG2_10_INT:%.+]] = fptoui double [[CEIL_LOG2_10]] to i32
218*1ec469cfSAlexey Bataev     // CHECK: br label %[[OUTER_BODY:[^,]+]]
219*1ec469cfSAlexey Bataev     // CHECK: [[OUTER_BODY]]:
220*1ec469cfSAlexey Bataev     // CHECK: [[K:%.+]] = phi i32 [ 0, %{{.+}} ], [ [[K_NEXT:%.+]], %{{.+}} ]
221*1ec469cfSAlexey Bataev     // CHECK: [[K2POW:%.+]] = phi i64 [ 1, %{{.+}} ], [ [[K2POW_NEXT:%.+]], %{{.+}} ]
222*1ec469cfSAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp uge i64 9, [[K2POW]]
223*1ec469cfSAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[INNER_BODY:[^,]+]], label %[[INNER_EXIT:[^,]+]]
224*1ec469cfSAlexey Bataev     // CHECK: [[INNER_BODY]]:
225*1ec469cfSAlexey Bataev     // CHECK: [[I:%.+]] = phi i64 [ 9, %[[OUTER_BODY]] ], [ [[I_PREV:%.+]], %{{.+}} ]
226*1ec469cfSAlexey Bataev 
227*1ec469cfSAlexey Bataev     // a_buffer[i] += a_buffer[i-pow(2, k)];
228*1ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[I]], [[NUM_ELEMS]]
229*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
230*1ec469cfSAlexey Bataev     // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]]
231*1ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[IDX_SUB_K2POW]], [[NUM_ELEMS]]
232*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
233*1ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[I]]
234*1ec469cfSAlexey Bataev     // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]]
235*1ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[IDX_SUB_K2POW]]
236*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_END:%.+]] = getelementptr float, float* [[A_BUF_IDX]], i64 [[NUM_ELEMS]]
237*1ec469cfSAlexey Bataev     // CHECK: [[ISEMPTY:%.+]] = icmp eq float* [[A_BUF_IDX]], [[A_BUF_END]]
238*1ec469cfSAlexey Bataev     // CHECK: br i1 [[ISEMPTY]], label %[[RED_DONE:[^,]+]], label %[[RED_BODY:[^,]+]]
239*1ec469cfSAlexey Bataev     // CHECK: [[RED_BODY]]:
240*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_ELEM:%.+]] = phi float* [ [[A_BUF_IDX_SUB_K2POW]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_SUB_K2POW_NEXT:%.+]], %[[RED_BODY]] ]
241*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_ELEM:%.+]] = phi float* [ [[A_BUF_IDX]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_NEXT:%.+]], %[[RED_BODY]] ]
242*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_VAL:%.+]] = load float, float* [[A_BUF_IDX_ELEM]],
243*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_VAL:%.+]] = load float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]],
244*1ec469cfSAlexey Bataev     // CHECK: [[RED:%.+]] = fadd float [[A_BUF_IDX_VAL]], [[A_BUF_IDX_SUB_K2POW_VAL]]
245*1ec469cfSAlexey Bataev     // CHECK: store float [[RED]], float* [[A_BUF_IDX_ELEM]],
246*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_NEXT]] = getelementptr float, float* [[A_BUF_IDX_ELEM]], i32 1
247*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_NEXT]] = getelementptr float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]], i32 1
248*1ec469cfSAlexey Bataev     // CHECK: [[DONE:%.+]] = icmp eq float* [[A_BUF_IDX_NEXT]], [[A_BUF_END]]
249*1ec469cfSAlexey Bataev     // CHECK: br i1 [[DONE]], label %[[RED_DONE]], label %[[RED_BODY]]
250*1ec469cfSAlexey Bataev     // CHECK: [[RED_DONE]]:
251*1ec469cfSAlexey Bataev 
252*1ec469cfSAlexey Bataev     // b_buffer[i] += b_buffer[i-pow(2, k)];
253*1ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]],
254*1ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_SUB_K2POW_VAL:%.+]] = load double, double* [[B_BUF_IDX_SUB_K2POW]],
255*1ec469cfSAlexey Bataev     // CHECK: [[RED:%.+]] = fadd double [[B_BUF_IDX_VAL]], [[B_BUF_IDX_SUB_K2POW_VAL]]
256*1ec469cfSAlexey Bataev     // CHECK: store double [[RED]], double* [[B_BUF_IDX]],
257*1ec469cfSAlexey Bataev 
258*1ec469cfSAlexey Bataev     // --i;
259*1ec469cfSAlexey Bataev     // CHECK: [[I_PREV:%.+]] = sub nuw i64 [[I]], 1
260*1ec469cfSAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp uge i64 [[I_PREV]], [[K2POW]]
261*1ec469cfSAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[INNER_BODY]], label %[[INNER_EXIT]]
262*1ec469cfSAlexey Bataev     // CHECK: [[INNER_EXIT]]:
263*1ec469cfSAlexey Bataev 
264*1ec469cfSAlexey Bataev     // ++k;
265*1ec469cfSAlexey Bataev     // CHECK: [[K_NEXT]] = add nuw i32 [[K]], 1
266*1ec469cfSAlexey Bataev     // k2pow <<= 1;
267*1ec469cfSAlexey Bataev     // CHECK: [[K2POW_NEXT]] = shl nuw i64 [[K2POW]], 1
268*1ec469cfSAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp ne i32 [[K_NEXT]], [[CEIL_LOG2_10_INT]]
269*1ec469cfSAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[OUTER_BODY]], label %[[OUTER_EXIT:[^,]+]]
270*1ec469cfSAlexey Bataev     // CHECK: [[OUTER_EXIT]]:
271*1ec469cfSAlexey Bataev     bar();
272*1ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_init_4(
273*1ec469cfSAlexey Bataev     // CHECK: call i8* @llvm.stacksave()
274*1ec469cfSAlexey Bataev     // CHECK: store float 0.000000e+00, float* %
275*1ec469cfSAlexey Bataev     // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]],
276*1ec469cfSAlexey Bataev     // CHECK: br label %[[DISPATCH:[^,]+]]
277*1ec469cfSAlexey Bataev 
278*1ec469cfSAlexey Bataev     // CHECK: [[SCAN_PHASE:.+]]:
279*1ec469cfSAlexey Bataev     // CHECK: call void @{{.+}}foo{{.+}}()
280*1ec469cfSAlexey Bataev     // CHECK: br label %[[LOOP_CONTINUE:.+]]
281*1ec469cfSAlexey Bataev 
282*1ec469cfSAlexey Bataev     // CHECK: [[DISPATCH]]:
283*1ec469cfSAlexey Bataev     // if (i >0)
284*1ec469cfSAlexey Bataev     //   a_priv[[0..n] = a_buffer[i-1][0..n];
285*1ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]],
286*1ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64
287*1ec469cfSAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp eq i64 [[BASE_IDX]], 0
288*1ec469cfSAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[IF_DONE:[^,]+]], label %[[IF_THEN:[^,]+]]
289*1ec469cfSAlexey Bataev     // CHECK: [[IF_THEN]]:
290*1ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX_SUB_1:%.+]] = sub nuw i64 [[BASE_IDX]], 1
291*1ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX_SUB_1]], [[NUM_ELEMS]]
292*1ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
293*1ec469cfSAlexey Bataev     // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0
294*1ec469cfSAlexey Bataev     // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4
295*1ec469cfSAlexey Bataev     // CHECK: [[DEST:%.+]] = bitcast float* [[A_PRIV]] to i8*
296*1ec469cfSAlexey Bataev     // CHECK: [[SRC:%.+]] = bitcast float* [[A_BUF_IDX]] to i8*
297*1ec469cfSAlexey Bataev     // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false)
298*1ec469cfSAlexey Bataev 
299*1ec469cfSAlexey Bataev     // b_priv = b_buffer[i];
300*1ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX_SUB_1]]
301*1ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]],
302*1ec469cfSAlexey Bataev     // CHECK: store double [[B_BUF_IDX_VAL]], double* [[B_PRIV_ADDR]],
303*1ec469cfSAlexey Bataev     // CHECK: br label %[[SCAN_PHASE]]
304*1ec469cfSAlexey Bataev 
305*1ec469cfSAlexey Bataev     // CHECK: [[LOOP_CONTINUE]]:
306*1ec469cfSAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8* %
307*1ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_fini(
308*1ec469cfSAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8*
309*1ec469cfSAlexey Bataev   }
310*1ec469cfSAlexey Bataev }
311*1ec469cfSAlexey Bataev 
312*1ec469cfSAlexey Bataev #endif
313*1ec469cfSAlexey Bataev 
314