1*532dc62bSNikita Popov // RUN: %clang_cc1 -no-opaque-pointers -verify -fopenmp -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s
2*532dc62bSNikita Popov // RUN: %clang_cc1 -no-opaque-pointers -fopenmp -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s
3*532dc62bSNikita Popov // RUN: %clang_cc1 -no-opaque-pointers -fopenmp -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s
4bd1c03d7SAlexey Bataev 
5*532dc62bSNikita Popov // RUN: %clang_cc1 -no-opaque-pointers -verify -fopenmp-simd -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s
6*532dc62bSNikita Popov // RUN: %clang_cc1 -no-opaque-pointers -fopenmp-simd -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s
7*532dc62bSNikita Popov // RUN: %clang_cc1 -no-opaque-pointers -fopenmp-simd -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY0 %s
8bd1c03d7SAlexey Bataev // SIMD-ONLY0-NOT: {{__kmpc|__tgt}}
9bd1c03d7SAlexey Bataev // expected-no-diagnostics
10bd1c03d7SAlexey Bataev #ifndef HEADER
11bd1c03d7SAlexey Bataev #define HEADER
12bd1c03d7SAlexey Bataev 
13bd1c03d7SAlexey Bataev void foo();
14bd1c03d7SAlexey Bataev void bar();
15bd1c03d7SAlexey Bataev 
161b1c8d83Shyeongyu kim // CHECK: define{{.*}} void @{{.*}}baz{{.*}}(i32 noundef %n)
baz(int n)17bd1c03d7SAlexey Bataev void baz(int n) {
18bd1c03d7SAlexey Bataev   static float a[10];
19bd1c03d7SAlexey Bataev   static double b;
20bd1c03d7SAlexey Bataev   // CHECK: call i8* @llvm.stacksave()
21bd1c03d7SAlexey Bataev   // CHECK: [[A_BUF_SIZE:%.+]] = mul nuw i64 10, [[NUM_ELEMS:%[^,]+]]
22bd1c03d7SAlexey Bataev 
23bd1c03d7SAlexey Bataev   // float a_buffer[10][n];
24bd1c03d7SAlexey Bataev   // CHECK: [[A_BUF:%.+]] = alloca float, i64 [[A_BUF_SIZE]],
25bd1c03d7SAlexey Bataev 
26bd1c03d7SAlexey Bataev   // double b_buffer[10];
27bd1c03d7SAlexey Bataev   // CHECK: [[B_BUF:%.+]] = alloca double, i64 10,
28bd1c03d7SAlexey Bataev #pragma omp for reduction(inscan, +:a[:n], b)
29bd1c03d7SAlexey Bataev   for (int i = 0; i < 10; ++i) {
30bd1c03d7SAlexey Bataev     // CHECK: call void @__kmpc_for_static_init_4(
31bd1c03d7SAlexey Bataev     // CHECK: call i8* @llvm.stacksave()
32bd1c03d7SAlexey Bataev     // CHECK: store float 0.000000e+00, float* %
33bd1c03d7SAlexey Bataev     // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]],
34bd1c03d7SAlexey Bataev     // CHECK: br label %[[DISPATCH:[^,]+]]
35bd1c03d7SAlexey Bataev     // CHECK: [[INPUT_PHASE:.+]]:
36bd1c03d7SAlexey Bataev     // CHECK: call void @{{.+}}foo{{.+}}()
37bd1c03d7SAlexey Bataev 
38bd1c03d7SAlexey Bataev     // a_buffer[i][0..n] = a_priv[[0..n];
39bd1c03d7SAlexey Bataev     // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]],
40bd1c03d7SAlexey Bataev     // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64
41bd1c03d7SAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]]
42bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
43bd1c03d7SAlexey Bataev     // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0
44bd1c03d7SAlexey Bataev     // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4
45bd1c03d7SAlexey Bataev     // CHECK: [[DEST:%.+]] = bitcast float* [[A_BUF_IDX]] to i8*
46bd1c03d7SAlexey Bataev     // CHECK: [[SRC:%.+]] = bitcast float* [[A_PRIV]] to i8*
47bd1c03d7SAlexey Bataev     // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false)
48bd1c03d7SAlexey Bataev 
49bd1c03d7SAlexey Bataev     // b_buffer[i] = b_priv;
50bd1c03d7SAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]]
51bd1c03d7SAlexey Bataev     // CHECK: [[B_PRIV:%.+]] = load double, double* [[B_PRIV_ADDR]],
52bd1c03d7SAlexey Bataev     // CHECK: store double [[B_PRIV]], double* [[B_BUF_IDX]],
53bd1c03d7SAlexey Bataev     // CHECK: br label %[[LOOP_CONTINUE:.+]]
54bd1c03d7SAlexey Bataev 
55bd1c03d7SAlexey Bataev     // CHECK: [[DISPATCH]]:
56bd1c03d7SAlexey Bataev     // CHECK: br label %[[INPUT_PHASE]]
57bd1c03d7SAlexey Bataev     // CHECK: [[LOOP_CONTINUE]]:
58bd1c03d7SAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8* %
59bd1c03d7SAlexey Bataev     // CHECK: call void @__kmpc_for_static_fini(
60bd1c03d7SAlexey Bataev     // CHECK: call void @__kmpc_barrier(
61bd1c03d7SAlexey Bataev     foo();
62bd1c03d7SAlexey Bataev #pragma omp scan inclusive(a[:n], b)
63bd1c03d7SAlexey Bataev     // CHECK: [[LOG2_10:%.+]] = call double @llvm.log2.f64(double 1.000000e+01)
64bd1c03d7SAlexey Bataev     // CHECK: [[CEIL_LOG2_10:%.+]] = call double @llvm.ceil.f64(double [[LOG2_10]])
65bd1c03d7SAlexey Bataev     // CHECK: [[CEIL_LOG2_10_INT:%.+]] = fptoui double [[CEIL_LOG2_10]] to i32
66bd1c03d7SAlexey Bataev     // CHECK: br label %[[OUTER_BODY:[^,]+]]
67bd1c03d7SAlexey Bataev     // CHECK: [[OUTER_BODY]]:
68bd1c03d7SAlexey Bataev     // CHECK: [[K:%.+]] = phi i32 [ 0, %{{.+}} ], [ [[K_NEXT:%.+]], %{{.+}} ]
69bd1c03d7SAlexey Bataev     // CHECK: [[K2POW:%.+]] = phi i64 [ 1, %{{.+}} ], [ [[K2POW_NEXT:%.+]], %{{.+}} ]
70bd1c03d7SAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp uge i64 9, [[K2POW]]
71bd1c03d7SAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[INNER_BODY:[^,]+]], label %[[INNER_EXIT:[^,]+]]
72bd1c03d7SAlexey Bataev     // CHECK: [[INNER_BODY]]:
73bd1c03d7SAlexey Bataev     // CHECK: [[I:%.+]] = phi i64 [ 9, %[[OUTER_BODY]] ], [ [[I_PREV:%.+]], %{{.+}} ]
74bd1c03d7SAlexey Bataev 
75bd1c03d7SAlexey Bataev     // a_buffer[i] += a_buffer[i-pow(2, k)];
76bd1c03d7SAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[I]], [[NUM_ELEMS]]
77bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
78bd1c03d7SAlexey Bataev     // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]]
79bd1c03d7SAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[IDX_SUB_K2POW]], [[NUM_ELEMS]]
80bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
81bd1c03d7SAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[I]]
82bd1c03d7SAlexey Bataev     // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]]
83bd1c03d7SAlexey Bataev     // CHECK: [[B_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[IDX_SUB_K2POW]]
84bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_END:%.+]] = getelementptr float, float* [[A_BUF_IDX]], i64 [[NUM_ELEMS]]
85bd1c03d7SAlexey Bataev     // CHECK: [[ISEMPTY:%.+]] = icmp eq float* [[A_BUF_IDX]], [[A_BUF_END]]
86bd1c03d7SAlexey Bataev     // CHECK: br i1 [[ISEMPTY]], label %[[RED_DONE:[^,]+]], label %[[RED_BODY:[^,]+]]
87bd1c03d7SAlexey Bataev     // CHECK: [[RED_BODY]]:
88bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_ELEM:%.+]] = phi float* [ [[A_BUF_IDX_SUB_K2POW]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_SUB_K2POW_NEXT:%.+]], %[[RED_BODY]] ]
89bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX_ELEM:%.+]] = phi float* [ [[A_BUF_IDX]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_NEXT:%.+]], %[[RED_BODY]] ]
90bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX_VAL:%.+]] = load float, float* [[A_BUF_IDX_ELEM]],
91bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_VAL:%.+]] = load float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]],
92bd1c03d7SAlexey Bataev     // CHECK: [[RED:%.+]] = fadd float [[A_BUF_IDX_VAL]], [[A_BUF_IDX_SUB_K2POW_VAL]]
93bd1c03d7SAlexey Bataev     // CHECK: store float [[RED]], float* [[A_BUF_IDX_ELEM]],
94bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX_NEXT]] = getelementptr float, float* [[A_BUF_IDX_ELEM]], i32 1
95bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_NEXT]] = getelementptr float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]], i32 1
96bd1c03d7SAlexey Bataev     // CHECK: [[DONE:%.+]] = icmp eq float* [[A_BUF_IDX_NEXT]], [[A_BUF_END]]
97bd1c03d7SAlexey Bataev     // CHECK: br i1 [[DONE]], label %[[RED_DONE]], label %[[RED_BODY]]
98bd1c03d7SAlexey Bataev     // CHECK: [[RED_DONE]]:
99bd1c03d7SAlexey Bataev 
100bd1c03d7SAlexey Bataev     // b_buffer[i] += b_buffer[i-pow(2, k)];
101bd1c03d7SAlexey Bataev     // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]],
102bd1c03d7SAlexey Bataev     // CHECK: [[B_BUF_IDX_SUB_K2POW_VAL:%.+]] = load double, double* [[B_BUF_IDX_SUB_K2POW]],
103bd1c03d7SAlexey Bataev     // CHECK: [[RED:%.+]] = fadd double [[B_BUF_IDX_VAL]], [[B_BUF_IDX_SUB_K2POW_VAL]]
104bd1c03d7SAlexey Bataev     // CHECK: store double [[RED]], double* [[B_BUF_IDX]],
105bd1c03d7SAlexey Bataev 
106bd1c03d7SAlexey Bataev     // --i;
107bd1c03d7SAlexey Bataev     // CHECK: [[I_PREV:%.+]] = sub nuw i64 [[I]], 1
108bd1c03d7SAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp uge i64 [[I_PREV]], [[K2POW]]
109bd1c03d7SAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[INNER_BODY]], label %[[INNER_EXIT]]
110bd1c03d7SAlexey Bataev     // CHECK: [[INNER_EXIT]]:
111bd1c03d7SAlexey Bataev 
112bd1c03d7SAlexey Bataev     // ++k;
113bd1c03d7SAlexey Bataev     // CHECK: [[K_NEXT]] = add nuw i32 [[K]], 1
114bd1c03d7SAlexey Bataev     // k2pow <<= 1;
115bd1c03d7SAlexey Bataev     // CHECK: [[K2POW_NEXT]] = shl nuw i64 [[K2POW]], 1
116bd1c03d7SAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp ne i32 [[K_NEXT]], [[CEIL_LOG2_10_INT]]
117bd1c03d7SAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[OUTER_BODY]], label %[[OUTER_EXIT:[^,]+]]
118bd1c03d7SAlexey Bataev     // CHECK: [[OUTER_EXIT]]:
119bd1c03d7SAlexey Bataev     bar();
120bd1c03d7SAlexey Bataev     // CHECK: call void @__kmpc_for_static_init_4(
121bd1c03d7SAlexey Bataev     // CHECK: call i8* @llvm.stacksave()
122bd1c03d7SAlexey Bataev     // CHECK: store float 0.000000e+00, float* %
123bd1c03d7SAlexey Bataev     // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]],
124bd1c03d7SAlexey Bataev     // CHECK: br label %[[DISPATCH:[^,]+]]
125bd1c03d7SAlexey Bataev 
126bd1c03d7SAlexey Bataev     // Skip the before scan body.
127bd1c03d7SAlexey Bataev     // CHECK: call void @{{.+}}foo{{.+}}()
128bd1c03d7SAlexey Bataev 
129bd1c03d7SAlexey Bataev     // CHECK: [[EXIT_INSCAN:[^,]+]]:
130bd1c03d7SAlexey Bataev     // CHECK: br label %[[LOOP_CONTINUE:[^,]+]]
131bd1c03d7SAlexey Bataev 
132bd1c03d7SAlexey Bataev     // CHECK: [[DISPATCH]]:
133bd1c03d7SAlexey Bataev     // a_priv[[0..n] = a_buffer[i][0..n];
134bd1c03d7SAlexey Bataev     // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]],
135bd1c03d7SAlexey Bataev     // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64
136bd1c03d7SAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]]
137bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
138bd1c03d7SAlexey Bataev     // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0
139bd1c03d7SAlexey Bataev     // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4
140bd1c03d7SAlexey Bataev     // CHECK: [[DEST:%.+]] = bitcast float* [[A_PRIV]] to i8*
141bd1c03d7SAlexey Bataev     // CHECK: [[SRC:%.+]] = bitcast float* [[A_BUF_IDX]] to i8*
142bd1c03d7SAlexey Bataev     // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false)
143bd1c03d7SAlexey Bataev 
144bd1c03d7SAlexey Bataev     // b_priv = b_buffer[i];
145bd1c03d7SAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]]
146bd1c03d7SAlexey Bataev     // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]],
147bd1c03d7SAlexey Bataev     // CHECK: store double [[B_BUF_IDX_VAL]], double* [[B_PRIV_ADDR]],
148bd1c03d7SAlexey Bataev     // CHECK: br label %[[SCAN_PHASE:[^,]+]]
149bd1c03d7SAlexey Bataev 
150bd1c03d7SAlexey Bataev     // CHECK: [[SCAN_PHASE]]:
151bd1c03d7SAlexey Bataev     // CHECK: call void @{{.+}}bar{{.+}}()
152bd1c03d7SAlexey Bataev     // CHECK: br label %[[EXIT_INSCAN]]
153bd1c03d7SAlexey Bataev 
154bd1c03d7SAlexey Bataev     // CHECK: [[LOOP_CONTINUE]]:
155bd1c03d7SAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8* %
156bd1c03d7SAlexey Bataev     // CHECK: call void @__kmpc_for_static_fini(
157bd1c03d7SAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8*
158bd1c03d7SAlexey Bataev     // CHECK: call void @__kmpc_barrier(
159bd1c03d7SAlexey Bataev   }
160bd1c03d7SAlexey Bataev 
161bd1c03d7SAlexey Bataev   // CHECK: call i8* @llvm.stacksave()
162bd1c03d7SAlexey Bataev   // CHECK: [[A_BUF_SIZE:%.+]] = mul nuw i64 10, [[NUM_ELEMS:%[^,]+]]
163bd1c03d7SAlexey Bataev 
164bd1c03d7SAlexey Bataev   // float a_buffer[10][n];
165bd1c03d7SAlexey Bataev   // CHECK: [[A_BUF:%.+]] = alloca float, i64 [[A_BUF_SIZE]],
166bd1c03d7SAlexey Bataev 
167bd1c03d7SAlexey Bataev   // double b_buffer[10];
168bd1c03d7SAlexey Bataev   // CHECK: [[B_BUF:%.+]] = alloca double, i64 10,
169bd1c03d7SAlexey Bataev #pragma omp for reduction(inscan, +:a[:n], b)
170bd1c03d7SAlexey Bataev   for (int i = 0; i < 10; ++i) {
171bd1c03d7SAlexey Bataev     // CHECK: call void @__kmpc_for_static_init_4(
172bd1c03d7SAlexey Bataev     // CHECK: call i8* @llvm.stacksave()
173bd1c03d7SAlexey Bataev     // CHECK: store float 0.000000e+00, float* %
174bd1c03d7SAlexey Bataev     // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]],
175bd1c03d7SAlexey Bataev     // CHECK: br label %[[DISPATCH:[^,]+]]
176bd1c03d7SAlexey Bataev 
177bd1c03d7SAlexey Bataev     // Skip the before scan body.
178bd1c03d7SAlexey Bataev     // CHECK: call void @{{.+}}foo{{.+}}()
179bd1c03d7SAlexey Bataev 
180bd1c03d7SAlexey Bataev     // CHECK: [[EXIT_INSCAN:[^,]+]]:
181bd1c03d7SAlexey Bataev 
182bd1c03d7SAlexey Bataev     // a_buffer[i][0..n] = a_priv[[0..n];
183bd1c03d7SAlexey Bataev     // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]],
184bd1c03d7SAlexey Bataev     // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64
185bd1c03d7SAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]]
186bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
187bd1c03d7SAlexey Bataev     // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0
188bd1c03d7SAlexey Bataev     // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4
189bd1c03d7SAlexey Bataev     // CHECK: [[DEST:%.+]] = bitcast float* [[A_BUF_IDX]] to i8*
190bd1c03d7SAlexey Bataev     // CHECK: [[SRC:%.+]] = bitcast float* [[A_PRIV]] to i8*
191bd1c03d7SAlexey Bataev     // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false)
192bd1c03d7SAlexey Bataev 
193bd1c03d7SAlexey Bataev     // b_buffer[i] = b_priv;
194bd1c03d7SAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]]
195bd1c03d7SAlexey Bataev     // CHECK: [[B_PRIV:%.+]] = load double, double* [[B_PRIV_ADDR]],
196bd1c03d7SAlexey Bataev     // CHECK: store double [[B_PRIV]], double* [[B_BUF_IDX]],
197bd1c03d7SAlexey Bataev     // CHECK: br label %[[LOOP_CONTINUE:[^,]+]]
198bd1c03d7SAlexey Bataev 
199bd1c03d7SAlexey Bataev     // CHECK: [[DISPATCH]]:
200bd1c03d7SAlexey Bataev     // CHECK: br label %[[INPUT_PHASE:[^,]+]]
201bd1c03d7SAlexey Bataev 
202bd1c03d7SAlexey Bataev     // CHECK: [[INPUT_PHASE]]:
203bd1c03d7SAlexey Bataev     // CHECK: call void @{{.+}}bar{{.+}}()
204bd1c03d7SAlexey Bataev     // CHECK: br label %[[EXIT_INSCAN]]
205bd1c03d7SAlexey Bataev 
206bd1c03d7SAlexey Bataev     // CHECK: [[LOOP_CONTINUE]]:
207bd1c03d7SAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8* %
208bd1c03d7SAlexey Bataev     // CHECK: call void @__kmpc_for_static_fini(
209bd1c03d7SAlexey Bataev     // CHECK: call void @__kmpc_barrier(
210bd1c03d7SAlexey Bataev     foo();
211bd1c03d7SAlexey Bataev #pragma omp scan exclusive(a[:n], b)
212bd1c03d7SAlexey Bataev     // CHECK: [[LOG2_10:%.+]] = call double @llvm.log2.f64(double 1.000000e+01)
213bd1c03d7SAlexey Bataev     // CHECK: [[CEIL_LOG2_10:%.+]] = call double @llvm.ceil.f64(double [[LOG2_10]])
214bd1c03d7SAlexey Bataev     // CHECK: [[CEIL_LOG2_10_INT:%.+]] = fptoui double [[CEIL_LOG2_10]] to i32
215bd1c03d7SAlexey Bataev     // CHECK: br label %[[OUTER_BODY:[^,]+]]
216bd1c03d7SAlexey Bataev     // CHECK: [[OUTER_BODY]]:
217bd1c03d7SAlexey Bataev     // CHECK: [[K:%.+]] = phi i32 [ 0, %{{.+}} ], [ [[K_NEXT:%.+]], %{{.+}} ]
218bd1c03d7SAlexey Bataev     // CHECK: [[K2POW:%.+]] = phi i64 [ 1, %{{.+}} ], [ [[K2POW_NEXT:%.+]], %{{.+}} ]
219bd1c03d7SAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp uge i64 9, [[K2POW]]
220bd1c03d7SAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[INNER_BODY:[^,]+]], label %[[INNER_EXIT:[^,]+]]
221bd1c03d7SAlexey Bataev     // CHECK: [[INNER_BODY]]:
222bd1c03d7SAlexey Bataev     // CHECK: [[I:%.+]] = phi i64 [ 9, %[[OUTER_BODY]] ], [ [[I_PREV:%.+]], %{{.+}} ]
223bd1c03d7SAlexey Bataev 
224bd1c03d7SAlexey Bataev     // a_buffer[i] += a_buffer[i-pow(2, k)];
225bd1c03d7SAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[I]], [[NUM_ELEMS]]
226bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
227bd1c03d7SAlexey Bataev     // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]]
228bd1c03d7SAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[IDX_SUB_K2POW]], [[NUM_ELEMS]]
229bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
230bd1c03d7SAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[I]]
231bd1c03d7SAlexey Bataev     // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]]
232bd1c03d7SAlexey Bataev     // CHECK: [[B_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[IDX_SUB_K2POW]]
233bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_END:%.+]] = getelementptr float, float* [[A_BUF_IDX]], i64 [[NUM_ELEMS]]
234bd1c03d7SAlexey Bataev     // CHECK: [[ISEMPTY:%.+]] = icmp eq float* [[A_BUF_IDX]], [[A_BUF_END]]
235bd1c03d7SAlexey Bataev     // CHECK: br i1 [[ISEMPTY]], label %[[RED_DONE:[^,]+]], label %[[RED_BODY:[^,]+]]
236bd1c03d7SAlexey Bataev     // CHECK: [[RED_BODY]]:
237bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_ELEM:%.+]] = phi float* [ [[A_BUF_IDX_SUB_K2POW]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_SUB_K2POW_NEXT:%.+]], %[[RED_BODY]] ]
238bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX_ELEM:%.+]] = phi float* [ [[A_BUF_IDX]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_NEXT:%.+]], %[[RED_BODY]] ]
239bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX_VAL:%.+]] = load float, float* [[A_BUF_IDX_ELEM]],
240bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_VAL:%.+]] = load float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]],
241bd1c03d7SAlexey Bataev     // CHECK: [[RED:%.+]] = fadd float [[A_BUF_IDX_VAL]], [[A_BUF_IDX_SUB_K2POW_VAL]]
242bd1c03d7SAlexey Bataev     // CHECK: store float [[RED]], float* [[A_BUF_IDX_ELEM]],
243bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX_NEXT]] = getelementptr float, float* [[A_BUF_IDX_ELEM]], i32 1
244bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_NEXT]] = getelementptr float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]], i32 1
245bd1c03d7SAlexey Bataev     // CHECK: [[DONE:%.+]] = icmp eq float* [[A_BUF_IDX_NEXT]], [[A_BUF_END]]
246bd1c03d7SAlexey Bataev     // CHECK: br i1 [[DONE]], label %[[RED_DONE]], label %[[RED_BODY]]
247bd1c03d7SAlexey Bataev     // CHECK: [[RED_DONE]]:
248bd1c03d7SAlexey Bataev 
249bd1c03d7SAlexey Bataev     // b_buffer[i] += b_buffer[i-pow(2, k)];
250bd1c03d7SAlexey Bataev     // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]],
251bd1c03d7SAlexey Bataev     // CHECK: [[B_BUF_IDX_SUB_K2POW_VAL:%.+]] = load double, double* [[B_BUF_IDX_SUB_K2POW]],
252bd1c03d7SAlexey Bataev     // CHECK: [[RED:%.+]] = fadd double [[B_BUF_IDX_VAL]], [[B_BUF_IDX_SUB_K2POW_VAL]]
253bd1c03d7SAlexey Bataev     // CHECK: store double [[RED]], double* [[B_BUF_IDX]],
254bd1c03d7SAlexey Bataev 
255bd1c03d7SAlexey Bataev     // --i;
256bd1c03d7SAlexey Bataev     // CHECK: [[I_PREV:%.+]] = sub nuw i64 [[I]], 1
257bd1c03d7SAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp uge i64 [[I_PREV]], [[K2POW]]
258bd1c03d7SAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[INNER_BODY]], label %[[INNER_EXIT]]
259bd1c03d7SAlexey Bataev     // CHECK: [[INNER_EXIT]]:
260bd1c03d7SAlexey Bataev 
261bd1c03d7SAlexey Bataev     // ++k;
262bd1c03d7SAlexey Bataev     // CHECK: [[K_NEXT]] = add nuw i32 [[K]], 1
263bd1c03d7SAlexey Bataev     // k2pow <<= 1;
264bd1c03d7SAlexey Bataev     // CHECK: [[K2POW_NEXT]] = shl nuw i64 [[K2POW]], 1
265bd1c03d7SAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp ne i32 [[K_NEXT]], [[CEIL_LOG2_10_INT]]
266bd1c03d7SAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[OUTER_BODY]], label %[[OUTER_EXIT:[^,]+]]
267bd1c03d7SAlexey Bataev     // CHECK: [[OUTER_EXIT]]:
268bd1c03d7SAlexey Bataev     bar();
269bd1c03d7SAlexey Bataev     // CHECK: call void @__kmpc_for_static_init_4(
270bd1c03d7SAlexey Bataev     // CHECK: call i8* @llvm.stacksave()
271bd1c03d7SAlexey Bataev     // CHECK: store float 0.000000e+00, float* %
272bd1c03d7SAlexey Bataev     // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]],
273bd1c03d7SAlexey Bataev     // CHECK: br label %[[DISPATCH:[^,]+]]
274bd1c03d7SAlexey Bataev 
275bd1c03d7SAlexey Bataev     // CHECK: [[SCAN_PHASE:.+]]:
276bd1c03d7SAlexey Bataev     // CHECK: call void @{{.+}}foo{{.+}}()
277bd1c03d7SAlexey Bataev     // CHECK: br label %[[LOOP_CONTINUE:.+]]
278bd1c03d7SAlexey Bataev 
279bd1c03d7SAlexey Bataev     // CHECK: [[DISPATCH]]:
280bd1c03d7SAlexey Bataev     // if (i >0)
281bd1c03d7SAlexey Bataev     //   a_priv[[0..n] = a_buffer[i-1][0..n];
282bd1c03d7SAlexey Bataev     // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]],
283bd1c03d7SAlexey Bataev     // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64
284bd1c03d7SAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp eq i64 [[BASE_IDX]], 0
285bd1c03d7SAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[IF_DONE:[^,]+]], label %[[IF_THEN:[^,]+]]
286bd1c03d7SAlexey Bataev     // CHECK: [[IF_THEN]]:
287bd1c03d7SAlexey Bataev     // CHECK: [[BASE_IDX_SUB_1:%.+]] = sub nuw i64 [[BASE_IDX]], 1
288bd1c03d7SAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX_SUB_1]], [[NUM_ELEMS]]
289bd1c03d7SAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
290bd1c03d7SAlexey Bataev     // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0
291bd1c03d7SAlexey Bataev     // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4
292bd1c03d7SAlexey Bataev     // CHECK: [[DEST:%.+]] = bitcast float* [[A_PRIV]] to i8*
293bd1c03d7SAlexey Bataev     // CHECK: [[SRC:%.+]] = bitcast float* [[A_BUF_IDX]] to i8*
294bd1c03d7SAlexey Bataev     // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false)
295bd1c03d7SAlexey Bataev 
296bd1c03d7SAlexey Bataev     // b_priv = b_buffer[i];
297bd1c03d7SAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX_SUB_1]]
298bd1c03d7SAlexey Bataev     // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]],
299bd1c03d7SAlexey Bataev     // CHECK: store double [[B_BUF_IDX_VAL]], double* [[B_PRIV_ADDR]],
300bd1c03d7SAlexey Bataev     // CHECK: br label %[[SCAN_PHASE]]
301bd1c03d7SAlexey Bataev 
302bd1c03d7SAlexey Bataev     // CHECK: [[LOOP_CONTINUE]]:
303bd1c03d7SAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8* %
304bd1c03d7SAlexey Bataev     // CHECK: call void @__kmpc_for_static_fini(
305bd1c03d7SAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8*
306bd1c03d7SAlexey Bataev     // CHECK: call void @__kmpc_barrier(
307bd1c03d7SAlexey Bataev   }
308bd1c03d7SAlexey Bataev }
309bd1c03d7SAlexey Bataev 
310bd1c03d7SAlexey Bataev #endif
311bd1c03d7SAlexey Bataev 
312