1*ff260ad0SSaiyedul Islam // RUN: %clang_cc1 -verify -fopenmp -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s
2*ff260ad0SSaiyedul Islam // RUN: %clang_cc1 -fopenmp -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s
3*ff260ad0SSaiyedul Islam // RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s
41ec469cfSAlexey Bataev 
5*ff260ad0SSaiyedul Islam // RUN: %clang_cc1 -verify -fopenmp-simd -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s
6*ff260ad0SSaiyedul Islam // RUN: %clang_cc1 -fopenmp-simd -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s
7*ff260ad0SSaiyedul Islam // RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY0 %s
81ec469cfSAlexey Bataev // SIMD-ONLY0-NOT: {{__kmpc|__tgt}}
91ec469cfSAlexey Bataev // expected-no-diagnostics
101ec469cfSAlexey Bataev #ifndef HEADER
111ec469cfSAlexey Bataev #define HEADER
121ec469cfSAlexey Bataev 
131ec469cfSAlexey Bataev void foo();
141ec469cfSAlexey Bataev void bar();
151ec469cfSAlexey Bataev 
161ec469cfSAlexey Bataev // CHECK: define void @{{.*}}baz{{.*}}(i32 %n)
171ec469cfSAlexey Bataev void baz(int n) {
181ec469cfSAlexey Bataev   static float a[10];
191ec469cfSAlexey Bataev   static double b;
201ec469cfSAlexey Bataev 
211ec469cfSAlexey Bataev   // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(
221ec469cfSAlexey Bataev   // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(
231ec469cfSAlexey Bataev 
241ec469cfSAlexey Bataev   // CHECK: call i8* @llvm.stacksave()
251ec469cfSAlexey Bataev   // CHECK: [[A_BUF_SIZE:%.+]] = mul nuw i64 10, [[NUM_ELEMS:%[^,]+]]
261ec469cfSAlexey Bataev 
271ec469cfSAlexey Bataev   // float a_buffer[10][n];
281ec469cfSAlexey Bataev   // CHECK: [[A_BUF:%.+]] = alloca float, i64 [[A_BUF_SIZE]],
291ec469cfSAlexey Bataev 
301ec469cfSAlexey Bataev   // double b_buffer[10];
311ec469cfSAlexey Bataev   // CHECK: [[B_BUF:%.+]] = alloca double, i64 10,
321ec469cfSAlexey Bataev #pragma omp parallel for reduction(inscan, +:a[:n], b)
331ec469cfSAlexey Bataev   for (int i = 0; i < 10; ++i) {
341ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_init_4(
351ec469cfSAlexey Bataev     // CHECK: call i8* @llvm.stacksave()
361ec469cfSAlexey Bataev     // CHECK: store float 0.000000e+00, float* %
371ec469cfSAlexey Bataev     // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]],
381ec469cfSAlexey Bataev     // CHECK: br label %[[DISPATCH:[^,]+]]
391ec469cfSAlexey Bataev     // CHECK: [[INPUT_PHASE:.+]]:
401ec469cfSAlexey Bataev     // CHECK: call void @{{.+}}foo{{.+}}()
411ec469cfSAlexey Bataev 
421ec469cfSAlexey Bataev     // a_buffer[i][0..n] = a_priv[[0..n];
431ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]],
441ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64
451ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]]
461ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
471ec469cfSAlexey Bataev     // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0
481ec469cfSAlexey Bataev     // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4
491ec469cfSAlexey Bataev     // CHECK: [[DEST:%.+]] = bitcast float* [[A_BUF_IDX]] to i8*
501ec469cfSAlexey Bataev     // CHECK: [[SRC:%.+]] = bitcast float* [[A_PRIV]] to i8*
511ec469cfSAlexey Bataev     // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false)
521ec469cfSAlexey Bataev 
531ec469cfSAlexey Bataev     // b_buffer[i] = b_priv;
541ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]]
551ec469cfSAlexey Bataev     // CHECK: [[B_PRIV:%.+]] = load double, double* [[B_PRIV_ADDR]],
561ec469cfSAlexey Bataev     // CHECK: store double [[B_PRIV]], double* [[B_BUF_IDX]],
571ec469cfSAlexey Bataev     // CHECK: br label %[[LOOP_CONTINUE:.+]]
581ec469cfSAlexey Bataev 
591ec469cfSAlexey Bataev     // CHECK: [[DISPATCH]]:
601ec469cfSAlexey Bataev     // CHECK: br label %[[INPUT_PHASE]]
611ec469cfSAlexey Bataev     // CHECK: [[LOOP_CONTINUE]]:
621ec469cfSAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8* %
631ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_fini(
641ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_barrier(
651ec469cfSAlexey Bataev     foo();
661ec469cfSAlexey Bataev #pragma omp scan inclusive(a[:n], b)
671ec469cfSAlexey Bataev     // CHECK: [[LOG2_10:%.+]] = call double @llvm.log2.f64(double 1.000000e+01)
681ec469cfSAlexey Bataev     // CHECK: [[CEIL_LOG2_10:%.+]] = call double @llvm.ceil.f64(double [[LOG2_10]])
691ec469cfSAlexey Bataev     // CHECK: [[CEIL_LOG2_10_INT:%.+]] = fptoui double [[CEIL_LOG2_10]] to i32
701ec469cfSAlexey Bataev     // CHECK: br label %[[OUTER_BODY:[^,]+]]
711ec469cfSAlexey Bataev     // CHECK: [[OUTER_BODY]]:
721ec469cfSAlexey Bataev     // CHECK: [[K:%.+]] = phi i32 [ 0, %{{.+}} ], [ [[K_NEXT:%.+]], %{{.+}} ]
731ec469cfSAlexey Bataev     // CHECK: [[K2POW:%.+]] = phi i64 [ 1, %{{.+}} ], [ [[K2POW_NEXT:%.+]], %{{.+}} ]
741ec469cfSAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp uge i64 9, [[K2POW]]
751ec469cfSAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[INNER_BODY:[^,]+]], label %[[INNER_EXIT:[^,]+]]
761ec469cfSAlexey Bataev     // CHECK: [[INNER_BODY]]:
771ec469cfSAlexey Bataev     // CHECK: [[I:%.+]] = phi i64 [ 9, %[[OUTER_BODY]] ], [ [[I_PREV:%.+]], %{{.+}} ]
781ec469cfSAlexey Bataev 
791ec469cfSAlexey Bataev     // a_buffer[i] += a_buffer[i-pow(2, k)];
801ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[I]], [[NUM_ELEMS]]
811ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
821ec469cfSAlexey Bataev     // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]]
831ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[IDX_SUB_K2POW]], [[NUM_ELEMS]]
841ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
851ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[I]]
861ec469cfSAlexey Bataev     // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]]
871ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[IDX_SUB_K2POW]]
881ec469cfSAlexey Bataev     // CHECK: [[A_BUF_END:%.+]] = getelementptr float, float* [[A_BUF_IDX]], i64 [[NUM_ELEMS]]
891ec469cfSAlexey Bataev     // CHECK: [[ISEMPTY:%.+]] = icmp eq float* [[A_BUF_IDX]], [[A_BUF_END]]
901ec469cfSAlexey Bataev     // CHECK: br i1 [[ISEMPTY]], label %[[RED_DONE:[^,]+]], label %[[RED_BODY:[^,]+]]
911ec469cfSAlexey Bataev     // CHECK: [[RED_BODY]]:
921ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_ELEM:%.+]] = phi float* [ [[A_BUF_IDX_SUB_K2POW]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_SUB_K2POW_NEXT:%.+]], %[[RED_BODY]] ]
931ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_ELEM:%.+]] = phi float* [ [[A_BUF_IDX]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_NEXT:%.+]], %[[RED_BODY]] ]
941ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_VAL:%.+]] = load float, float* [[A_BUF_IDX_ELEM]],
951ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_VAL:%.+]] = load float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]],
961ec469cfSAlexey Bataev     // CHECK: [[RED:%.+]] = fadd float [[A_BUF_IDX_VAL]], [[A_BUF_IDX_SUB_K2POW_VAL]]
971ec469cfSAlexey Bataev     // CHECK: store float [[RED]], float* [[A_BUF_IDX_ELEM]],
981ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_NEXT]] = getelementptr float, float* [[A_BUF_IDX_ELEM]], i32 1
991ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_NEXT]] = getelementptr float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]], i32 1
1001ec469cfSAlexey Bataev     // CHECK: [[DONE:%.+]] = icmp eq float* [[A_BUF_IDX_NEXT]], [[A_BUF_END]]
1011ec469cfSAlexey Bataev     // CHECK: br i1 [[DONE]], label %[[RED_DONE]], label %[[RED_BODY]]
1021ec469cfSAlexey Bataev     // CHECK: [[RED_DONE]]:
1031ec469cfSAlexey Bataev 
1041ec469cfSAlexey Bataev     // b_buffer[i] += b_buffer[i-pow(2, k)];
1051ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]],
1061ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_SUB_K2POW_VAL:%.+]] = load double, double* [[B_BUF_IDX_SUB_K2POW]],
1071ec469cfSAlexey Bataev     // CHECK: [[RED:%.+]] = fadd double [[B_BUF_IDX_VAL]], [[B_BUF_IDX_SUB_K2POW_VAL]]
1081ec469cfSAlexey Bataev     // CHECK: store double [[RED]], double* [[B_BUF_IDX]],
1091ec469cfSAlexey Bataev 
1101ec469cfSAlexey Bataev     // --i;
1111ec469cfSAlexey Bataev     // CHECK: [[I_PREV:%.+]] = sub nuw i64 [[I]], 1
1121ec469cfSAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp uge i64 [[I_PREV]], [[K2POW]]
1131ec469cfSAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[INNER_BODY]], label %[[INNER_EXIT]]
1141ec469cfSAlexey Bataev     // CHECK: [[INNER_EXIT]]:
1151ec469cfSAlexey Bataev 
1161ec469cfSAlexey Bataev     // ++k;
1171ec469cfSAlexey Bataev     // CHECK: [[K_NEXT]] = add nuw i32 [[K]], 1
1181ec469cfSAlexey Bataev     // k2pow <<= 1;
1191ec469cfSAlexey Bataev     // CHECK: [[K2POW_NEXT]] = shl nuw i64 [[K2POW]], 1
1201ec469cfSAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp ne i32 [[K_NEXT]], [[CEIL_LOG2_10_INT]]
1211ec469cfSAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[OUTER_BODY]], label %[[OUTER_EXIT:[^,]+]]
1221ec469cfSAlexey Bataev     // CHECK: [[OUTER_EXIT]]:
1231ec469cfSAlexey Bataev     bar();
1241ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_init_4(
1251ec469cfSAlexey Bataev     // CHECK: call i8* @llvm.stacksave()
1261ec469cfSAlexey Bataev     // CHECK: store float 0.000000e+00, float* %
1271ec469cfSAlexey Bataev     // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]],
1281ec469cfSAlexey Bataev     // CHECK: br label %[[DISPATCH:[^,]+]]
1291ec469cfSAlexey Bataev 
1301ec469cfSAlexey Bataev     // Skip the before scan body.
1311ec469cfSAlexey Bataev     // CHECK: call void @{{.+}}foo{{.+}}()
1321ec469cfSAlexey Bataev 
1331ec469cfSAlexey Bataev     // CHECK: [[EXIT_INSCAN:[^,]+]]:
1341ec469cfSAlexey Bataev     // CHECK: br label %[[LOOP_CONTINUE:[^,]+]]
1351ec469cfSAlexey Bataev 
1361ec469cfSAlexey Bataev     // CHECK: [[DISPATCH]]:
1371ec469cfSAlexey Bataev     // a_priv[[0..n] = a_buffer[i][0..n];
1381ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]],
1391ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64
1401ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]]
1411ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
1421ec469cfSAlexey Bataev     // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0
1431ec469cfSAlexey Bataev     // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4
1441ec469cfSAlexey Bataev     // CHECK: [[DEST:%.+]] = bitcast float* [[A_PRIV]] to i8*
1451ec469cfSAlexey Bataev     // CHECK: [[SRC:%.+]] = bitcast float* [[A_BUF_IDX]] to i8*
1461ec469cfSAlexey Bataev     // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false)
1471ec469cfSAlexey Bataev 
1481ec469cfSAlexey Bataev     // b_priv = b_buffer[i];
1491ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]]
1501ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]],
1511ec469cfSAlexey Bataev     // CHECK: store double [[B_BUF_IDX_VAL]], double* [[B_PRIV_ADDR]],
1521ec469cfSAlexey Bataev     // CHECK: br label %[[SCAN_PHASE:[^,]+]]
1531ec469cfSAlexey Bataev 
1541ec469cfSAlexey Bataev     // CHECK: [[SCAN_PHASE]]:
1551ec469cfSAlexey Bataev     // CHECK: call void @{{.+}}bar{{.+}}()
1561ec469cfSAlexey Bataev     // CHECK: br label %[[EXIT_INSCAN]]
1571ec469cfSAlexey Bataev 
1581ec469cfSAlexey Bataev     // CHECK: [[LOOP_CONTINUE]]:
1591ec469cfSAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8* %
1601ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_fini(
1611ec469cfSAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8*
1621ec469cfSAlexey Bataev   }
1631ec469cfSAlexey Bataev 
1641ec469cfSAlexey Bataev   // CHECK: call i8* @llvm.stacksave()
1651ec469cfSAlexey Bataev   // CHECK: [[A_BUF_SIZE:%.+]] = mul nuw i64 10, [[NUM_ELEMS:%[^,]+]]
1661ec469cfSAlexey Bataev 
1671ec469cfSAlexey Bataev   // float a_buffer[10][n];
1681ec469cfSAlexey Bataev   // CHECK: [[A_BUF:%.+]] = alloca float, i64 [[A_BUF_SIZE]],
1691ec469cfSAlexey Bataev 
1701ec469cfSAlexey Bataev   // double b_buffer[10];
1711ec469cfSAlexey Bataev   // CHECK: [[B_BUF:%.+]] = alloca double, i64 10,
1721ec469cfSAlexey Bataev #pragma omp parallel for reduction(inscan, +:a[:n], b)
1731ec469cfSAlexey Bataev   for (int i = 0; i < 10; ++i) {
1741ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_init_4(
1751ec469cfSAlexey Bataev     // CHECK: call i8* @llvm.stacksave()
1761ec469cfSAlexey Bataev     // CHECK: store float 0.000000e+00, float* %
1771ec469cfSAlexey Bataev     // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]],
1781ec469cfSAlexey Bataev     // CHECK: br label %[[DISPATCH:[^,]+]]
1791ec469cfSAlexey Bataev 
1801ec469cfSAlexey Bataev     // Skip the before scan body.
1811ec469cfSAlexey Bataev     // CHECK: call void @{{.+}}foo{{.+}}()
1821ec469cfSAlexey Bataev 
1831ec469cfSAlexey Bataev     // CHECK: [[EXIT_INSCAN:[^,]+]]:
1841ec469cfSAlexey Bataev 
1851ec469cfSAlexey Bataev     // a_buffer[i][0..n] = a_priv[[0..n];
1861ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]],
1871ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64
1881ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]]
1891ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
1901ec469cfSAlexey Bataev     // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0
1911ec469cfSAlexey Bataev     // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4
1921ec469cfSAlexey Bataev     // CHECK: [[DEST:%.+]] = bitcast float* [[A_BUF_IDX]] to i8*
1931ec469cfSAlexey Bataev     // CHECK: [[SRC:%.+]] = bitcast float* [[A_PRIV]] to i8*
1941ec469cfSAlexey Bataev     // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false)
1951ec469cfSAlexey Bataev 
1961ec469cfSAlexey Bataev     // b_buffer[i] = b_priv;
1971ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]]
1981ec469cfSAlexey Bataev     // CHECK: [[B_PRIV:%.+]] = load double, double* [[B_PRIV_ADDR]],
1991ec469cfSAlexey Bataev     // CHECK: store double [[B_PRIV]], double* [[B_BUF_IDX]],
2001ec469cfSAlexey Bataev     // CHECK: br label %[[LOOP_CONTINUE:[^,]+]]
2011ec469cfSAlexey Bataev 
2021ec469cfSAlexey Bataev     // CHECK: [[DISPATCH]]:
2031ec469cfSAlexey Bataev     // CHECK: br label %[[INPUT_PHASE:[^,]+]]
2041ec469cfSAlexey Bataev 
2051ec469cfSAlexey Bataev     // CHECK: [[INPUT_PHASE]]:
2061ec469cfSAlexey Bataev     // CHECK: call void @{{.+}}bar{{.+}}()
2071ec469cfSAlexey Bataev     // CHECK: br label %[[EXIT_INSCAN]]
2081ec469cfSAlexey Bataev 
2091ec469cfSAlexey Bataev     // CHECK: [[LOOP_CONTINUE]]:
2101ec469cfSAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8* %
2111ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_fini(
2121ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_barrier(
2131ec469cfSAlexey Bataev     foo();
2141ec469cfSAlexey Bataev #pragma omp scan exclusive(a[:n], b)
2151ec469cfSAlexey Bataev     // CHECK: [[LOG2_10:%.+]] = call double @llvm.log2.f64(double 1.000000e+01)
2161ec469cfSAlexey Bataev     // CHECK: [[CEIL_LOG2_10:%.+]] = call double @llvm.ceil.f64(double [[LOG2_10]])
2171ec469cfSAlexey Bataev     // CHECK: [[CEIL_LOG2_10_INT:%.+]] = fptoui double [[CEIL_LOG2_10]] to i32
2181ec469cfSAlexey Bataev     // CHECK: br label %[[OUTER_BODY:[^,]+]]
2191ec469cfSAlexey Bataev     // CHECK: [[OUTER_BODY]]:
2201ec469cfSAlexey Bataev     // CHECK: [[K:%.+]] = phi i32 [ 0, %{{.+}} ], [ [[K_NEXT:%.+]], %{{.+}} ]
2211ec469cfSAlexey Bataev     // CHECK: [[K2POW:%.+]] = phi i64 [ 1, %{{.+}} ], [ [[K2POW_NEXT:%.+]], %{{.+}} ]
2221ec469cfSAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp uge i64 9, [[K2POW]]
2231ec469cfSAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[INNER_BODY:[^,]+]], label %[[INNER_EXIT:[^,]+]]
2241ec469cfSAlexey Bataev     // CHECK: [[INNER_BODY]]:
2251ec469cfSAlexey Bataev     // CHECK: [[I:%.+]] = phi i64 [ 9, %[[OUTER_BODY]] ], [ [[I_PREV:%.+]], %{{.+}} ]
2261ec469cfSAlexey Bataev 
2271ec469cfSAlexey Bataev     // a_buffer[i] += a_buffer[i-pow(2, k)];
2281ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[I]], [[NUM_ELEMS]]
2291ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
2301ec469cfSAlexey Bataev     // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]]
2311ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[IDX_SUB_K2POW]], [[NUM_ELEMS]]
2321ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
2331ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[I]]
2341ec469cfSAlexey Bataev     // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]]
2351ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[IDX_SUB_K2POW]]
2361ec469cfSAlexey Bataev     // CHECK: [[A_BUF_END:%.+]] = getelementptr float, float* [[A_BUF_IDX]], i64 [[NUM_ELEMS]]
2371ec469cfSAlexey Bataev     // CHECK: [[ISEMPTY:%.+]] = icmp eq float* [[A_BUF_IDX]], [[A_BUF_END]]
2381ec469cfSAlexey Bataev     // CHECK: br i1 [[ISEMPTY]], label %[[RED_DONE:[^,]+]], label %[[RED_BODY:[^,]+]]
2391ec469cfSAlexey Bataev     // CHECK: [[RED_BODY]]:
2401ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_ELEM:%.+]] = phi float* [ [[A_BUF_IDX_SUB_K2POW]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_SUB_K2POW_NEXT:%.+]], %[[RED_BODY]] ]
2411ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_ELEM:%.+]] = phi float* [ [[A_BUF_IDX]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_NEXT:%.+]], %[[RED_BODY]] ]
2421ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_VAL:%.+]] = load float, float* [[A_BUF_IDX_ELEM]],
2431ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_VAL:%.+]] = load float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]],
2441ec469cfSAlexey Bataev     // CHECK: [[RED:%.+]] = fadd float [[A_BUF_IDX_VAL]], [[A_BUF_IDX_SUB_K2POW_VAL]]
2451ec469cfSAlexey Bataev     // CHECK: store float [[RED]], float* [[A_BUF_IDX_ELEM]],
2461ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_NEXT]] = getelementptr float, float* [[A_BUF_IDX_ELEM]], i32 1
2471ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX_SUB_K2POW_NEXT]] = getelementptr float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]], i32 1
2481ec469cfSAlexey Bataev     // CHECK: [[DONE:%.+]] = icmp eq float* [[A_BUF_IDX_NEXT]], [[A_BUF_END]]
2491ec469cfSAlexey Bataev     // CHECK: br i1 [[DONE]], label %[[RED_DONE]], label %[[RED_BODY]]
2501ec469cfSAlexey Bataev     // CHECK: [[RED_DONE]]:
2511ec469cfSAlexey Bataev 
2521ec469cfSAlexey Bataev     // b_buffer[i] += b_buffer[i-pow(2, k)];
2531ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]],
2541ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_SUB_K2POW_VAL:%.+]] = load double, double* [[B_BUF_IDX_SUB_K2POW]],
2551ec469cfSAlexey Bataev     // CHECK: [[RED:%.+]] = fadd double [[B_BUF_IDX_VAL]], [[B_BUF_IDX_SUB_K2POW_VAL]]
2561ec469cfSAlexey Bataev     // CHECK: store double [[RED]], double* [[B_BUF_IDX]],
2571ec469cfSAlexey Bataev 
2581ec469cfSAlexey Bataev     // --i;
2591ec469cfSAlexey Bataev     // CHECK: [[I_PREV:%.+]] = sub nuw i64 [[I]], 1
2601ec469cfSAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp uge i64 [[I_PREV]], [[K2POW]]
2611ec469cfSAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[INNER_BODY]], label %[[INNER_EXIT]]
2621ec469cfSAlexey Bataev     // CHECK: [[INNER_EXIT]]:
2631ec469cfSAlexey Bataev 
2641ec469cfSAlexey Bataev     // ++k;
2651ec469cfSAlexey Bataev     // CHECK: [[K_NEXT]] = add nuw i32 [[K]], 1
2661ec469cfSAlexey Bataev     // k2pow <<= 1;
2671ec469cfSAlexey Bataev     // CHECK: [[K2POW_NEXT]] = shl nuw i64 [[K2POW]], 1
2681ec469cfSAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp ne i32 [[K_NEXT]], [[CEIL_LOG2_10_INT]]
2691ec469cfSAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[OUTER_BODY]], label %[[OUTER_EXIT:[^,]+]]
2701ec469cfSAlexey Bataev     // CHECK: [[OUTER_EXIT]]:
2711ec469cfSAlexey Bataev     bar();
2721ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_init_4(
2731ec469cfSAlexey Bataev     // CHECK: call i8* @llvm.stacksave()
2741ec469cfSAlexey Bataev     // CHECK: store float 0.000000e+00, float* %
2751ec469cfSAlexey Bataev     // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]],
2761ec469cfSAlexey Bataev     // CHECK: br label %[[DISPATCH:[^,]+]]
2771ec469cfSAlexey Bataev 
2781ec469cfSAlexey Bataev     // CHECK: [[SCAN_PHASE:.+]]:
2791ec469cfSAlexey Bataev     // CHECK: call void @{{.+}}foo{{.+}}()
2801ec469cfSAlexey Bataev     // CHECK: br label %[[LOOP_CONTINUE:.+]]
2811ec469cfSAlexey Bataev 
2821ec469cfSAlexey Bataev     // CHECK: [[DISPATCH]]:
2831ec469cfSAlexey Bataev     // if (i >0)
2841ec469cfSAlexey Bataev     //   a_priv[[0..n] = a_buffer[i-1][0..n];
2851ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]],
2861ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64
2871ec469cfSAlexey Bataev     // CHECK: [[CMP:%.+]] = icmp eq i64 [[BASE_IDX]], 0
2881ec469cfSAlexey Bataev     // CHECK: br i1 [[CMP]], label %[[IF_DONE:[^,]+]], label %[[IF_THEN:[^,]+]]
2891ec469cfSAlexey Bataev     // CHECK: [[IF_THEN]]:
2901ec469cfSAlexey Bataev     // CHECK: [[BASE_IDX_SUB_1:%.+]] = sub nuw i64 [[BASE_IDX]], 1
2911ec469cfSAlexey Bataev     // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX_SUB_1]], [[NUM_ELEMS]]
2921ec469cfSAlexey Bataev     // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]]
2931ec469cfSAlexey Bataev     // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0
2941ec469cfSAlexey Bataev     // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4
2951ec469cfSAlexey Bataev     // CHECK: [[DEST:%.+]] = bitcast float* [[A_PRIV]] to i8*
2961ec469cfSAlexey Bataev     // CHECK: [[SRC:%.+]] = bitcast float* [[A_BUF_IDX]] to i8*
2971ec469cfSAlexey Bataev     // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false)
2981ec469cfSAlexey Bataev 
2991ec469cfSAlexey Bataev     // b_priv = b_buffer[i];
3001ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX_SUB_1]]
3011ec469cfSAlexey Bataev     // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]],
3021ec469cfSAlexey Bataev     // CHECK: store double [[B_BUF_IDX_VAL]], double* [[B_PRIV_ADDR]],
3031ec469cfSAlexey Bataev     // CHECK: br label %[[SCAN_PHASE]]
3041ec469cfSAlexey Bataev 
3051ec469cfSAlexey Bataev     // CHECK: [[LOOP_CONTINUE]]:
3061ec469cfSAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8* %
3071ec469cfSAlexey Bataev     // CHECK: call void @__kmpc_for_static_fini(
3081ec469cfSAlexey Bataev     // CHECK: call void @llvm.stackrestore(i8*
3091ec469cfSAlexey Bataev   }
3101ec469cfSAlexey Bataev }
3111ec469cfSAlexey Bataev 
3121ec469cfSAlexey Bataev #endif
3131ec469cfSAlexey Bataev 
314