1*ff260ad0SSaiyedul Islam // RUN: %clang_cc1 -verify -fopenmp -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s 2*ff260ad0SSaiyedul Islam // RUN: %clang_cc1 -fopenmp -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s 3*ff260ad0SSaiyedul Islam // RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s 41ec469cfSAlexey Bataev 5*ff260ad0SSaiyedul Islam // RUN: %clang_cc1 -verify -fopenmp-simd -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s 6*ff260ad0SSaiyedul Islam // RUN: %clang_cc1 -fopenmp-simd -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s 7*ff260ad0SSaiyedul Islam // RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY0 %s 81ec469cfSAlexey Bataev // SIMD-ONLY0-NOT: {{__kmpc|__tgt}} 91ec469cfSAlexey Bataev // expected-no-diagnostics 101ec469cfSAlexey Bataev #ifndef HEADER 111ec469cfSAlexey Bataev #define HEADER 121ec469cfSAlexey Bataev 131ec469cfSAlexey Bataev void foo(); 141ec469cfSAlexey Bataev void bar(); 151ec469cfSAlexey Bataev 161ec469cfSAlexey Bataev // CHECK: define void @{{.*}}baz{{.*}}(i32 %n) 171ec469cfSAlexey Bataev void baz(int n) { 181ec469cfSAlexey Bataev static float a[10]; 191ec469cfSAlexey Bataev static double b; 201ec469cfSAlexey Bataev 211ec469cfSAlexey Bataev // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call( 221ec469cfSAlexey Bataev // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call( 231ec469cfSAlexey Bataev 241ec469cfSAlexey Bataev // CHECK: call i8* @llvm.stacksave() 251ec469cfSAlexey Bataev // CHECK: [[A_BUF_SIZE:%.+]] = mul nuw i64 10, [[NUM_ELEMS:%[^,]+]] 261ec469cfSAlexey Bataev 271ec469cfSAlexey Bataev // float a_buffer[10][n]; 281ec469cfSAlexey Bataev // CHECK: [[A_BUF:%.+]] = alloca float, i64 [[A_BUF_SIZE]], 291ec469cfSAlexey Bataev 301ec469cfSAlexey Bataev // double b_buffer[10]; 311ec469cfSAlexey Bataev // CHECK: [[B_BUF:%.+]] = alloca double, i64 10, 321ec469cfSAlexey Bataev #pragma omp parallel for reduction(inscan, +:a[:n], b) 331ec469cfSAlexey Bataev for (int i = 0; i < 10; ++i) { 341ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_init_4( 351ec469cfSAlexey Bataev // CHECK: call i8* @llvm.stacksave() 361ec469cfSAlexey Bataev // CHECK: store float 0.000000e+00, float* % 371ec469cfSAlexey Bataev // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]], 381ec469cfSAlexey Bataev // CHECK: br label %[[DISPATCH:[^,]+]] 391ec469cfSAlexey Bataev // CHECK: [[INPUT_PHASE:.+]]: 401ec469cfSAlexey Bataev // CHECK: call void @{{.+}}foo{{.+}}() 411ec469cfSAlexey Bataev 421ec469cfSAlexey Bataev // a_buffer[i][0..n] = a_priv[[0..n]; 431ec469cfSAlexey Bataev // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]], 441ec469cfSAlexey Bataev // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64 451ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]] 461ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 471ec469cfSAlexey Bataev // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0 481ec469cfSAlexey Bataev // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4 491ec469cfSAlexey Bataev // CHECK: [[DEST:%.+]] = bitcast float* [[A_BUF_IDX]] to i8* 501ec469cfSAlexey Bataev // CHECK: [[SRC:%.+]] = bitcast float* [[A_PRIV]] to i8* 511ec469cfSAlexey Bataev // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false) 521ec469cfSAlexey Bataev 531ec469cfSAlexey Bataev // b_buffer[i] = b_priv; 541ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]] 551ec469cfSAlexey Bataev // CHECK: [[B_PRIV:%.+]] = load double, double* [[B_PRIV_ADDR]], 561ec469cfSAlexey Bataev // CHECK: store double [[B_PRIV]], double* [[B_BUF_IDX]], 571ec469cfSAlexey Bataev // CHECK: br label %[[LOOP_CONTINUE:.+]] 581ec469cfSAlexey Bataev 591ec469cfSAlexey Bataev // CHECK: [[DISPATCH]]: 601ec469cfSAlexey Bataev // CHECK: br label %[[INPUT_PHASE]] 611ec469cfSAlexey Bataev // CHECK: [[LOOP_CONTINUE]]: 621ec469cfSAlexey Bataev // CHECK: call void @llvm.stackrestore(i8* % 631ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_fini( 641ec469cfSAlexey Bataev // CHECK: call void @__kmpc_barrier( 651ec469cfSAlexey Bataev foo(); 661ec469cfSAlexey Bataev #pragma omp scan inclusive(a[:n], b) 671ec469cfSAlexey Bataev // CHECK: [[LOG2_10:%.+]] = call double @llvm.log2.f64(double 1.000000e+01) 681ec469cfSAlexey Bataev // CHECK: [[CEIL_LOG2_10:%.+]] = call double @llvm.ceil.f64(double [[LOG2_10]]) 691ec469cfSAlexey Bataev // CHECK: [[CEIL_LOG2_10_INT:%.+]] = fptoui double [[CEIL_LOG2_10]] to i32 701ec469cfSAlexey Bataev // CHECK: br label %[[OUTER_BODY:[^,]+]] 711ec469cfSAlexey Bataev // CHECK: [[OUTER_BODY]]: 721ec469cfSAlexey Bataev // CHECK: [[K:%.+]] = phi i32 [ 0, %{{.+}} ], [ [[K_NEXT:%.+]], %{{.+}} ] 731ec469cfSAlexey Bataev // CHECK: [[K2POW:%.+]] = phi i64 [ 1, %{{.+}} ], [ [[K2POW_NEXT:%.+]], %{{.+}} ] 741ec469cfSAlexey Bataev // CHECK: [[CMP:%.+]] = icmp uge i64 9, [[K2POW]] 751ec469cfSAlexey Bataev // CHECK: br i1 [[CMP]], label %[[INNER_BODY:[^,]+]], label %[[INNER_EXIT:[^,]+]] 761ec469cfSAlexey Bataev // CHECK: [[INNER_BODY]]: 771ec469cfSAlexey Bataev // CHECK: [[I:%.+]] = phi i64 [ 9, %[[OUTER_BODY]] ], [ [[I_PREV:%.+]], %{{.+}} ] 781ec469cfSAlexey Bataev 791ec469cfSAlexey Bataev // a_buffer[i] += a_buffer[i-pow(2, k)]; 801ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[I]], [[NUM_ELEMS]] 811ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 821ec469cfSAlexey Bataev // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]] 831ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[IDX_SUB_K2POW]], [[NUM_ELEMS]] 841ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 851ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[I]] 861ec469cfSAlexey Bataev // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]] 871ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[IDX_SUB_K2POW]] 881ec469cfSAlexey Bataev // CHECK: [[A_BUF_END:%.+]] = getelementptr float, float* [[A_BUF_IDX]], i64 [[NUM_ELEMS]] 891ec469cfSAlexey Bataev // CHECK: [[ISEMPTY:%.+]] = icmp eq float* [[A_BUF_IDX]], [[A_BUF_END]] 901ec469cfSAlexey Bataev // CHECK: br i1 [[ISEMPTY]], label %[[RED_DONE:[^,]+]], label %[[RED_BODY:[^,]+]] 911ec469cfSAlexey Bataev // CHECK: [[RED_BODY]]: 921ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW_ELEM:%.+]] = phi float* [ [[A_BUF_IDX_SUB_K2POW]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_SUB_K2POW_NEXT:%.+]], %[[RED_BODY]] ] 931ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_ELEM:%.+]] = phi float* [ [[A_BUF_IDX]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_NEXT:%.+]], %[[RED_BODY]] ] 941ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_VAL:%.+]] = load float, float* [[A_BUF_IDX_ELEM]], 951ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW_VAL:%.+]] = load float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]], 961ec469cfSAlexey Bataev // CHECK: [[RED:%.+]] = fadd float [[A_BUF_IDX_VAL]], [[A_BUF_IDX_SUB_K2POW_VAL]] 971ec469cfSAlexey Bataev // CHECK: store float [[RED]], float* [[A_BUF_IDX_ELEM]], 981ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_NEXT]] = getelementptr float, float* [[A_BUF_IDX_ELEM]], i32 1 991ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW_NEXT]] = getelementptr float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]], i32 1 1001ec469cfSAlexey Bataev // CHECK: [[DONE:%.+]] = icmp eq float* [[A_BUF_IDX_NEXT]], [[A_BUF_END]] 1011ec469cfSAlexey Bataev // CHECK: br i1 [[DONE]], label %[[RED_DONE]], label %[[RED_BODY]] 1021ec469cfSAlexey Bataev // CHECK: [[RED_DONE]]: 1031ec469cfSAlexey Bataev 1041ec469cfSAlexey Bataev // b_buffer[i] += b_buffer[i-pow(2, k)]; 1051ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]], 1061ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_SUB_K2POW_VAL:%.+]] = load double, double* [[B_BUF_IDX_SUB_K2POW]], 1071ec469cfSAlexey Bataev // CHECK: [[RED:%.+]] = fadd double [[B_BUF_IDX_VAL]], [[B_BUF_IDX_SUB_K2POW_VAL]] 1081ec469cfSAlexey Bataev // CHECK: store double [[RED]], double* [[B_BUF_IDX]], 1091ec469cfSAlexey Bataev 1101ec469cfSAlexey Bataev // --i; 1111ec469cfSAlexey Bataev // CHECK: [[I_PREV:%.+]] = sub nuw i64 [[I]], 1 1121ec469cfSAlexey Bataev // CHECK: [[CMP:%.+]] = icmp uge i64 [[I_PREV]], [[K2POW]] 1131ec469cfSAlexey Bataev // CHECK: br i1 [[CMP]], label %[[INNER_BODY]], label %[[INNER_EXIT]] 1141ec469cfSAlexey Bataev // CHECK: [[INNER_EXIT]]: 1151ec469cfSAlexey Bataev 1161ec469cfSAlexey Bataev // ++k; 1171ec469cfSAlexey Bataev // CHECK: [[K_NEXT]] = add nuw i32 [[K]], 1 1181ec469cfSAlexey Bataev // k2pow <<= 1; 1191ec469cfSAlexey Bataev // CHECK: [[K2POW_NEXT]] = shl nuw i64 [[K2POW]], 1 1201ec469cfSAlexey Bataev // CHECK: [[CMP:%.+]] = icmp ne i32 [[K_NEXT]], [[CEIL_LOG2_10_INT]] 1211ec469cfSAlexey Bataev // CHECK: br i1 [[CMP]], label %[[OUTER_BODY]], label %[[OUTER_EXIT:[^,]+]] 1221ec469cfSAlexey Bataev // CHECK: [[OUTER_EXIT]]: 1231ec469cfSAlexey Bataev bar(); 1241ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_init_4( 1251ec469cfSAlexey Bataev // CHECK: call i8* @llvm.stacksave() 1261ec469cfSAlexey Bataev // CHECK: store float 0.000000e+00, float* % 1271ec469cfSAlexey Bataev // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]], 1281ec469cfSAlexey Bataev // CHECK: br label %[[DISPATCH:[^,]+]] 1291ec469cfSAlexey Bataev 1301ec469cfSAlexey Bataev // Skip the before scan body. 1311ec469cfSAlexey Bataev // CHECK: call void @{{.+}}foo{{.+}}() 1321ec469cfSAlexey Bataev 1331ec469cfSAlexey Bataev // CHECK: [[EXIT_INSCAN:[^,]+]]: 1341ec469cfSAlexey Bataev // CHECK: br label %[[LOOP_CONTINUE:[^,]+]] 1351ec469cfSAlexey Bataev 1361ec469cfSAlexey Bataev // CHECK: [[DISPATCH]]: 1371ec469cfSAlexey Bataev // a_priv[[0..n] = a_buffer[i][0..n]; 1381ec469cfSAlexey Bataev // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]], 1391ec469cfSAlexey Bataev // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64 1401ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]] 1411ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 1421ec469cfSAlexey Bataev // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0 1431ec469cfSAlexey Bataev // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4 1441ec469cfSAlexey Bataev // CHECK: [[DEST:%.+]] = bitcast float* [[A_PRIV]] to i8* 1451ec469cfSAlexey Bataev // CHECK: [[SRC:%.+]] = bitcast float* [[A_BUF_IDX]] to i8* 1461ec469cfSAlexey Bataev // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false) 1471ec469cfSAlexey Bataev 1481ec469cfSAlexey Bataev // b_priv = b_buffer[i]; 1491ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]] 1501ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]], 1511ec469cfSAlexey Bataev // CHECK: store double [[B_BUF_IDX_VAL]], double* [[B_PRIV_ADDR]], 1521ec469cfSAlexey Bataev // CHECK: br label %[[SCAN_PHASE:[^,]+]] 1531ec469cfSAlexey Bataev 1541ec469cfSAlexey Bataev // CHECK: [[SCAN_PHASE]]: 1551ec469cfSAlexey Bataev // CHECK: call void @{{.+}}bar{{.+}}() 1561ec469cfSAlexey Bataev // CHECK: br label %[[EXIT_INSCAN]] 1571ec469cfSAlexey Bataev 1581ec469cfSAlexey Bataev // CHECK: [[LOOP_CONTINUE]]: 1591ec469cfSAlexey Bataev // CHECK: call void @llvm.stackrestore(i8* % 1601ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_fini( 1611ec469cfSAlexey Bataev // CHECK: call void @llvm.stackrestore(i8* 1621ec469cfSAlexey Bataev } 1631ec469cfSAlexey Bataev 1641ec469cfSAlexey Bataev // CHECK: call i8* @llvm.stacksave() 1651ec469cfSAlexey Bataev // CHECK: [[A_BUF_SIZE:%.+]] = mul nuw i64 10, [[NUM_ELEMS:%[^,]+]] 1661ec469cfSAlexey Bataev 1671ec469cfSAlexey Bataev // float a_buffer[10][n]; 1681ec469cfSAlexey Bataev // CHECK: [[A_BUF:%.+]] = alloca float, i64 [[A_BUF_SIZE]], 1691ec469cfSAlexey Bataev 1701ec469cfSAlexey Bataev // double b_buffer[10]; 1711ec469cfSAlexey Bataev // CHECK: [[B_BUF:%.+]] = alloca double, i64 10, 1721ec469cfSAlexey Bataev #pragma omp parallel for reduction(inscan, +:a[:n], b) 1731ec469cfSAlexey Bataev for (int i = 0; i < 10; ++i) { 1741ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_init_4( 1751ec469cfSAlexey Bataev // CHECK: call i8* @llvm.stacksave() 1761ec469cfSAlexey Bataev // CHECK: store float 0.000000e+00, float* % 1771ec469cfSAlexey Bataev // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]], 1781ec469cfSAlexey Bataev // CHECK: br label %[[DISPATCH:[^,]+]] 1791ec469cfSAlexey Bataev 1801ec469cfSAlexey Bataev // Skip the before scan body. 1811ec469cfSAlexey Bataev // CHECK: call void @{{.+}}foo{{.+}}() 1821ec469cfSAlexey Bataev 1831ec469cfSAlexey Bataev // CHECK: [[EXIT_INSCAN:[^,]+]]: 1841ec469cfSAlexey Bataev 1851ec469cfSAlexey Bataev // a_buffer[i][0..n] = a_priv[[0..n]; 1861ec469cfSAlexey Bataev // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]], 1871ec469cfSAlexey Bataev // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64 1881ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]] 1891ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 1901ec469cfSAlexey Bataev // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0 1911ec469cfSAlexey Bataev // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4 1921ec469cfSAlexey Bataev // CHECK: [[DEST:%.+]] = bitcast float* [[A_BUF_IDX]] to i8* 1931ec469cfSAlexey Bataev // CHECK: [[SRC:%.+]] = bitcast float* [[A_PRIV]] to i8* 1941ec469cfSAlexey Bataev // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false) 1951ec469cfSAlexey Bataev 1961ec469cfSAlexey Bataev // b_buffer[i] = b_priv; 1971ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]] 1981ec469cfSAlexey Bataev // CHECK: [[B_PRIV:%.+]] = load double, double* [[B_PRIV_ADDR]], 1991ec469cfSAlexey Bataev // CHECK: store double [[B_PRIV]], double* [[B_BUF_IDX]], 2001ec469cfSAlexey Bataev // CHECK: br label %[[LOOP_CONTINUE:[^,]+]] 2011ec469cfSAlexey Bataev 2021ec469cfSAlexey Bataev // CHECK: [[DISPATCH]]: 2031ec469cfSAlexey Bataev // CHECK: br label %[[INPUT_PHASE:[^,]+]] 2041ec469cfSAlexey Bataev 2051ec469cfSAlexey Bataev // CHECK: [[INPUT_PHASE]]: 2061ec469cfSAlexey Bataev // CHECK: call void @{{.+}}bar{{.+}}() 2071ec469cfSAlexey Bataev // CHECK: br label %[[EXIT_INSCAN]] 2081ec469cfSAlexey Bataev 2091ec469cfSAlexey Bataev // CHECK: [[LOOP_CONTINUE]]: 2101ec469cfSAlexey Bataev // CHECK: call void @llvm.stackrestore(i8* % 2111ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_fini( 2121ec469cfSAlexey Bataev // CHECK: call void @__kmpc_barrier( 2131ec469cfSAlexey Bataev foo(); 2141ec469cfSAlexey Bataev #pragma omp scan exclusive(a[:n], b) 2151ec469cfSAlexey Bataev // CHECK: [[LOG2_10:%.+]] = call double @llvm.log2.f64(double 1.000000e+01) 2161ec469cfSAlexey Bataev // CHECK: [[CEIL_LOG2_10:%.+]] = call double @llvm.ceil.f64(double [[LOG2_10]]) 2171ec469cfSAlexey Bataev // CHECK: [[CEIL_LOG2_10_INT:%.+]] = fptoui double [[CEIL_LOG2_10]] to i32 2181ec469cfSAlexey Bataev // CHECK: br label %[[OUTER_BODY:[^,]+]] 2191ec469cfSAlexey Bataev // CHECK: [[OUTER_BODY]]: 2201ec469cfSAlexey Bataev // CHECK: [[K:%.+]] = phi i32 [ 0, %{{.+}} ], [ [[K_NEXT:%.+]], %{{.+}} ] 2211ec469cfSAlexey Bataev // CHECK: [[K2POW:%.+]] = phi i64 [ 1, %{{.+}} ], [ [[K2POW_NEXT:%.+]], %{{.+}} ] 2221ec469cfSAlexey Bataev // CHECK: [[CMP:%.+]] = icmp uge i64 9, [[K2POW]] 2231ec469cfSAlexey Bataev // CHECK: br i1 [[CMP]], label %[[INNER_BODY:[^,]+]], label %[[INNER_EXIT:[^,]+]] 2241ec469cfSAlexey Bataev // CHECK: [[INNER_BODY]]: 2251ec469cfSAlexey Bataev // CHECK: [[I:%.+]] = phi i64 [ 9, %[[OUTER_BODY]] ], [ [[I_PREV:%.+]], %{{.+}} ] 2261ec469cfSAlexey Bataev 2271ec469cfSAlexey Bataev // a_buffer[i] += a_buffer[i-pow(2, k)]; 2281ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[I]], [[NUM_ELEMS]] 2291ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 2301ec469cfSAlexey Bataev // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]] 2311ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[IDX_SUB_K2POW]], [[NUM_ELEMS]] 2321ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 2331ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[I]] 2341ec469cfSAlexey Bataev // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]] 2351ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[IDX_SUB_K2POW]] 2361ec469cfSAlexey Bataev // CHECK: [[A_BUF_END:%.+]] = getelementptr float, float* [[A_BUF_IDX]], i64 [[NUM_ELEMS]] 2371ec469cfSAlexey Bataev // CHECK: [[ISEMPTY:%.+]] = icmp eq float* [[A_BUF_IDX]], [[A_BUF_END]] 2381ec469cfSAlexey Bataev // CHECK: br i1 [[ISEMPTY]], label %[[RED_DONE:[^,]+]], label %[[RED_BODY:[^,]+]] 2391ec469cfSAlexey Bataev // CHECK: [[RED_BODY]]: 2401ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW_ELEM:%.+]] = phi float* [ [[A_BUF_IDX_SUB_K2POW]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_SUB_K2POW_NEXT:%.+]], %[[RED_BODY]] ] 2411ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_ELEM:%.+]] = phi float* [ [[A_BUF_IDX]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_NEXT:%.+]], %[[RED_BODY]] ] 2421ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_VAL:%.+]] = load float, float* [[A_BUF_IDX_ELEM]], 2431ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW_VAL:%.+]] = load float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]], 2441ec469cfSAlexey Bataev // CHECK: [[RED:%.+]] = fadd float [[A_BUF_IDX_VAL]], [[A_BUF_IDX_SUB_K2POW_VAL]] 2451ec469cfSAlexey Bataev // CHECK: store float [[RED]], float* [[A_BUF_IDX_ELEM]], 2461ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_NEXT]] = getelementptr float, float* [[A_BUF_IDX_ELEM]], i32 1 2471ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW_NEXT]] = getelementptr float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]], i32 1 2481ec469cfSAlexey Bataev // CHECK: [[DONE:%.+]] = icmp eq float* [[A_BUF_IDX_NEXT]], [[A_BUF_END]] 2491ec469cfSAlexey Bataev // CHECK: br i1 [[DONE]], label %[[RED_DONE]], label %[[RED_BODY]] 2501ec469cfSAlexey Bataev // CHECK: [[RED_DONE]]: 2511ec469cfSAlexey Bataev 2521ec469cfSAlexey Bataev // b_buffer[i] += b_buffer[i-pow(2, k)]; 2531ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]], 2541ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_SUB_K2POW_VAL:%.+]] = load double, double* [[B_BUF_IDX_SUB_K2POW]], 2551ec469cfSAlexey Bataev // CHECK: [[RED:%.+]] = fadd double [[B_BUF_IDX_VAL]], [[B_BUF_IDX_SUB_K2POW_VAL]] 2561ec469cfSAlexey Bataev // CHECK: store double [[RED]], double* [[B_BUF_IDX]], 2571ec469cfSAlexey Bataev 2581ec469cfSAlexey Bataev // --i; 2591ec469cfSAlexey Bataev // CHECK: [[I_PREV:%.+]] = sub nuw i64 [[I]], 1 2601ec469cfSAlexey Bataev // CHECK: [[CMP:%.+]] = icmp uge i64 [[I_PREV]], [[K2POW]] 2611ec469cfSAlexey Bataev // CHECK: br i1 [[CMP]], label %[[INNER_BODY]], label %[[INNER_EXIT]] 2621ec469cfSAlexey Bataev // CHECK: [[INNER_EXIT]]: 2631ec469cfSAlexey Bataev 2641ec469cfSAlexey Bataev // ++k; 2651ec469cfSAlexey Bataev // CHECK: [[K_NEXT]] = add nuw i32 [[K]], 1 2661ec469cfSAlexey Bataev // k2pow <<= 1; 2671ec469cfSAlexey Bataev // CHECK: [[K2POW_NEXT]] = shl nuw i64 [[K2POW]], 1 2681ec469cfSAlexey Bataev // CHECK: [[CMP:%.+]] = icmp ne i32 [[K_NEXT]], [[CEIL_LOG2_10_INT]] 2691ec469cfSAlexey Bataev // CHECK: br i1 [[CMP]], label %[[OUTER_BODY]], label %[[OUTER_EXIT:[^,]+]] 2701ec469cfSAlexey Bataev // CHECK: [[OUTER_EXIT]]: 2711ec469cfSAlexey Bataev bar(); 2721ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_init_4( 2731ec469cfSAlexey Bataev // CHECK: call i8* @llvm.stacksave() 2741ec469cfSAlexey Bataev // CHECK: store float 0.000000e+00, float* % 2751ec469cfSAlexey Bataev // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]], 2761ec469cfSAlexey Bataev // CHECK: br label %[[DISPATCH:[^,]+]] 2771ec469cfSAlexey Bataev 2781ec469cfSAlexey Bataev // CHECK: [[SCAN_PHASE:.+]]: 2791ec469cfSAlexey Bataev // CHECK: call void @{{.+}}foo{{.+}}() 2801ec469cfSAlexey Bataev // CHECK: br label %[[LOOP_CONTINUE:.+]] 2811ec469cfSAlexey Bataev 2821ec469cfSAlexey Bataev // CHECK: [[DISPATCH]]: 2831ec469cfSAlexey Bataev // if (i >0) 2841ec469cfSAlexey Bataev // a_priv[[0..n] = a_buffer[i-1][0..n]; 2851ec469cfSAlexey Bataev // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]], 2861ec469cfSAlexey Bataev // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64 2871ec469cfSAlexey Bataev // CHECK: [[CMP:%.+]] = icmp eq i64 [[BASE_IDX]], 0 2881ec469cfSAlexey Bataev // CHECK: br i1 [[CMP]], label %[[IF_DONE:[^,]+]], label %[[IF_THEN:[^,]+]] 2891ec469cfSAlexey Bataev // CHECK: [[IF_THEN]]: 2901ec469cfSAlexey Bataev // CHECK: [[BASE_IDX_SUB_1:%.+]] = sub nuw i64 [[BASE_IDX]], 1 2911ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX_SUB_1]], [[NUM_ELEMS]] 2921ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 2931ec469cfSAlexey Bataev // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0 2941ec469cfSAlexey Bataev // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4 2951ec469cfSAlexey Bataev // CHECK: [[DEST:%.+]] = bitcast float* [[A_PRIV]] to i8* 2961ec469cfSAlexey Bataev // CHECK: [[SRC:%.+]] = bitcast float* [[A_BUF_IDX]] to i8* 2971ec469cfSAlexey Bataev // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false) 2981ec469cfSAlexey Bataev 2991ec469cfSAlexey Bataev // b_priv = b_buffer[i]; 3001ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX_SUB_1]] 3011ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]], 3021ec469cfSAlexey Bataev // CHECK: store double [[B_BUF_IDX_VAL]], double* [[B_PRIV_ADDR]], 3031ec469cfSAlexey Bataev // CHECK: br label %[[SCAN_PHASE]] 3041ec469cfSAlexey Bataev 3051ec469cfSAlexey Bataev // CHECK: [[LOOP_CONTINUE]]: 3061ec469cfSAlexey Bataev // CHECK: call void @llvm.stackrestore(i8* % 3071ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_fini( 3081ec469cfSAlexey Bataev // CHECK: call void @llvm.stackrestore(i8* 3091ec469cfSAlexey Bataev } 3101ec469cfSAlexey Bataev } 3111ec469cfSAlexey Bataev 3121ec469cfSAlexey Bataev #endif 3131ec469cfSAlexey Bataev 314