1*1ec469cfSAlexey Bataev // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=50 -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s 2*1ec469cfSAlexey Bataev // RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s 3*1ec469cfSAlexey Bataev // RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s 4*1ec469cfSAlexey Bataev 5*1ec469cfSAlexey Bataev // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=50 -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s 6*1ec469cfSAlexey Bataev // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -x c++ -std=c++11 -triple x86_64-unknown-unknown -emit-pch -o %t %s 7*1ec469cfSAlexey Bataev // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -x c++ -triple x86_64-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY0 %s 8*1ec469cfSAlexey Bataev // SIMD-ONLY0-NOT: {{__kmpc|__tgt}} 9*1ec469cfSAlexey Bataev // expected-no-diagnostics 10*1ec469cfSAlexey Bataev #ifndef HEADER 11*1ec469cfSAlexey Bataev #define HEADER 12*1ec469cfSAlexey Bataev 13*1ec469cfSAlexey Bataev void foo(); 14*1ec469cfSAlexey Bataev void bar(); 15*1ec469cfSAlexey Bataev 16*1ec469cfSAlexey Bataev // CHECK: define void @{{.*}}baz{{.*}}(i32 %n) 17*1ec469cfSAlexey Bataev void baz(int n) { 18*1ec469cfSAlexey Bataev static float a[10]; 19*1ec469cfSAlexey Bataev static double b; 20*1ec469cfSAlexey Bataev 21*1ec469cfSAlexey Bataev // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call( 22*1ec469cfSAlexey Bataev // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call( 23*1ec469cfSAlexey Bataev 24*1ec469cfSAlexey Bataev // CHECK: call i8* @llvm.stacksave() 25*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_SIZE:%.+]] = mul nuw i64 10, [[NUM_ELEMS:%[^,]+]] 26*1ec469cfSAlexey Bataev 27*1ec469cfSAlexey Bataev // float a_buffer[10][n]; 28*1ec469cfSAlexey Bataev // CHECK: [[A_BUF:%.+]] = alloca float, i64 [[A_BUF_SIZE]], 29*1ec469cfSAlexey Bataev 30*1ec469cfSAlexey Bataev // double b_buffer[10]; 31*1ec469cfSAlexey Bataev // CHECK: [[B_BUF:%.+]] = alloca double, i64 10, 32*1ec469cfSAlexey Bataev #pragma omp parallel for reduction(inscan, +:a[:n], b) 33*1ec469cfSAlexey Bataev for (int i = 0; i < 10; ++i) { 34*1ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_init_4( 35*1ec469cfSAlexey Bataev // CHECK: call i8* @llvm.stacksave() 36*1ec469cfSAlexey Bataev // CHECK: store float 0.000000e+00, float* % 37*1ec469cfSAlexey Bataev // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]], 38*1ec469cfSAlexey Bataev // CHECK: br label %[[DISPATCH:[^,]+]] 39*1ec469cfSAlexey Bataev // CHECK: [[INPUT_PHASE:.+]]: 40*1ec469cfSAlexey Bataev // CHECK: call void @{{.+}}foo{{.+}}() 41*1ec469cfSAlexey Bataev 42*1ec469cfSAlexey Bataev // a_buffer[i][0..n] = a_priv[[0..n]; 43*1ec469cfSAlexey Bataev // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]], 44*1ec469cfSAlexey Bataev // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64 45*1ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]] 46*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 47*1ec469cfSAlexey Bataev // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0 48*1ec469cfSAlexey Bataev // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4 49*1ec469cfSAlexey Bataev // CHECK: [[DEST:%.+]] = bitcast float* [[A_BUF_IDX]] to i8* 50*1ec469cfSAlexey Bataev // CHECK: [[SRC:%.+]] = bitcast float* [[A_PRIV]] to i8* 51*1ec469cfSAlexey Bataev // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false) 52*1ec469cfSAlexey Bataev 53*1ec469cfSAlexey Bataev // b_buffer[i] = b_priv; 54*1ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]] 55*1ec469cfSAlexey Bataev // CHECK: [[B_PRIV:%.+]] = load double, double* [[B_PRIV_ADDR]], 56*1ec469cfSAlexey Bataev // CHECK: store double [[B_PRIV]], double* [[B_BUF_IDX]], 57*1ec469cfSAlexey Bataev // CHECK: br label %[[LOOP_CONTINUE:.+]] 58*1ec469cfSAlexey Bataev 59*1ec469cfSAlexey Bataev // CHECK: [[DISPATCH]]: 60*1ec469cfSAlexey Bataev // CHECK: br label %[[INPUT_PHASE]] 61*1ec469cfSAlexey Bataev // CHECK: [[LOOP_CONTINUE]]: 62*1ec469cfSAlexey Bataev // CHECK: call void @llvm.stackrestore(i8* % 63*1ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_fini( 64*1ec469cfSAlexey Bataev // CHECK: call void @__kmpc_barrier( 65*1ec469cfSAlexey Bataev foo(); 66*1ec469cfSAlexey Bataev #pragma omp scan inclusive(a[:n], b) 67*1ec469cfSAlexey Bataev // CHECK: [[LOG2_10:%.+]] = call double @llvm.log2.f64(double 1.000000e+01) 68*1ec469cfSAlexey Bataev // CHECK: [[CEIL_LOG2_10:%.+]] = call double @llvm.ceil.f64(double [[LOG2_10]]) 69*1ec469cfSAlexey Bataev // CHECK: [[CEIL_LOG2_10_INT:%.+]] = fptoui double [[CEIL_LOG2_10]] to i32 70*1ec469cfSAlexey Bataev // CHECK: br label %[[OUTER_BODY:[^,]+]] 71*1ec469cfSAlexey Bataev // CHECK: [[OUTER_BODY]]: 72*1ec469cfSAlexey Bataev // CHECK: [[K:%.+]] = phi i32 [ 0, %{{.+}} ], [ [[K_NEXT:%.+]], %{{.+}} ] 73*1ec469cfSAlexey Bataev // CHECK: [[K2POW:%.+]] = phi i64 [ 1, %{{.+}} ], [ [[K2POW_NEXT:%.+]], %{{.+}} ] 74*1ec469cfSAlexey Bataev // CHECK: [[CMP:%.+]] = icmp uge i64 9, [[K2POW]] 75*1ec469cfSAlexey Bataev // CHECK: br i1 [[CMP]], label %[[INNER_BODY:[^,]+]], label %[[INNER_EXIT:[^,]+]] 76*1ec469cfSAlexey Bataev // CHECK: [[INNER_BODY]]: 77*1ec469cfSAlexey Bataev // CHECK: [[I:%.+]] = phi i64 [ 9, %[[OUTER_BODY]] ], [ [[I_PREV:%.+]], %{{.+}} ] 78*1ec469cfSAlexey Bataev 79*1ec469cfSAlexey Bataev // a_buffer[i] += a_buffer[i-pow(2, k)]; 80*1ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[I]], [[NUM_ELEMS]] 81*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 82*1ec469cfSAlexey Bataev // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]] 83*1ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[IDX_SUB_K2POW]], [[NUM_ELEMS]] 84*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 85*1ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[I]] 86*1ec469cfSAlexey Bataev // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]] 87*1ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[IDX_SUB_K2POW]] 88*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_END:%.+]] = getelementptr float, float* [[A_BUF_IDX]], i64 [[NUM_ELEMS]] 89*1ec469cfSAlexey Bataev // CHECK: [[ISEMPTY:%.+]] = icmp eq float* [[A_BUF_IDX]], [[A_BUF_END]] 90*1ec469cfSAlexey Bataev // CHECK: br i1 [[ISEMPTY]], label %[[RED_DONE:[^,]+]], label %[[RED_BODY:[^,]+]] 91*1ec469cfSAlexey Bataev // CHECK: [[RED_BODY]]: 92*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW_ELEM:%.+]] = phi float* [ [[A_BUF_IDX_SUB_K2POW]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_SUB_K2POW_NEXT:%.+]], %[[RED_BODY]] ] 93*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_ELEM:%.+]] = phi float* [ [[A_BUF_IDX]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_NEXT:%.+]], %[[RED_BODY]] ] 94*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_VAL:%.+]] = load float, float* [[A_BUF_IDX_ELEM]], 95*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW_VAL:%.+]] = load float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]], 96*1ec469cfSAlexey Bataev // CHECK: [[RED:%.+]] = fadd float [[A_BUF_IDX_VAL]], [[A_BUF_IDX_SUB_K2POW_VAL]] 97*1ec469cfSAlexey Bataev // CHECK: store float [[RED]], float* [[A_BUF_IDX_ELEM]], 98*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_NEXT]] = getelementptr float, float* [[A_BUF_IDX_ELEM]], i32 1 99*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW_NEXT]] = getelementptr float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]], i32 1 100*1ec469cfSAlexey Bataev // CHECK: [[DONE:%.+]] = icmp eq float* [[A_BUF_IDX_NEXT]], [[A_BUF_END]] 101*1ec469cfSAlexey Bataev // CHECK: br i1 [[DONE]], label %[[RED_DONE]], label %[[RED_BODY]] 102*1ec469cfSAlexey Bataev // CHECK: [[RED_DONE]]: 103*1ec469cfSAlexey Bataev 104*1ec469cfSAlexey Bataev // b_buffer[i] += b_buffer[i-pow(2, k)]; 105*1ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]], 106*1ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_SUB_K2POW_VAL:%.+]] = load double, double* [[B_BUF_IDX_SUB_K2POW]], 107*1ec469cfSAlexey Bataev // CHECK: [[RED:%.+]] = fadd double [[B_BUF_IDX_VAL]], [[B_BUF_IDX_SUB_K2POW_VAL]] 108*1ec469cfSAlexey Bataev // CHECK: store double [[RED]], double* [[B_BUF_IDX]], 109*1ec469cfSAlexey Bataev 110*1ec469cfSAlexey Bataev // --i; 111*1ec469cfSAlexey Bataev // CHECK: [[I_PREV:%.+]] = sub nuw i64 [[I]], 1 112*1ec469cfSAlexey Bataev // CHECK: [[CMP:%.+]] = icmp uge i64 [[I_PREV]], [[K2POW]] 113*1ec469cfSAlexey Bataev // CHECK: br i1 [[CMP]], label %[[INNER_BODY]], label %[[INNER_EXIT]] 114*1ec469cfSAlexey Bataev // CHECK: [[INNER_EXIT]]: 115*1ec469cfSAlexey Bataev 116*1ec469cfSAlexey Bataev // ++k; 117*1ec469cfSAlexey Bataev // CHECK: [[K_NEXT]] = add nuw i32 [[K]], 1 118*1ec469cfSAlexey Bataev // k2pow <<= 1; 119*1ec469cfSAlexey Bataev // CHECK: [[K2POW_NEXT]] = shl nuw i64 [[K2POW]], 1 120*1ec469cfSAlexey Bataev // CHECK: [[CMP:%.+]] = icmp ne i32 [[K_NEXT]], [[CEIL_LOG2_10_INT]] 121*1ec469cfSAlexey Bataev // CHECK: br i1 [[CMP]], label %[[OUTER_BODY]], label %[[OUTER_EXIT:[^,]+]] 122*1ec469cfSAlexey Bataev // CHECK: [[OUTER_EXIT]]: 123*1ec469cfSAlexey Bataev bar(); 124*1ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_init_4( 125*1ec469cfSAlexey Bataev // CHECK: call i8* @llvm.stacksave() 126*1ec469cfSAlexey Bataev // CHECK: store float 0.000000e+00, float* % 127*1ec469cfSAlexey Bataev // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]], 128*1ec469cfSAlexey Bataev // CHECK: br label %[[DISPATCH:[^,]+]] 129*1ec469cfSAlexey Bataev 130*1ec469cfSAlexey Bataev // Skip the before scan body. 131*1ec469cfSAlexey Bataev // CHECK: call void @{{.+}}foo{{.+}}() 132*1ec469cfSAlexey Bataev 133*1ec469cfSAlexey Bataev // CHECK: [[EXIT_INSCAN:[^,]+]]: 134*1ec469cfSAlexey Bataev // CHECK: br label %[[LOOP_CONTINUE:[^,]+]] 135*1ec469cfSAlexey Bataev 136*1ec469cfSAlexey Bataev // CHECK: [[DISPATCH]]: 137*1ec469cfSAlexey Bataev // a_priv[[0..n] = a_buffer[i][0..n]; 138*1ec469cfSAlexey Bataev // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]], 139*1ec469cfSAlexey Bataev // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64 140*1ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]] 141*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 142*1ec469cfSAlexey Bataev // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0 143*1ec469cfSAlexey Bataev // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4 144*1ec469cfSAlexey Bataev // CHECK: [[DEST:%.+]] = bitcast float* [[A_PRIV]] to i8* 145*1ec469cfSAlexey Bataev // CHECK: [[SRC:%.+]] = bitcast float* [[A_BUF_IDX]] to i8* 146*1ec469cfSAlexey Bataev // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false) 147*1ec469cfSAlexey Bataev 148*1ec469cfSAlexey Bataev // b_priv = b_buffer[i]; 149*1ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]] 150*1ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]], 151*1ec469cfSAlexey Bataev // CHECK: store double [[B_BUF_IDX_VAL]], double* [[B_PRIV_ADDR]], 152*1ec469cfSAlexey Bataev // CHECK: br label %[[SCAN_PHASE:[^,]+]] 153*1ec469cfSAlexey Bataev 154*1ec469cfSAlexey Bataev // CHECK: [[SCAN_PHASE]]: 155*1ec469cfSAlexey Bataev // CHECK: call void @{{.+}}bar{{.+}}() 156*1ec469cfSAlexey Bataev // CHECK: br label %[[EXIT_INSCAN]] 157*1ec469cfSAlexey Bataev 158*1ec469cfSAlexey Bataev // CHECK: [[LOOP_CONTINUE]]: 159*1ec469cfSAlexey Bataev // CHECK: call void @llvm.stackrestore(i8* % 160*1ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_fini( 161*1ec469cfSAlexey Bataev // CHECK: call void @llvm.stackrestore(i8* 162*1ec469cfSAlexey Bataev } 163*1ec469cfSAlexey Bataev 164*1ec469cfSAlexey Bataev // CHECK: call i8* @llvm.stacksave() 165*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_SIZE:%.+]] = mul nuw i64 10, [[NUM_ELEMS:%[^,]+]] 166*1ec469cfSAlexey Bataev 167*1ec469cfSAlexey Bataev // float a_buffer[10][n]; 168*1ec469cfSAlexey Bataev // CHECK: [[A_BUF:%.+]] = alloca float, i64 [[A_BUF_SIZE]], 169*1ec469cfSAlexey Bataev 170*1ec469cfSAlexey Bataev // double b_buffer[10]; 171*1ec469cfSAlexey Bataev // CHECK: [[B_BUF:%.+]] = alloca double, i64 10, 172*1ec469cfSAlexey Bataev #pragma omp parallel for reduction(inscan, +:a[:n], b) 173*1ec469cfSAlexey Bataev for (int i = 0; i < 10; ++i) { 174*1ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_init_4( 175*1ec469cfSAlexey Bataev // CHECK: call i8* @llvm.stacksave() 176*1ec469cfSAlexey Bataev // CHECK: store float 0.000000e+00, float* % 177*1ec469cfSAlexey Bataev // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]], 178*1ec469cfSAlexey Bataev // CHECK: br label %[[DISPATCH:[^,]+]] 179*1ec469cfSAlexey Bataev 180*1ec469cfSAlexey Bataev // Skip the before scan body. 181*1ec469cfSAlexey Bataev // CHECK: call void @{{.+}}foo{{.+}}() 182*1ec469cfSAlexey Bataev 183*1ec469cfSAlexey Bataev // CHECK: [[EXIT_INSCAN:[^,]+]]: 184*1ec469cfSAlexey Bataev 185*1ec469cfSAlexey Bataev // a_buffer[i][0..n] = a_priv[[0..n]; 186*1ec469cfSAlexey Bataev // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]], 187*1ec469cfSAlexey Bataev // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64 188*1ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX]], [[NUM_ELEMS]] 189*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 190*1ec469cfSAlexey Bataev // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0 191*1ec469cfSAlexey Bataev // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4 192*1ec469cfSAlexey Bataev // CHECK: [[DEST:%.+]] = bitcast float* [[A_BUF_IDX]] to i8* 193*1ec469cfSAlexey Bataev // CHECK: [[SRC:%.+]] = bitcast float* [[A_PRIV]] to i8* 194*1ec469cfSAlexey Bataev // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false) 195*1ec469cfSAlexey Bataev 196*1ec469cfSAlexey Bataev // b_buffer[i] = b_priv; 197*1ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX]] 198*1ec469cfSAlexey Bataev // CHECK: [[B_PRIV:%.+]] = load double, double* [[B_PRIV_ADDR]], 199*1ec469cfSAlexey Bataev // CHECK: store double [[B_PRIV]], double* [[B_BUF_IDX]], 200*1ec469cfSAlexey Bataev // CHECK: br label %[[LOOP_CONTINUE:[^,]+]] 201*1ec469cfSAlexey Bataev 202*1ec469cfSAlexey Bataev // CHECK: [[DISPATCH]]: 203*1ec469cfSAlexey Bataev // CHECK: br label %[[INPUT_PHASE:[^,]+]] 204*1ec469cfSAlexey Bataev 205*1ec469cfSAlexey Bataev // CHECK: [[INPUT_PHASE]]: 206*1ec469cfSAlexey Bataev // CHECK: call void @{{.+}}bar{{.+}}() 207*1ec469cfSAlexey Bataev // CHECK: br label %[[EXIT_INSCAN]] 208*1ec469cfSAlexey Bataev 209*1ec469cfSAlexey Bataev // CHECK: [[LOOP_CONTINUE]]: 210*1ec469cfSAlexey Bataev // CHECK: call void @llvm.stackrestore(i8* % 211*1ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_fini( 212*1ec469cfSAlexey Bataev // CHECK: call void @__kmpc_barrier( 213*1ec469cfSAlexey Bataev foo(); 214*1ec469cfSAlexey Bataev #pragma omp scan exclusive(a[:n], b) 215*1ec469cfSAlexey Bataev // CHECK: [[LOG2_10:%.+]] = call double @llvm.log2.f64(double 1.000000e+01) 216*1ec469cfSAlexey Bataev // CHECK: [[CEIL_LOG2_10:%.+]] = call double @llvm.ceil.f64(double [[LOG2_10]]) 217*1ec469cfSAlexey Bataev // CHECK: [[CEIL_LOG2_10_INT:%.+]] = fptoui double [[CEIL_LOG2_10]] to i32 218*1ec469cfSAlexey Bataev // CHECK: br label %[[OUTER_BODY:[^,]+]] 219*1ec469cfSAlexey Bataev // CHECK: [[OUTER_BODY]]: 220*1ec469cfSAlexey Bataev // CHECK: [[K:%.+]] = phi i32 [ 0, %{{.+}} ], [ [[K_NEXT:%.+]], %{{.+}} ] 221*1ec469cfSAlexey Bataev // CHECK: [[K2POW:%.+]] = phi i64 [ 1, %{{.+}} ], [ [[K2POW_NEXT:%.+]], %{{.+}} ] 222*1ec469cfSAlexey Bataev // CHECK: [[CMP:%.+]] = icmp uge i64 9, [[K2POW]] 223*1ec469cfSAlexey Bataev // CHECK: br i1 [[CMP]], label %[[INNER_BODY:[^,]+]], label %[[INNER_EXIT:[^,]+]] 224*1ec469cfSAlexey Bataev // CHECK: [[INNER_BODY]]: 225*1ec469cfSAlexey Bataev // CHECK: [[I:%.+]] = phi i64 [ 9, %[[OUTER_BODY]] ], [ [[I_PREV:%.+]], %{{.+}} ] 226*1ec469cfSAlexey Bataev 227*1ec469cfSAlexey Bataev // a_buffer[i] += a_buffer[i-pow(2, k)]; 228*1ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[I]], [[NUM_ELEMS]] 229*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 230*1ec469cfSAlexey Bataev // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]] 231*1ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[IDX_SUB_K2POW]], [[NUM_ELEMS]] 232*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 233*1ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[I]] 234*1ec469cfSAlexey Bataev // CHECK: [[IDX_SUB_K2POW:%.+]] = sub nuw i64 [[I]], [[K2POW]] 235*1ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_SUB_K2POW:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[IDX_SUB_K2POW]] 236*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_END:%.+]] = getelementptr float, float* [[A_BUF_IDX]], i64 [[NUM_ELEMS]] 237*1ec469cfSAlexey Bataev // CHECK: [[ISEMPTY:%.+]] = icmp eq float* [[A_BUF_IDX]], [[A_BUF_END]] 238*1ec469cfSAlexey Bataev // CHECK: br i1 [[ISEMPTY]], label %[[RED_DONE:[^,]+]], label %[[RED_BODY:[^,]+]] 239*1ec469cfSAlexey Bataev // CHECK: [[RED_BODY]]: 240*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW_ELEM:%.+]] = phi float* [ [[A_BUF_IDX_SUB_K2POW]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_SUB_K2POW_NEXT:%.+]], %[[RED_BODY]] ] 241*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_ELEM:%.+]] = phi float* [ [[A_BUF_IDX]], %[[INNER_BODY]] ], [ [[A_BUF_IDX_NEXT:%.+]], %[[RED_BODY]] ] 242*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_VAL:%.+]] = load float, float* [[A_BUF_IDX_ELEM]], 243*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW_VAL:%.+]] = load float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]], 244*1ec469cfSAlexey Bataev // CHECK: [[RED:%.+]] = fadd float [[A_BUF_IDX_VAL]], [[A_BUF_IDX_SUB_K2POW_VAL]] 245*1ec469cfSAlexey Bataev // CHECK: store float [[RED]], float* [[A_BUF_IDX_ELEM]], 246*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_NEXT]] = getelementptr float, float* [[A_BUF_IDX_ELEM]], i32 1 247*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX_SUB_K2POW_NEXT]] = getelementptr float, float* [[A_BUF_IDX_SUB_K2POW_ELEM]], i32 1 248*1ec469cfSAlexey Bataev // CHECK: [[DONE:%.+]] = icmp eq float* [[A_BUF_IDX_NEXT]], [[A_BUF_END]] 249*1ec469cfSAlexey Bataev // CHECK: br i1 [[DONE]], label %[[RED_DONE]], label %[[RED_BODY]] 250*1ec469cfSAlexey Bataev // CHECK: [[RED_DONE]]: 251*1ec469cfSAlexey Bataev 252*1ec469cfSAlexey Bataev // b_buffer[i] += b_buffer[i-pow(2, k)]; 253*1ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]], 254*1ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_SUB_K2POW_VAL:%.+]] = load double, double* [[B_BUF_IDX_SUB_K2POW]], 255*1ec469cfSAlexey Bataev // CHECK: [[RED:%.+]] = fadd double [[B_BUF_IDX_VAL]], [[B_BUF_IDX_SUB_K2POW_VAL]] 256*1ec469cfSAlexey Bataev // CHECK: store double [[RED]], double* [[B_BUF_IDX]], 257*1ec469cfSAlexey Bataev 258*1ec469cfSAlexey Bataev // --i; 259*1ec469cfSAlexey Bataev // CHECK: [[I_PREV:%.+]] = sub nuw i64 [[I]], 1 260*1ec469cfSAlexey Bataev // CHECK: [[CMP:%.+]] = icmp uge i64 [[I_PREV]], [[K2POW]] 261*1ec469cfSAlexey Bataev // CHECK: br i1 [[CMP]], label %[[INNER_BODY]], label %[[INNER_EXIT]] 262*1ec469cfSAlexey Bataev // CHECK: [[INNER_EXIT]]: 263*1ec469cfSAlexey Bataev 264*1ec469cfSAlexey Bataev // ++k; 265*1ec469cfSAlexey Bataev // CHECK: [[K_NEXT]] = add nuw i32 [[K]], 1 266*1ec469cfSAlexey Bataev // k2pow <<= 1; 267*1ec469cfSAlexey Bataev // CHECK: [[K2POW_NEXT]] = shl nuw i64 [[K2POW]], 1 268*1ec469cfSAlexey Bataev // CHECK: [[CMP:%.+]] = icmp ne i32 [[K_NEXT]], [[CEIL_LOG2_10_INT]] 269*1ec469cfSAlexey Bataev // CHECK: br i1 [[CMP]], label %[[OUTER_BODY]], label %[[OUTER_EXIT:[^,]+]] 270*1ec469cfSAlexey Bataev // CHECK: [[OUTER_EXIT]]: 271*1ec469cfSAlexey Bataev bar(); 272*1ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_init_4( 273*1ec469cfSAlexey Bataev // CHECK: call i8* @llvm.stacksave() 274*1ec469cfSAlexey Bataev // CHECK: store float 0.000000e+00, float* % 275*1ec469cfSAlexey Bataev // CHECK: store double 0.000000e+00, double* [[B_PRIV_ADDR:%.+]], 276*1ec469cfSAlexey Bataev // CHECK: br label %[[DISPATCH:[^,]+]] 277*1ec469cfSAlexey Bataev 278*1ec469cfSAlexey Bataev // CHECK: [[SCAN_PHASE:.+]]: 279*1ec469cfSAlexey Bataev // CHECK: call void @{{.+}}foo{{.+}}() 280*1ec469cfSAlexey Bataev // CHECK: br label %[[LOOP_CONTINUE:.+]] 281*1ec469cfSAlexey Bataev 282*1ec469cfSAlexey Bataev // CHECK: [[DISPATCH]]: 283*1ec469cfSAlexey Bataev // if (i >0) 284*1ec469cfSAlexey Bataev // a_priv[[0..n] = a_buffer[i-1][0..n]; 285*1ec469cfSAlexey Bataev // CHECK: [[BASE_IDX_I:%.+]] = load i32, i32* [[IV_ADDR:%.+]], 286*1ec469cfSAlexey Bataev // CHECK: [[BASE_IDX:%.+]] = zext i32 [[BASE_IDX_I]] to i64 287*1ec469cfSAlexey Bataev // CHECK: [[CMP:%.+]] = icmp eq i64 [[BASE_IDX]], 0 288*1ec469cfSAlexey Bataev // CHECK: br i1 [[CMP]], label %[[IF_DONE:[^,]+]], label %[[IF_THEN:[^,]+]] 289*1ec469cfSAlexey Bataev // CHECK: [[IF_THEN]]: 290*1ec469cfSAlexey Bataev // CHECK: [[BASE_IDX_SUB_1:%.+]] = sub nuw i64 [[BASE_IDX]], 1 291*1ec469cfSAlexey Bataev // CHECK: [[IDX:%.+]] = mul nsw i64 [[BASE_IDX_SUB_1]], [[NUM_ELEMS]] 292*1ec469cfSAlexey Bataev // CHECK: [[A_BUF_IDX:%.+]] = getelementptr inbounds float, float* [[A_BUF]], i64 [[IDX]] 293*1ec469cfSAlexey Bataev // CHECK: [[A_PRIV:%.+]] = getelementptr inbounds [10 x float], [10 x float]* [[A_PRIV_ADDR:%.+]], i64 0, i64 0 294*1ec469cfSAlexey Bataev // CHECK: [[BYTES:%.+]] = mul nuw i64 [[NUM_ELEMS:%.+]], 4 295*1ec469cfSAlexey Bataev // CHECK: [[DEST:%.+]] = bitcast float* [[A_PRIV]] to i8* 296*1ec469cfSAlexey Bataev // CHECK: [[SRC:%.+]] = bitcast float* [[A_BUF_IDX]] to i8* 297*1ec469cfSAlexey Bataev // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* {{.*}}[[DEST]], i8* {{.*}}[[SRC]], i64 [[BYTES]], i1 false) 298*1ec469cfSAlexey Bataev 299*1ec469cfSAlexey Bataev // b_priv = b_buffer[i]; 300*1ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX:%.+]] = getelementptr inbounds double, double* [[B_BUF]], i64 [[BASE_IDX_SUB_1]] 301*1ec469cfSAlexey Bataev // CHECK: [[B_BUF_IDX_VAL:%.+]] = load double, double* [[B_BUF_IDX]], 302*1ec469cfSAlexey Bataev // CHECK: store double [[B_BUF_IDX_VAL]], double* [[B_PRIV_ADDR]], 303*1ec469cfSAlexey Bataev // CHECK: br label %[[SCAN_PHASE]] 304*1ec469cfSAlexey Bataev 305*1ec469cfSAlexey Bataev // CHECK: [[LOOP_CONTINUE]]: 306*1ec469cfSAlexey Bataev // CHECK: call void @llvm.stackrestore(i8* % 307*1ec469cfSAlexey Bataev // CHECK: call void @__kmpc_for_static_fini( 308*1ec469cfSAlexey Bataev // CHECK: call void @llvm.stackrestore(i8* 309*1ec469cfSAlexey Bataev } 310*1ec469cfSAlexey Bataev } 311*1ec469cfSAlexey Bataev 312*1ec469cfSAlexey Bataev #endif 313*1ec469cfSAlexey Bataev 314