// RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp -x c++ -emit-llvm %s -o - | FileCheck %s
// RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s

// RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp-simd -x c++ -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s
// RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY0 %s
// SIMD-ONLY0-NOT: {{__kmpc|__tgt}}
// expected-no-diagnostics
#ifndef HEADER
#define HEADER

// Code generation test for the OpenMP in_reduction clause on task constructs.
// The file is compiled directly and also round-tripped through a precompiled
// header; the HEADER guard keeps the second inclusion from redefining
// everything. With -fopenmp-simd no __kmpc/__tgt runtime calls may appear.

// Minimal stand-ins for the allocator handles normally declared in <omp.h>.
typedef void **omp_allocator_handle_t;
extern const omp_allocator_handle_t omp_null_allocator;
extern const omp_allocator_handle_t omp_default_mem_alloc;
extern const omp_allocator_handle_t omp_large_cap_mem_alloc;
extern const omp_allocator_handle_t omp_const_mem_alloc;
extern const omp_allocator_handle_t omp_high_bw_mem_alloc;
extern const omp_allocator_handle_t omp_low_lat_mem_alloc;
extern const omp_allocator_handle_t omp_cgroup_mem_alloc;
extern const omp_allocator_handle_t omp_pteam_mem_alloc;
extern const omp_allocator_handle_t omp_thread_mem_alloc;

// Task privates: one i8* slot per taskgroup reduction descriptor.
// CHECK: [[PRIVATES:%.+]] = type { i8*, i8* }

// Class type with user-provided constructors, copy assignment, destructor and
// operator+; it is the element type of the reduced array `c` in main().
struct S {
  int a;
  S() : a(0) {}
  S(const S&) {}
  S& operator=(const S&) {return *this;}
  ~S() {}
  friend S operator+(const S&a, const S&b) {return a;}
};


// Test driver. Two nested taskgroups declare task reductions (outer: a, b,
// argc; inner: c and the variable-length array d). Inside a parallel region a
// task joins both via in_reduction (a from the outer group, d from the inner
// one, with d placed through the allocate clause). A final task uses
// in_reduction(+:a) outside of any taskgroup.
int main(int argc, char **argv) {
  int a;
  float b;
  S c[5];
  short d[argc];
#pragma omp taskgroup task_reduction(+: a, b, argc)
  {
#pragma omp taskgroup task_reduction(-:c, d)
#pragma omp parallel
#pragma omp task in_reduction(+:a) in_reduction(-:d) allocate(omp_high_bw_mem_alloc: d)
    a += d[a];
  }
#pragma omp task in_reduction(+:a)
  ++a;
  return 0;
}

// main(): each taskgroup start is followed by a reduction-init call (3 items
// for the outer group, 2 for the inner); both returned descriptors are stored
// and their addresses forwarded to the outlined parallel region.
// CHECK-LABEL: @main
// CHECK:       void @__kmpc_taskgroup(%struct.ident_t* @1, i32 [[GTID:%.+]])
// CHECK:       [[TD1:%.+]] = call i8* @__kmpc_taskred_init(i32 [[GTID]], i32 3, i8* %
// CHECK-NEXT:  store i8* [[TD1]], i8** [[TD1_ADDR:%[^,]+]],
// CHECK-NEXT:  call void @__kmpc_taskgroup(%struct.ident_t* @1, i32 [[GTID]])
// CHECK:       [[TD2:%.+]] = call i8* @__kmpc_taskred_init(i32 [[GTID]], i32 2, i8* %
// CHECK-NEXT:  store i8* [[TD2]], i8** [[TD2_ADDR:%[^,]+]],
// CHECK-NEXT:  call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @1, i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i64, i16*, i8**, i8**)* [[OMP_PARALLEL:@.+]] to void (i32*, i32*, ...)*), i32* %{{.+}}, i64 %{{.+}}, i16* %{{.+}}, i8** [[TD1_ADDR]], i8** [[TD2_ADDR]])
// CHECK-NEXT:  call void @__kmpc_end_taskgroup(%struct.ident_t* @1, i32 [[GTID]])
// CHECK-NEXT:  call void @__kmpc_end_taskgroup(%struct.ident_t* @1, i32 [[GTID]])

// Outlined parallel region: allocates the task, copies both reduction
// descriptors into the task's privates, then enqueues the task.
// CHECK:       define internal void [[OMP_PARALLEL]](
// CHECK:       [[TASK_T:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* @1, i32 [[GTID:%.+]], i32 1, i64 56, i64 40, i32 (i32, i8*)* bitcast (i32 (i32, [[T:%.+]]*)* [[OMP_TASK:@.+]] to i32 (i32, i8*)*))
// CHECK-NEXT:  [[TASK_T_WITH_PRIVS:%.+]] = bitcast i8* [[TASK_T]] to [[T]]*
// CHECK:       [[PRIVS:%.+]] = getelementptr inbounds [[T]], [[T]]* [[TASK_T_WITH_PRIVS]], i32 0, i32 1
// CHECK:       [[TD1_REF:%.+]] = getelementptr inbounds [[PRIVATES]], [[PRIVATES]]* [[PRIVS]], i32 0, i32 0
// CHECK-NEXT:  [[TD1:%.+]] = load i8*, i8** %{{.+}},
// CHECK-NEXT:  store i8* [[TD1]], i8** [[TD1_REF]],
// CHECK-NEXT:  [[TD2_REF:%.+]] = getelementptr inbounds [[PRIVATES]], [[PRIVATES]]* [[PRIVS]], i32 0, i32 1
// CHECK-NEXT:  [[TD2:%.+]] = load i8*, i8** %{{.+}},
// CHECK-NEXT:  store i8* [[TD2]], i8** [[TD2_REF]],
// CHECK-NEXT:  call i32 @__kmpc_omp_task(%struct.ident_t* @1, i32 [[GTID]], i8* [[TASK_T]])
// CHECK-NEXT:  ret void
// CHECK-NEXT:  }

// Outlined task body: looks up the thread-specific reduction storage for `a`
// (descriptor 1) and `d` (descriptor 2) before performing the update.
// CHECK:       define internal {{.*}} [[OMP_TASK]](
// CHECK:       call void (i8*, ...) %{{[^(]+}}(i8* %{{.+}}, i8*** [[TD1_REF:%[^,]+]], i8*** [[TD2_REF:%[^,]+]])
// CHECK-NEXT:  [[TD1_ADDR:%.+]] = load i8**, i8*** [[TD1_REF]],
// CHECK-NEXT:  [[TD2_ADDR:%.+]] = load i8**, i8*** [[TD2_REF]],
// CHECK-NEXT:  [[A_REF:%.+]] = getelementptr inbounds %
// CHECK-NEXT:  [[A_ADDR:%.+]] = load i32*, i32** [[A_REF]],
// CHECK-NEXT:  [[TD1:%.+]] = load i8*, i8** [[TD1_ADDR]],
// CHECK-NEXT:  [[GTID:%.+]] = load i32, i32* %
// CHECK-NEXT:  [[A_PTR:%.+]] = bitcast i32* [[A_ADDR]] to i8*
// CHECK-NEXT:  call i8* @__kmpc_task_reduction_get_th_data(i32 [[GTID]], i8* [[TD1]], i8* [[A_PTR]])
// CHECK:       [[D_REF:%.+]] = getelementptr inbounds %
// CHECK-NEXT:  [[D_ADDR:%.+]] = load i16*, i16** [[D_REF]],
// CHECK:       call i8* @__kmpc_threadprivate_cached(
// CHECK:       [[TD2:%.+]] = load i8*, i8** [[TD2_ADDR]],
// CHECK-NEXT:  [[D_PTR:%.+]] = bitcast i16* [[D_ADDR]] to i8*
// CHECK-NEXT:  call i8* @__kmpc_task_reduction_get_th_data(i32 [[GTID]], i8* [[TD2]], i8* [[D_PTR]])
// CHECK:       add nsw i32
// CHECK:       store i32 %
// CHECK-NOT:   call i8* @__kmpc_threadprivate_cached(

// Trailing task without an enclosing taskgroup: the lookup is made with a
// null descriptor and the increment is applied to the returned storage.
// CHECK:       [[A_PTR:%.+]] = call i8* @__kmpc_task_reduction_get_th_data(i32 %{{.+}}, i8* null, i8* %{{.+}})
// CHECK-NEXT:  [[A_ADDR:%.+]] = bitcast i8* [[A_PTR]] to i32*
// CHECK-NEXT:  [[A:%.+]] = load i32, i32* [[A_ADDR]],
// CHECK-NEXT:  [[NEW:%.+]] = add nsw i32 [[A]], 1
// CHECK-NEXT:  store i32 [[NEW]], i32* [[A_ADDR]],
#endif