// RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck %s
// RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck %s

// RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp-simd -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
// RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
// SIMD-ONLY0-NOT: {{__kmpc|__tgt}}
// expected-no-diagnostics

// Code generation test for '#pragma omp master taskloop'.
//
// The -fopenmp invocations match the emitted LLVM IR against the FileCheck
// directives below: the master-region guard, the optional taskgroup, the task
// allocation, the bounds/stride stores and the final __kmpc_taskloop call,
// followed by the bodies of the outlined task entry functions.
// The -fopenmp-simd invocations only require that no __kmpc/__tgt symbol is
// emitted. Each configuration is also exercised through a precompiled header
// built from this same file, which is why the contents sit inside the HEADER
// include guard.
#ifndef HEADER
#define HEADER

// CHECK-LABEL: @main
int main(int argc, char **argv) {
// Plain task: a task allocation followed by the task submission call.
// CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* [[DEFLOC:@.+]])
// CHECK: call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]],
// CHECK: call i32 @__kmpc_omp_task(%struct.ident_t* [[DEFLOC]], i32 [[GTID]],
#pragma omp task
  ;
// priority clause: the region is guarded by __kmpc_master/__kmpc_end_master,
// wrapped in a taskgroup, and the task is allocated with flags value 33.
// CHECK: [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
// CHECK-NEXT: [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
// CHECK-NEXT: br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
// CHECK: [[THEN]]
// CHECK: call void @__kmpc_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 33, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK1:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 9, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 0, i64 0, i8* null)
// CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
// CHECK-NEXT: call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
// CHECK-NEXT: br label {{%?}}[[EXIT]]
// CHECK: [[EXIT]]
#pragma omp master taskloop priority(argc)
  for (int i = 0; i < 10; ++i)
    ;
// nogroup + grainsize: no taskgroup calls are listed for this region, and the
// zero-extended grainsize value is passed to __kmpc_taskloop after 'i32 1'.
// CHECK: [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
// CHECK-NEXT: [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
// CHECK-NEXT: br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
// CHECK: [[THEN]]
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK2:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 9, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[GRAINSIZE:%.+]] = zext i32 %{{.+}} to i64
// CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 1, i64 [[GRAINSIZE]], i8* null)
// CHECK-NEXT: call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
// CHECK-NEXT: br label {{%?}}[[EXIT]]
// CHECK: [[EXIT]]
#pragma omp master taskloop nogroup grainsize(argc)
  for (int i = 0; i < 10; ++i)
    ;
// if + shared + collapse(2) + num_tasks(4): the 'if' condition is converted to
// an i32 and handed to __kmpc_taskloop, which also receives 'i32 2, i64 4';
// the upper bound is a runtime value rather than a constant.
// CHECK: [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
// CHECK-NEXT: [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
// CHECK-NEXT: br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
// CHECK: [[THEN]]
// CHECK: call void @__kmpc_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK3:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[IF:%.+]] = icmp ne i32 %{{.+}}, 0
// CHECK: [[IF_INT:%.+]] = sext i1 [[IF]] to i32
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 %{{.+}}, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 [[IF_INT]], i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 2, i64 4, i8* null)
// CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
// CHECK-NEXT: call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
// CHECK-NEXT: br label {{%?}}[[EXIT]]
// CHECK: [[EXIT]]
  int i;
#pragma omp master taskloop if(argc) shared(argc, argv) collapse(2) num_tasks(4)
  for (i = 0; i < argc; ++i)
    for (int j = argc; j < argv[argc][argc]; ++j)
      ;
}

// Outlined task entry for the priority(argc) loop: loads lower bound, upper
// bound, stride and last-iteration flag from the task data, then iterates with
// a 32-bit counter.
// CHECK: define internal i32 [[TASK1]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
// CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
// CHECK: br label
// CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
// CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
// CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
// CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
// CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
// CHECK: load i32, i32* %
// CHECK: store i32 %
// CHECK: load i32, i32* %
// CHECK: add nsw i32 %{{.+}}, 1
// CHECK: store i32 %{{.+}}, i32* %
// CHECK: br label %
// CHECK: ret i32 0

// Outlined task entry for the nogroup grainsize(argc) loop.
// CHECK: define internal i32 [[TASK2]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
// CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
// CHECK: br label
// CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
// CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
// CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
// CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
// CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
// CHECK: load i32, i32* %
// CHECK: store i32 %
// CHECK: load i32, i32* %
// CHECK: add nsw i32 %{{.+}}, 1
// CHECK: store i32 %{{.+}}, i32* %
// CHECK: br label %
// CHECK: ret i32 0

// Outlined task entry for the collapse(2) loop nest: the lower bound is stored
// into the counter as a 64-bit value, without truncation.
// CHECK: define internal i32 [[TASK3]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: store i64 [[LB_VAL]], i64* [[CNT:%.+]],
// CHECK: br label
// CHECK: ret i32 0

// CHECK-LABEL: @_ZN1SC2Ei
struct S {
  int a;
  // Constructor whose taskloop uses the data member 'a' both as the loop
  // counter and as the num_tasks argument.
  S(int c) {
// CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* [[DEFLOC:@.+]])
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK4:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 %{{.+}}, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[NUM_TASKS:%.+]] = zext i32 %{{.+}} to i64
// CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 2, i64 [[NUM_TASKS]], i8* null)
#pragma omp master taskloop shared(c) num_tasks(a)
    for (a = 0; a < c; ++a)
      ;
  }
} s(1);

// Outlined task entry for the taskloop inside S::S(int).
// CHECK: define internal i32 [[TASK4]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
// CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
// CHECK: br label
// CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
// CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
// CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
// CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
// CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
// CHECK: load i32, i32* %
// CHECK: store i32 %
// CHECK: load i32, i32* %
// CHECK: add nsw i32 %{{.+}}, 1
// CHECK: store i32 %{{.+}}, i32* %
// CHECK: br label %
// CHECK: ret i32 0

#endif