1 // RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck %s
2 // RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
3 // RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck %s
4 
5 // RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp-simd -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
6 // RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
7 // RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
8 // SIMD-ONLY0-NOT: {{__kmpc|__tgt}}
9 // expected-no-diagnostics
10 #ifndef HEADER
11 #define HEADER
12 
13 // CHECK-LABEL: @main
// Test driver: one plain `task` followed by three `master taskloop` variants.
// The FileCheck directives interleaved with the code pin the runtime calls that
// the -fopenmp RUN lines must emit for each construct, in source order.
14 int main(int argc, char **argv) {
// Plain task: the thread id is captured once as GTID (and the location as
// DEFLOC); every later directive in this function reuses both captures.
15 // CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* [[DEFLOC:@.+]])
16 // CHECK: call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]],
17 // CHECK: call i32 @__kmpc_omp_task(%struct.ident_t* [[DEFLOC]], i32 [[GTID]],
18 #pragma omp task
19   ;
// Variant 1, priority(argc): the loop is guarded by __kmpc_master /
// __kmpc_end_master and bracketed by __kmpc_taskgroup / __kmpc_end_taskgroup.
// The i32 argument after the thread id in task_alloc is 33 here and 1 in the
// variants without a priority clause. Bounds are the constants 0 and 9, and
// the two arguments before the trailing `i8* null` of __kmpc_taskloop are
// `i32 0, i64 0` (neither grainsize nor num_tasks is present).
20 // CHECK:       [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
21 // CHECK-NEXT:  [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
22 // CHECK-NEXT:  br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
23 // CHECK:       [[THEN]]
24 // CHECK: call void @__kmpc_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
25 // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 33, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK1:@.+]] to i32 (i32, i8*)*))
26 // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
27 // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
28 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
29 // CHECK: store i64 0, i64* [[DOWN]],
30 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
31 // CHECK: store i64 9, i64* [[UP]],
32 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
33 // CHECK: store i64 1, i64* [[ST]],
34 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
35 // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 0, i64 0, i8* null)
36 // CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
37 // CHECK-NEXT:  call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
38 // CHECK-NEXT:  br label {{%?}}[[EXIT]]
39 // CHECK:       [[EXIT]]
40 #pragma omp master taskloop priority(argc)
41   for (int i = 0; i < 10; ++i)
42     ;
// Variant 2, nogroup grainsize(argc): no taskgroup calls are listed, and
// __kmpc_end_master is required on the line right after __kmpc_taskloop.
// The grainsize value is zero-extended from i32 to i64 and passed together
// with `i32 1` in the two arguments before the trailing `i8* null`.
43 // CHECK:       [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
44 // CHECK-NEXT:  [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
45 // CHECK-NEXT:  br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
46 // CHECK:       [[THEN]]
47 // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK2:@.+]] to i32 (i32, i8*)*))
48 // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
49 // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
50 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
51 // CHECK: store i64 0, i64* [[DOWN]],
52 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
53 // CHECK: store i64 9, i64* [[UP]],
54 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
55 // CHECK: store i64 1, i64* [[ST]],
56 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
57 // CHECK: [[GRAINSIZE:%.+]] = zext i32 %{{.+}} to i64
58 // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 1, i64 [[GRAINSIZE]], i8* null)
59 // CHECK-NEXT:  call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
60 // CHECK-NEXT:  br label {{%?}}[[EXIT]]
61 // CHECK:       [[EXIT]]
62 #pragma omp master taskloop nogroup grainsize(argc)
63   for (int i = 0; i < 10; ++i)
64     ;
// Variant 3, if(argc) shared(argc, argv) collapse(2) num_tasks(4): the taskgroup
// bracket is back. The if-condition is computed as `icmp ne i32 ..., 0`,
// sign-extended to i32 and passed as the argument after the task pointer.
// The upper bound is a runtime value instead of the constant 9, task_alloc
// pins `i64 16` where the earlier variants pin `i64 1`, and the two arguments
// before the trailing `i8* null` are `i32 2, i64 4`.
65 // CHECK:       [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
66 // CHECK-NEXT:  [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
67 // CHECK-NEXT:  br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
68 // CHECK:       [[THEN]]
69 // CHECK: call void @__kmpc_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
70 // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK3:@.+]] to i32 (i32, i8*)*))
71 // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
72 // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
73 // CHECK: [[IF:%.+]] = icmp ne i32 %{{.+}}, 0
74 // CHECK: [[IF_INT:%.+]] = sext i1 [[IF]] to i32
75 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
76 // CHECK: store i64 0, i64* [[DOWN]],
77 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
78 // CHECK: store i64 %{{.+}}, i64* [[UP]],
79 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
80 // CHECK: store i64 1, i64* [[ST]],
81 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
82 // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 [[IF_INT]], i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 2, i64 4, i8* null)
83 // CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
84 // CHECK-NEXT:  call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
85 // CHECK-NEXT:  br label {{%?}}[[EXIT]]
86 // CHECK:       [[EXIT]]
// `i` is declared outside the construct, so the outer loop of the collapsed
// nest iterates over a pre-existing variable while the inner loop declares `j`.
87   int i;
88 #pragma omp master taskloop if(argc) shared(argc, argv) collapse(2) num_tasks(4)
89   for (i = 0; i < argc; ++i)
90   for (int j = argc; j < argv[argc][argc]; ++j)
91     ;
92 }
93 
94 // CHECK: define internal i32 [[TASK1]](
95 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
96 // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
97 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
98 // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
99 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
100 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
101 // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
102 // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
103 // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
104 // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
105 // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
106 // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
107 // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
108 // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
109 // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
110 // CHECK: br label
111 // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
112 // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
113 // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
114 // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
115 // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
116 // CHECK: load i32, i32* %
117 // CHECK: store i32 %
118 // CHECK: load i32, i32* %
119 // CHECK: add nsw i32 %{{.+}}, 1
120 // CHECK: store i32 %{{.+}}, i32* %
121 // CHECK: br label %
122 // CHECK: ret i32 0
123 
124 // CHECK: define internal i32 [[TASK2]](
125 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
126 // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
127 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
128 // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
129 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
130 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
131 // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
132 // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
133 // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
134 // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
135 // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
136 // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
137 // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
138 // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
139 // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
140 // CHECK: br label
141 // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
142 // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
143 // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
144 // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
145 // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
146 // CHECK: load i32, i32* %
147 // CHECK: store i32 %
148 // CHECK: load i32, i32* %
149 // CHECK: add nsw i32 %{{.+}}, 1
150 // CHECK: store i32 %{{.+}}, i32* %
151 // CHECK: br label %
152 // CHECK: ret i32 0
153 
154 // CHECK: define internal i32 [[TASK3]](
155 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
156 // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
157 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
158 // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
159 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
160 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
161 // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
162 // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
163 // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
164 // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
165 // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
166 // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
167 // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
168 // CHECK: store i64 [[LB_VAL]], i64* [[CNT:%.+]],
169 // CHECK: br label
170 // CHECK: ret i32 0
171 
172 // CHECK-LABEL: @_ZN1SC2Ei
// S's constructor hosts a `master taskloop` whose iteration variable is the
// data member `a`; the num_tasks clause reads that same member. The global
// object `s(1)` defined together with the struct constructs S with c == 1.
173 struct S {
174   int a;
175   S(int c) {
// Directives for the constructor body: task_alloc is pinned with `i32 1` and
// `i64 16`, the upper bound is a runtime value, and the num_tasks value is
// zero-extended to i64 and passed to __kmpc_taskloop next to `i32 2`.
176 // CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* [[DEFLOC:@.+]])
177 // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK4:@.+]] to i32 (i32, i8*)*))
178 // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
179 // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
180 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
181 // CHECK: store i64 0, i64* [[DOWN]],
182 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
183 // CHECK: store i64 %{{.+}}, i64* [[UP]],
184 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
185 // CHECK: store i64 1, i64* [[ST]],
186 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
187 // CHECK: [[NUM_TASKS:%.+]] = zext i32 %{{.+}} to i64
188 // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 2, i64 [[NUM_TASKS]], i8* null)
189 #pragma omp master taskloop shared(c) num_tasks(a)
190     for (a = 0; a < c; ++a)
191       ;
192   }
193 } s(1);
194 
195 // CHECK: define internal i32 [[TASK4]](
196 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
197 // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
198 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
199 // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
200 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
201 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
202 // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
203 // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
204 // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
205 // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
206 // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
207 // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
208 // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
209 // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
210 // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
211 // CHECK: br label
212 // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
213 // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
214 // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
215 // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
216 // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
217 // CHECK: load i32, i32* %
218 // CHECK: store i32 %
219 // CHECK: load i32, i32* %
220 // CHECK: add nsw i32 %{{.+}}, 1
221 // CHECK: store i32 %{{.+}}, i32* %
222 // CHECK: br label %
223 // CHECK: ret i32 0
224 
225 #endif
226