1 // RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp -fopenmp-version=45 -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck %s --check-prefix CHECK --check-prefix OMP45
2 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
3 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck %s --check-prefix CHECK --check-prefix OMP45
4 // RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp -fopenmp-version=50 -x c++ -emit-llvm %s -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP50
5 // RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
6 // RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP50
7 
8 // RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp-simd -fopenmp-version=45 -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
9 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
10 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
11 // RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp-simd -fopenmp-version=50 -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
12 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
13 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
14 // SIMD-ONLY0-NOT: {{__kmpc|__tgt}}
15 // expected-no-diagnostics
16 #ifndef HEADER
17 #define HEADER
18 
19 // CHECK-LABEL: @main
// Codegen driver: main() holds three `parallel master taskloop simd` loops,
// each with a different clause set. The FileCheck directives interleaved
// below describe the IR for the three fork calls made from main(), and then,
// ahead of each pragma, the outlined parallel region and task entry function
// that belong to that loop.
20 int main(int argc, char **argv) {
21 // CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* [[DEFLOC:@.+]])
22 // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* [[DEFLOC]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64)* [[OMP_OUTLINED1:@.+]] to void (i32*, i32*, ...)*), i64 [[PRIORITY:%.+]])
23 // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* [[DEFLOC]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64)* [[OMP_OUTLINED2:@.+]] to void (i32*, i32*, ...)*), i64 [[GRAINSIZE:%.+]])
24 // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* [[DEFLOC]], i32 5, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i8***, i64, i64)* [[OMP_OUTLINED3:@.+]] to void (i32*, i32*, ...)*), i32* [[I:%.+]], i32* [[ARGC:%.+]], i8*** [[ARGV:%.+]], i64 [[COND:%.+]], i64 [[NUM_TASKS:%.+]])
25 // CHECK: call void @__kmpc_serialized_parallel(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
26 // CHECK: call void [[OMP_OUTLINED3]](i32* %{{.+}}, i32* %{{.+}}, i32* [[I]], i32* [[ARGC]], i8*** [[ARGV]], i64 [[COND]], i64 [[NUM_TASKS]])
27 // CHECK: call void @__kmpc_end_serialized_parallel(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
28 
29 
30 // CHECK: define internal void [[OMP_OUTLINED1]](i32* noalias %{{.+}}, i32* noalias %{{.+}}, i64 %{{.+}})
31 // CHECK: [[PRIO_ADDR:%.+]] = bitcast i64* %{{.+}} to i32*
32 // CHECK:       [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID:%.+]])
33 // CHECK-NEXT:  [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
34 // CHECK-NEXT:  br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
35 // CHECK:       [[THEN]]
36 // CHECK: call void @__kmpc_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
37 // CHECK: [[PRIO:%.+]] = load i32, i32* [[PRIO_ADDR]],
38 // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 33, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK1:@.+]] to i32 (i32, i8*)*))
39 // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
40 // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
41 // CHECK: [[PRIO_ADDR:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 4
42 // CHECK: [[PRIO_ADDR_CAST:%.+]] = bitcast %{{.+}}* [[PRIO_ADDR]] to i32*
43 // CHECK: store i32 [[PRIO]], i32* [[PRIO_ADDR_CAST]],
44 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
45 // CHECK: store i64 0, i64* [[DOWN]],
46 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
47 // CHECK: store i64 9, i64* [[UP]],
48 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
49 // CHECK: store i64 1, i64* [[ST]],
50 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
51 // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 0, i64 0, i8* null)
52 // CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
53 // CHECK-NEXT:  call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
54 // CHECK-NEXT:  br label {{%?}}[[EXIT]]
55 // CHECK:       [[EXIT]]
56 
57 
58 // CHECK: define internal i32 [[TASK1]](
59 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
60 // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
61 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
62 // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
63 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
64 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
65 // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
66 // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
67 // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
68 // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
69 // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
70 // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
71 // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
72 // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
73 // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
74 // CHECK: br label
75 // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
76 // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
77 // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
78 // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
79 // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
80 // CHECK: load i32, i32* %
81 // CHECK: store i32 %
82 // CHECK: load i32, i32* %
83 // CHECK: add nsw i32 %{{.+}}, 1
84 // CHECK: store i32 %{{.+}}, i32* %
85 // CHECK: br label %
86 // CHECK: ret i32 0
87 
// Loop 1: priority(argc) with safelen(8) over a constant 10-iteration range.
// No nogroup clause here; the directives above look for a taskgroup
// begin/end pair around the taskloop runtime call.
88 #pragma omp parallel master taskloop simd priority(argc) safelen(8)
89   for (int i = 0; i < 10; ++i)
90     ;
91 // CHECK: define internal void [[OMP_OUTLINED2]](i32* noalias %{{.+}}, i32* noalias %{{.+}}, i64 %{{.+}})
92 // CHECK:       [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID:%.+]])
93 // CHECK-NEXT:  [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
94 // CHECK-NEXT:  br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
95 // CHECK:       [[THEN]]
96 // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK2:@.+]] to i32 (i32, i8*)*))
97 // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
98 // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
99 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
100 // CHECK: store i64 0, i64* [[DOWN]],
101 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
102 // CHECK: store i64 9, i64* [[UP]],
103 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
104 // CHECK: store i64 1, i64* [[ST]],
105 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
106 // CHECK: [[GRAINSIZE:%.+]] = zext i32 %{{.+}} to i64
107 // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 1, i64 [[GRAINSIZE]], i8* null)
108 // CHECK-NEXT:  call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
109 // CHECK-NEXT:  br label {{%?}}[[EXIT]]
110 // CHECK:       [[EXIT]]
111 
112 
113 // CHECK: define internal i32 [[TASK2]](
114 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
115 // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
116 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
117 // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
118 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
119 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
120 // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
121 // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
122 // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
123 // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
124 // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
125 // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
126 // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
127 // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
128 // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
129 // CHECK: br label
130 // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],{{.*}}!llvm.access.group
131 // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
132 // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],{{.*}}!llvm.access.group
133 // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
134 // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
135 // CHECK: load i32, i32* %{{.*}}!llvm.access.group
136 // CHECK: store i32 %{{.*}}!llvm.access.group
137 // CHECK: load i32, i32* %
138 // CHECK: add nsw i32 %{{.+}}, 1
139 // CHECK: store i32 %{{.+}}, i32* %
140 // CHECK: br label %
141 // CHECK: ret i32 0
142 
// Loop 2: nogroup + grainsize(argc) with simdlen(16). The directives above
// contain no taskgroup calls and hand the zero-extended grainsize value to
// the taskloop runtime call.
143 #pragma omp parallel master taskloop simd nogroup grainsize(argc) simdlen(16)
144   for (int i = 0; i < 10; ++i)
145     ;
146 // CHECK: define internal void [[OMP_OUTLINED3]](i32* noalias %{{.+}}, i32* noalias %{{.+}}, i32* nonnull align 4 dereferenceable(4) %{{.+}}, i8*** nonnull align 8 dereferenceable(8) %{{.+}}, i64 %{{.+}}, i64 %{{.+}})
147 // CHECK:       [[RES:%.+]] = call {{.*}}i32 @__kmpc_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID:%.+]])
148 // CHECK-NEXT:  [[IS_MASTER:%.+]] = icmp ne i32 [[RES]], 0
149 // CHECK-NEXT:  br i1 [[IS_MASTER]], label {{%?}}[[THEN:.+]], label {{%?}}[[EXIT:.+]]
150 // CHECK:       [[THEN]]
151 // CHECK: call void @__kmpc_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
152 // OMP45: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 88, i64 24, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK3:@.+]] to i32 (i32, i8*)*))
153 // OMP50: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 88, i64 32, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK3:@.+]] to i32 (i32, i8*)*))
154 // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
155 // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
156 // CHECK: [[COND_VAL:%.+]] = load i8, i8* %{{.+}},
157 // CHECK: [[COND_BOOL:%.+]] = trunc i8 [[COND_VAL]] to i1
158 // CHECK: [[IF_INT:%.+]] = sext i1 [[COND_BOOL]] to i32
159 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
160 // CHECK: store i64 0, i64* [[DOWN]],
161 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
162 // CHECK: store i64 %{{.+}}, i64* [[UP]],
163 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
164 // CHECK: store i64 1, i64* [[ST]],
165 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
166 // CHECK: [[NUM_TASKS:%.+]] = zext i32 %{{.+}} to i64
167 // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 [[IF_INT]], i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 2, i64 [[NUM_TASKS]], i8* bitcast (void ([[TDP_TY]]*, [[TDP_TY]]*, i32)* [[TASK_DUP:@.+]] to i8*))
168 // CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
169 // CHECK-NEXT:  call {{.*}}void @__kmpc_end_master(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
170 // CHECK-NEXT:  br label {{%?}}[[EXIT]]
171 // CHECK:       [[EXIT]]
172 
173 // CHECK: define internal i32 [[TASK3]](
174 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
175 // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
176 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
177 // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
178 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
179 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
180 // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
181 // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
182 // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
183 // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
184 // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
185 // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
186 // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
187 // CHECK: store i64 [[LB_VAL]], i64* [[CNT:%.+]],
188 // CHECK: br label
189 // CHECK: ret i32 0
190 
// Loop 3: a two-level nest merged by collapse(2), with if, shared, num_tasks,
// lastprivate and aligned clauses. `i` is declared outside the loop and is
// the variable named in lastprivate(i); the inner bound reads argv[argc][argc].
191   int i;
192 #pragma omp parallel master taskloop simd if(argc) shared(argc, argv) collapse(2) num_tasks(argc) lastprivate(i) aligned(argv:8)
193   for (i = 0; i < argc; ++i)
194   for (int j = argc; j < argv[argc][argc]; ++j)
195     ;
196 }
197 
198 // CHECK-LABEL: @_ZN1SC2Ei
// Same combined directive, this time inside a constructor: the loop counter
// is the data member `a` and the loop bound is the constructor parameter `c`.
// The global object `s(1)` declared at the end constructs one instance.
199 struct S {
200   int a;
201   S(int c) {
202 // CHECK: call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* [[DEFLOC]], i32 3, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, %struct.S*, i32*, i64)* [[OMP_OUTLINED4:@.+]] to void (i32*, i32*, ...)*), %struct.S* %{{.+}}, i32* %{{.+}}, i64 %{{.+}})
203 
204 // CHECK: define internal void [[OMP_OUTLINED4]](i32* noalias %{{.+}}, i32* noalias %{{.+}}, %struct.S* %{{.+}}, i32* nonnull align 4 dereferenceable(4) %{{.+}}, i64 %{{.+}})
205 // CHECK: [[CONV:%.+]] = bitcast i64* %{{.+}} to i8*
206 // CHECK: [[CONDI8:%.+]] = load i8, i8* [[CONV]],
207 // CHECK: [[COND:%.+]] = trunc i8 [[CONDI8]] to i1
208 // CHECK: [[IS_FINAL:%.+]] = select i1 [[COND:%.+]], i32 2, i32 0
209 // CHECK: [[FLAGS:%.+]] = or i32 [[IS_FINAL]], 1
210 // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID:%.+]], i32 [[FLAGS]], i64 80, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK4:@.+]] to i32 (i32, i8*)*))
211 // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
212 // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
213 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
214 // CHECK: store i64 0, i64* [[DOWN]],
215 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
216 // CHECK: store i64 %{{.+}}, i64* [[UP]],
217 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
218 // CHECK: store i64 1, i64* [[ST]],
219 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
220 // CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 2, i64 4, i8* null)
    // Clauses under test: shared(c), a constant num_tasks(4), and final(c).
    // The directives above look for the literal 4 in the taskloop runtime
    // call and for a task flag built from a select (2 or 0) or'ed with 1.
221 #pragma omp parallel master taskloop simd shared(c) num_tasks(4) final(c)
222     for (a = 0; a < c; ++a)
223       ;
224   }
225 } s(1);
226 
227 // CHECK: define internal i32 [[TASK4]](
228 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
229 // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
230 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
231 // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
232 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
233 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
234 // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
235 // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
236 // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
237 // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
238 // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
239 // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
240 // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
241 // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
242 // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
243 // CHECK: br label
244 // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
245 // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
246 // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
247 // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
248 // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
249 // CHECK: load i32, i32* %{{.*}}!llvm.access.group
250 // CHECK: store i32 %{{.*}}!llvm.access.group
251 // CHECK: load i32, i32* %
252 // CHECK: add nsw i32 %{{.+}}, 1
253 // CHECK: store i32 %{{.+}}, i32* %
254 // CHECK: br label %
255 // CHECK: ret i32 0
256 
257 // OMP45-NOT: !{!"llvm.loop.vectorize.enable", i1 false}
258 // CHECK-DAG: !{!"llvm.loop.vectorize.enable", i1 true}
259 // OMP50-DAG: !{!"llvm.loop.vectorize.enable", i1 false}
260 // OMP45-NOT: !{!"llvm.loop.vectorize.enable", i1 false}
261 
262 #endif
263