1 // Test host codegen.
2 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=45 -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix CHECK --check-prefix CHECK-64
3 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-pch -o %t %s
4 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix CHECK --check-prefix CHECK-64
5 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=45 -x c++ -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-llvm %s -o - | FileCheck %s --check-prefix CHECK --check-prefix CHECK-32
6 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-pch -o %t %s
7 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix CHECK --check-prefix CHECK-32
8 
9 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=45 -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s
10 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-pch -o %t %s
11 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY0 %s
12 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=45 -x c++ -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s
13 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-pch -o %t %s
14 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY0 %s
15 // SIMD-ONLY0-NOT: {{__kmpc|__tgt}}
16 
17 // Test target codegen - host bc file has to be created first.
18 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=45 -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-llvm-bc %s -o %t-ppc-host.bc
19 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=45 -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - | FileCheck %s --check-prefix TCHECK --check-prefix TCHECK-64
20 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-pch -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o %t %s
21 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -std=c++11 -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix TCHECK --check-prefix TCHECK-64
22 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=45 -x c++ -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-llvm-bc %s -o %t-x86-host.bc
23 // RUN: %clang_cc1 -verify -fopenmp -fopenmp-version=45 -x c++ -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -o - | FileCheck %s --check-prefix TCHECK --check-prefix TCHECK-32
24 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-pch -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -o %t %s
25 // RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -std=c++11 -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix TCHECK --check-prefix TCHECK-32
26 
27 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=45 -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-llvm-bc %s -o %t-ppc-host.bc
28 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=45 -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - | FileCheck --check-prefix SIMD-ONLY1 %s
29 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -emit-pch -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o %t %s
30 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=powerpc64le-ibm-linux-gnu -std=c++11 -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY1 %s
31 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=45 -x c++ -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-llvm-bc %s -o %t-x86-host.bc
32 // RUN: %clang_cc1 -verify -fopenmp-simd -fopenmp-version=45 -x c++ -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -o - | FileCheck --check-prefix SIMD-ONLY1 %s
33 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -std=c++11 -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -emit-pch -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -o %t %s
34 // RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -triple i386-unknown-unknown -fopenmp-targets=i386-pc-linux-gnu -std=c++11 -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY1 %s
35 // SIMD-ONLY1-NOT: {{__kmpc|__tgt}}
36 
37 // expected-no-diagnostics
38 #ifndef HEADER
39 #define HEADER
40 
41 // CHECK-DAG: %struct.ident_t = type { i32, i32, i32, i32, i8* }
42 // CHECK-DAG: [[STR:@.+]] = private unnamed_addr constant [23 x i8] c";unknown;unknown;0;0;;\00"
43 // CHECK-DAG: [[DEF_LOC:@.+]] = private unnamed_addr global %struct.ident_t { i32 0, i32 2, i32 0, i32 0, i8* getelementptr inbounds ([23 x i8], [23 x i8]* [[STR]], i32 0, i32 0) }
44 
45 // CHECK-DAG: [[S1:%.+]] = type { double }
46 // CHECK-DAG: [[ENTTY:%.+]] = type { i8*, i8*, i[[SZ:32|64]], i32, i32 }
47 
48 // TCHECK: [[ENTTY:%.+]] = type { i8*, i8*, i{{32|64}}, i32, i32 }
49 
50 // We have 6 target regions
51 
52 // CHECK-DAG: @{{.*}} = weak constant i8 0
53 // CHECK-DAG: @{{.*}} = weak constant i8 0
54 // CHECK-DAG: @{{.*}} = weak constant i8 0
55 // CHECK-DAG: @{{.*}} = weak constant i8 0
56 // CHECK-DAG: @{{.*}} = weak constant i8 0
57 // CHECK-DAG: @{{.*}} = weak constant i8 0
58 
59 // TCHECK: @{{.+}} = weak constant [[ENTTY]]
60 // TCHECK: @{{.+}} = weak constant [[ENTTY]]
61 // TCHECK: @{{.+}} = weak constant [[ENTTY]]
62 // TCHECK: @{{.+}} = weak constant [[ENTTY]]
63 // TCHECK: @{{.+}} = weak constant [[ENTTY]]
64 // TCHECK: @{{.+}} = weak constant [[ENTTY]]
65 
66 // Check that the target registration function is registered as a Ctor.
67 // CHECK: appending global [1 x { i32, void ()*, i8* }] [{ i32, void ()*, i8* } { i32 0, void ()* @.omp_offloading.requires_reg, i8* null }]
68 
69 
70 template<typename tx>
71 tx ftemplate(int n) {
72   tx a = 0;
73 
74   #pragma omp target parallel num_threads(tx(20))
75   {
76   }
77 
78   short b = 1;
79   #pragma omp target parallel num_threads(b)
80   {
81     a += b;
82   }
83 
84   return a;
85 }
86 
87 static
88 int fstatic(int n) {
89 
90   #pragma omp target parallel num_threads(n)
91   {
92   }
93 
94   #pragma omp target parallel num_threads(32+n)
95   {
96   }
97 
98   return n+1;
99 }
100 
101 struct S1 {
102   double a;
103 
104   int r1(int n){
105     int b = 1;
106 
107     #pragma omp target parallel num_threads(n-b)
108     {
109       this->a = (double)b + 1.5;
110     }
111 
112     #pragma omp target parallel num_threads(1024)
113     {
114       this->a = 2.5;
115     }
116 
117     return (int)a;
118   }
119 };
120 
121 // CHECK: define {{.*}}@{{.*}}bar{{.*}}
122 int bar(int n){
123   int a = 0;
124 
125   S1 S;
126   // CHECK: call {{.*}}i32 [[FS1:@.+]]([[S1]]* {{.*}}, i32 {{.*}})
127   a += S.r1(n);
128 
129   // CHECK: call {{.*}}i32 [[FSTATIC:@.+]](i32 {{.*}})
130   a += fstatic(n);
131 
132   // CHECK: call {{.*}}i32 [[FTEMPLATE:@.+]](i32 {{.*}})
133   a += ftemplate<int>(n);
134 
135   return a;
136 }
137 
138 
139 
140 //
141 // CHECK: define {{.*}}[[FS1]]([[S1]]* {{%.+}}, i32 {{[^%]*}}[[PARM:%.+]])
142 //
143 // CHECK-DAG:   store i32 [[PARM]], i32* [[N_ADDR:%.+]], align
144 // CHECK:       store i32 1, i32* [[B:%.+]], align
145 // CHECK:       [[NV:%.+]] = load i32, i32* [[N_ADDR]], align
146 // CHECK:       [[BV:%.+]] = load i32, i32* [[B]], align
147 // CHECK:       [[SUB:%.+]] = sub nsw i32 [[NV]], [[BV]]
148 // CHECK:       store i32 [[SUB]], i32* [[CAPE_ADDR:%.+]], align
149 // CHECK:       [[CEV:%.+]] = load i32, i32* [[CAPE_ADDR]], align
150 // CHECK-64:    [[CONV:%.+]] = bitcast i[[SZ]]* [[CAPEC_ADDR:%.+]] to i32*
151 // CHECK-64:    store i32 [[CEV]], i32* [[CONV]], align
152 // CHECK-32:    store i32 [[CEV]], i32* [[CAPEC_ADDR:%.+]], align
153 // CHECK:       [[ARG:%.+]] = load i[[SZ]], i[[SZ]]* [[CAPEC_ADDR]], align
154 // CHECK:       [[THREADS:%.+]] = load i32, i32* [[CAPE_ADDR]], align
155 //
156 // CHECK-DAG:   [[RET:%.+]] = call i32 @__tgt_target_teams(i64 -1, i8* @{{[^,]+}}, i32 4, {{.*}}, i32 1, i32 [[THREADS]])
157 // CHECK:       [[ERROR:%.+]] = icmp ne i32 [[RET]], 0
158 // CHECK:       br i1 [[ERROR]], label %[[FAIL:.+]], label %[[END:[^,]+]]
159 //
160 // CHECK:       [[FAIL]]
161 // CHECK:       call void [[HVT1:@.+]]([[S1]]* {{%.+}}, i[[SZ]] {{%.+}}, i[[SZ]] [[ARG]])
162 // CHECK:       br label {{%?}}[[END]]
163 // CHECK:       [[END]]
164 //
165 //
166 //
167 // CHECK-DAG:   [[RET:%.+]] = call i32 @__tgt_target_teams(i64 -1, i8* @{{[^,]+}}, i32 2, {{.+}}, i32 1, i32 1024)
168 // CHECK:       [[ERROR:%.+]] = icmp ne i32 [[RET]], 0
169 // CHECK:       br i1 [[ERROR]], label %[[FAIL:.+]], label %[[END:[^,]+]]
170 //
171 // CHECK:       [[FAIL]]
172 // CHECK:       call void [[HVT2:@.+]]([[S1]]* {{[^,]+}})
173 // CHECK:       br label {{%?}}[[END]]
174 // CHECK:       [[END]]
175 //
176 
177 
178 
179 
180 
181 
182 //
183 // CHECK: define {{.*}}[[FSTATIC]](i32 {{[^%]*}}[[PARM:%.+]])
184 //
185 // CHECK-DAG:   store i32 [[PARM]], i32* [[N_ADDR:%.+]], align
186 // CHECK:       [[NV:%.+]] = load i32, i32* [[N_ADDR]], align
187 // CHECK:       store i32 [[NV]], i32* [[CAPE_ADDR:%.+]], align
188 // CHECK:       [[CEV:%.+]] = load i32, i32* [[CAPE_ADDR]], align
189 // CHECK-64:    [[CONV:%.+]] = bitcast i[[SZ]]* [[CAPEC_ADDR:%.+]] to i32*
190 // CHECK-64:    store i32 [[CEV]], i32* [[CONV]], align
191 // CHECK-32:    store i32 [[CEV]], i32* [[CAPEC_ADDR:%.+]], align
192 // CHECK:       [[ARG:%.+]] = load i[[SZ]], i[[SZ]]* [[CAPEC_ADDR]], align
193 // CHECK:       [[THREADS:%.+]] = load i32, i32* [[CAPE_ADDR]], align
194 //
195 // CHECK-DAG:   [[RET:%.+]] = call i32 @__tgt_target_teams(i64 -1, i8* @{{[^,]+}}, i32 1, {{.*}}, i32 1, i32 [[THREADS]])
196 // CHECK:       [[ERROR:%.+]] = icmp ne i32 [[RET]], 0
197 // CHECK:       br i1 [[ERROR]], label %[[FAIL:.+]], label %[[END:[^,]+]]
198 //
199 // CHECK:       [[FAIL]]
200 // CHECK:       call void [[HVT3:@.+]](i[[SZ]] [[ARG]])
201 // CHECK:       br label {{%?}}[[END]]
202 // CHECK:       [[END]]
203 //
204 //
205 //
206 // CHECK:       [[NV:%.+]] = load i32, i32* [[N_ADDR]], align
207 // CHECK:       [[ADD:%.+]] = add nsw i32 32, [[NV]]
208 // CHECK:       store i32 [[ADD]], i32* [[CAPE_ADDR:%.+]], align
209 // CHECK:       [[CEV:%.+]] = load i32, i32* [[CAPE_ADDR]], align
210 // CHECK-64:    [[CONV:%.+]] = bitcast i[[SZ]]* [[CAPEC_ADDR:%.+]] to i32*
211 // CHECK-64:    store i32 [[CEV]], i32* [[CONV]], align
212 // CHECK-32:    store i32 [[CEV]], i32* [[CAPEC_ADDR:%.+]], align
213 // CHECK:       [[ARG:%.+]] = load i[[SZ]], i[[SZ]]* [[CAPEC_ADDR]], align
214 // CHECK:       [[THREADS:%.+]] = load i32, i32* [[CAPE_ADDR]], align
215 //
216 // CHECK-DAG:   [[RET:%.+]] = call i32 @__tgt_target_teams(i64 -1, i8* @{{[^,]+}}, i32 1, {{.*}}, i32 1, i32 [[THREADS]])
217 // CHECK:       [[ERROR:%.+]] = icmp ne i32 [[RET]], 0
218 // CHECK:       br i1 [[ERROR]], label %[[FAIL:.+]], label %[[END:[^,]+]]
219 //
220 // CHECK:       [[FAIL]]
221 // CHECK:       call void [[HVT4:@.+]](i[[SZ]] [[ARG]])
222 // CHECK:       br label {{%?}}[[END]]
223 // CHECK:       [[END]]
224 //
225 
226 
227 
228 
229 
230 
231 //
232 // CHECK: define {{.*}}[[FTEMPLATE]]
233 //
234 // CHECK-DAG:   [[RET:%.+]] = call i32 @__tgt_target_teams(i64 -1, i8* @{{[^,]+}}, i32 0, {{.*}}, i32 1, i32 20)
235 // CHECK-NEXT:  [[ERROR:%.+]] = icmp ne i32 [[RET]], 0
236 // CHECK-NEXT:  br i1 [[ERROR]], label %[[FAIL:.+]], label %[[END:[^,]+]]
237 //
238 // CHECK:       [[FAIL]]
239 // CHECK:       call void [[HVT5:@.+]]()
240 // CHECK:       br label {{%?}}[[END]]
241 //
242 // CHECK:       [[END]]
243 //
244 //
245 //
246 // CHECK:       store i16 1, i16* [[B:%.+]], align
247 // CHECK:       [[BV:%.+]] = load i16, i16* [[B]], align
248 // CHECK:       store i16 [[BV]], i16* [[CAPE_ADDR:%.+]], align
249 // CHECK:       [[CEV:%.+]] = load i16, i16* [[CAPE_ADDR]], align
250 // CHECK:       [[CONV:%.+]] = bitcast i[[SZ]]* [[CAPEC_ADDR:%.+]] to i16*
251 // CHECK:       store i16 [[CEV]], i16* [[CONV]], align
252 // CHECK:       [[ARG:%.+]] = load i[[SZ]], i[[SZ]]* [[CAPEC_ADDR]], align
253 // CHECK:       [[T:%.+]] = load i16, i16* [[CAPE_ADDR]], align
254 // CHECK:       [[THREADS:%.+]] = zext i16 [[T]] to i32
255 //
256 // CHECK-DAG:   [[RET:%.+]] = call i32 @__tgt_target_teams(i64 -1, i8* @{{[^,]+}}, i32 3, {{.*}}, i32 1, i32 [[THREADS]])
257 // CHECK:       [[ERROR:%.+]] = icmp ne i32 [[RET]], 0
258 // CHECK:       br i1 [[ERROR]], label %[[FAIL:.+]], label %[[END:[^,]+]]
259 //
260 // CHECK:       [[FAIL]]
261 // CHECK:       call void [[HVT6:@.+]](i[[SZ]] {{%.+}}, i[[SZ]] {{%.+}}, i[[SZ]] [[ARG]])
262 // CHECK:       br label {{%?}}[[END]]
263 // CHECK:       [[END]]
264 //
265 
266 
267 
268 
269 
270 
271 // Check that the offloading functions are emitted and that the parallel function
272 // is appropriately guarded.
273 
274 // CHECK:       define internal void [[HVT1]]([[S1]]* {{%.+}}, i[[SZ]] [[PARM1:%.+]], i[[SZ]] [[PARM2:%.+]])
275 // CHECK-DAG:   store i[[SZ]] [[PARM2]], i[[SZ]]* [[CAPE_ADDR:%.+]], align
276 // CHECK-64:    [[CONV:%.+]] = bitcast i[[SZ]]* [[CAPE_ADDR]] to i32*
277 // CHECK-64:    [[NT:%.+]] = load i32, i32* [[CONV]], align
278 // CHECK-32:    [[NT:%.+]] = load i32, i32* [[CAPE_ADDR]], align
279 // CHECK:       call void @__kmpc_push_num_threads(%struct.ident_t* {{[^,]+}}, i32 {{[^,]+}}, i32 [[NT]])
280 // CHECK:       call {{.*}}void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* [[DEF_LOC]], i32 2,
281 //
282 //
283 
284 
285 // CHECK:       define internal void [[HVT2]]([[S1]]* {{%.+}})
286 // CHECK:       call void @__kmpc_push_num_threads(%struct.ident_t* {{[^,]+}}, i32 {{[^,]+}}, i32 1024)
287 // CHECK:       call {{.*}}void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* [[DEF_LOC]], i32 1,
288 //
289 //
290 
291 
292 
293 
294 
295 
296 
297 
298 // CHECK:       define internal void [[HVT3]](i[[SZ]] [[PARM:%.+]])
299 // CHECK-DAG:   store i[[SZ]] [[PARM]], i[[SZ]]* [[CAPE_ADDR:%.+]], align
300 // CHECK-64:    [[CONV:%.+]] = bitcast i[[SZ]]* [[CAPE_ADDR]] to i32*
301 // CHECK-64:    [[NT:%.+]] = load i32, i32* [[CONV]], align
302 // CHECK-32:    [[NT:%.+]] = load i32, i32* [[CAPE_ADDR]], align
303 // CHECK:       call void @__kmpc_push_num_threads(%struct.ident_t* {{[^,]+}}, i32 {{[^,]+}}, i32 [[NT]])
304 // CHECK:       call {{.*}}void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* [[DEF_LOC]], i32 0,
305 //
306 //
307 // CHECK:       define internal void [[HVT4]](i[[SZ]] [[PARM:%.+]])
308 // CHECK-DAG:   store i[[SZ]] [[PARM]], i[[SZ]]* [[CAPE_ADDR:%.+]], align
309 // CHECK-64:    [[CONV:%.+]] = bitcast i[[SZ]]* [[CAPE_ADDR]] to i32*
310 // CHECK-64:    [[NT:%.+]] = load i32, i32* [[CONV]], align
311 // CHECK-32:    [[NT:%.+]] = load i32, i32* [[CAPE_ADDR]], align
312 // CHECK:       call void @__kmpc_push_num_threads(%struct.ident_t* {{[^,]+}}, i32 {{[^,]+}}, i32 [[NT]])
313 // CHECK:       call {{.*}}void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* [[DEF_LOC]], i32 0,
314 //
315 //
316 
317 
318 
319 
320 
321 // CHECK:       define internal void [[HVT5]](
322 // CHECK:       call void @__kmpc_push_num_threads(%struct.ident_t* {{[^,]+}}, i32 {{[^,]+}}, i32 20)
323 // CHECK:       call {{.*}}void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* [[DEF_LOC]], i32 0,
324 //
325 //
326 
327 
328 // CHECK:       define internal void [[HVT6]](i[[SZ]] [[PARM1:%.+]], i[[SZ]] [[PARM2:%.+]], i[[SZ]] [[PARM3:%.+]])
329 // CHECK-DAG:   store i[[SZ]] [[PARM3]], i[[SZ]]* [[CAPE_ADDR:%.+]], align
330 // CHECK:       [[CONV:%.+]] = bitcast i[[SZ]]* [[CAPE_ADDR]] to i16*
331 // CHECK:       [[T:%.+]] = load i16, i16* [[CONV]], align
332 // CHECK:       [[NT:%.+]] = sext i16 [[T]] to i32
333 // CHECK:       call void @__kmpc_push_num_threads(%struct.ident_t* {{[^,]+}}, i32 {{[^,]+}}, i32 [[NT]])
334 // CHECK:       call {{.*}}void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* [[DEF_LOC]], i32 2,
335 //
336 //
337 
338 
339 
340 #endif
341