1 // NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py UTC_ARGS: --function-signature --include-generated-funcs
2 // RUN: %clang_cc1 -no-opaque-pointers -fopenmp-enable-irbuilder -verify -fopenmp -fopenmp-version=45 -x c++ -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s
3 // expected-no-diagnostics
4
5 #ifndef HEADER
6 #define HEADER
7
8 // CHECK-LABEL: define {{.*}}@workshareloop_unsigned_down(
9 // CHECK-NEXT: [[ENTRY:.*]]:
10 // CHECK-NEXT: %[[A_ADDR:.+]] = alloca float*, align 8
11 // CHECK-NEXT: %[[I:.+]] = alloca i32, align 4
12 // CHECK-NEXT: %[[AGG_CAPTURED:.+]] = alloca %struct.anon, align 8
13 // CHECK-NEXT: %[[AGG_CAPTURED1:.+]] = alloca %struct.anon.0, align 4
14 // CHECK-NEXT: %[[DOTCOUNT_ADDR:.+]] = alloca i32, align 4
15 // CHECK-NEXT: %[[P_LASTITER:.+]] = alloca i32, align 4
16 // CHECK-NEXT: %[[P_LOWERBOUND:.+]] = alloca i32, align 4
17 // CHECK-NEXT: %[[P_UPPERBOUND:.+]] = alloca i32, align 4
18 // CHECK-NEXT: %[[P_STRIDE:.+]] = alloca i32, align 4
19 // CHECK-NEXT: store float* %[[A:.+]], float** %[[A_ADDR]], align 8
20 // CHECK-NEXT: store i32 32000000, i32* %[[I]], align 4
21 // CHECK-NEXT: %[[TMP0:.+]] = getelementptr inbounds %struct.anon, %struct.anon* %[[AGG_CAPTURED]], i32 0, i32 0
22 // CHECK-NEXT: store i32* %[[I]], i32** %[[TMP0]], align 8
23 // CHECK-NEXT: %[[TMP1:.+]] = getelementptr inbounds %struct.anon.0, %struct.anon.0* %[[AGG_CAPTURED1]], i32 0, i32 0
24 // CHECK-NEXT: %[[TMP2:.+]] = load i32, i32* %[[I]], align 4
25 // CHECK-NEXT: store i32 %[[TMP2]], i32* %[[TMP1]], align 4
26 // CHECK-NEXT: call void @__captured_stmt(i32* %[[DOTCOUNT_ADDR]], %struct.anon* %[[AGG_CAPTURED]])
27 // CHECK-NEXT: %[[DOTCOUNT:.+]] = load i32, i32* %[[DOTCOUNT_ADDR]], align 4
28 // CHECK-NEXT: br label %[[OMP_LOOP_PREHEADER:.+]]
29 // CHECK-EMPTY:
30 // CHECK-NEXT: [[OMP_LOOP_PREHEADER]]:
31 // CHECK-NEXT: store i32 0, i32* %[[P_LOWERBOUND]], align 4
32 // CHECK-NEXT: %[[TMP3:.+]] = sub i32 %[[DOTCOUNT]], 1
33 // CHECK-NEXT: store i32 %[[TMP3]], i32* %[[P_UPPERBOUND]], align 4
34 // CHECK-NEXT: store i32 1, i32* %[[P_STRIDE]], align 4
35 // CHECK-NEXT: %[[OMP_GLOBAL_THREAD_NUM:.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @1)
36 // CHECK-NEXT: call void @__kmpc_for_static_init_4u(%struct.ident_t* @1, i32 %[[OMP_GLOBAL_THREAD_NUM]], i32 34, i32* %[[P_LASTITER]], i32* %[[P_LOWERBOUND]], i32* %[[P_UPPERBOUND]], i32* %[[P_STRIDE]], i32 1, i32 0)
37 // CHECK-NEXT: %[[TMP4:.+]] = load i32, i32* %[[P_LOWERBOUND]], align 4
38 // CHECK-NEXT: %[[TMP5:.+]] = load i32, i32* %[[P_UPPERBOUND]], align 4
39 // CHECK-NEXT: %[[TMP6:.+]] = sub i32 %[[TMP5]], %[[TMP4]]
40 // CHECK-NEXT: %[[TMP7:.+]] = add i32 %[[TMP6]], 1
41 // CHECK-NEXT: br label %[[OMP_LOOP_HEADER:.+]]
42 // CHECK-EMPTY:
43 // CHECK-NEXT: [[OMP_LOOP_HEADER]]:
44 // CHECK-NEXT: %[[OMP_LOOP_IV:.+]] = phi i32 [ 0, %[[OMP_LOOP_PREHEADER]] ], [ %[[OMP_LOOP_NEXT:.+]], %[[OMP_LOOP_INC:.+]] ]
45 // CHECK-NEXT: br label %[[OMP_LOOP_COND:.+]]
46 // CHECK-EMPTY:
47 // CHECK-NEXT: [[OMP_LOOP_COND]]:
48 // CHECK-NEXT: %[[OMP_LOOP_CMP:.+]] = icmp ult i32 %[[OMP_LOOP_IV]], %[[TMP7]]
49 // CHECK-NEXT: br i1 %[[OMP_LOOP_CMP]], label %[[OMP_LOOP_BODY:.+]], label %[[OMP_LOOP_EXIT:.+]]
50 // CHECK-EMPTY:
51 // CHECK-NEXT: [[OMP_LOOP_BODY]]:
52 // CHECK-NEXT: %[[TMP8:.+]] = add i32 %[[OMP_LOOP_IV]], %[[TMP4]]
53 // CHECK-NEXT: call void @__captured_stmt.1(i32* %[[I]], i32 %[[TMP8]], %struct.anon.0* %[[AGG_CAPTURED1]])
54 // CHECK-NEXT: %[[TMP9:.+]] = load i32, i32* %[[I]], align 4
55 // CHECK-NEXT: %[[CONV:.+]] = uitofp i32 %[[TMP9]] to float
56 // CHECK-NEXT: %[[TMP10:.+]] = load float*, float** %[[A_ADDR]], align 8
57 // CHECK-NEXT: %[[TMP11:.+]] = load i32, i32* %[[I]], align 4
58 // CHECK-NEXT: %[[IDXPROM:.+]] = zext i32 %[[TMP11]] to i64
59 // CHECK-NEXT: %[[ARRAYIDX:.+]] = getelementptr inbounds float, float* %[[TMP10]], i64 %[[IDXPROM]]
60 // CHECK-NEXT: store float %[[CONV]], float* %[[ARRAYIDX]], align 4
61 // CHECK-NEXT: br label %[[OMP_LOOP_INC]]
62 // CHECK-EMPTY:
63 // CHECK-NEXT: [[OMP_LOOP_INC]]:
64 // CHECK-NEXT: %[[OMP_LOOP_NEXT]] = add nuw i32 %[[OMP_LOOP_IV]], 1
65 // CHECK-NEXT: br label %[[OMP_LOOP_HEADER]]
66 // CHECK-EMPTY:
67 // CHECK-NEXT: [[OMP_LOOP_EXIT]]:
68 // CHECK-NEXT: call void @__kmpc_for_static_fini(%struct.ident_t* @1, i32 %[[OMP_GLOBAL_THREAD_NUM]])
69 // CHECK-NEXT: %[[OMP_GLOBAL_THREAD_NUM2:.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @1)
70 // CHECK-NEXT: call void @__kmpc_barrier(%struct.ident_t* @2, i32 %[[OMP_GLOBAL_THREAD_NUM2]])
71 // CHECK-NEXT: br label %[[OMP_LOOP_AFTER:.+]]
72 // CHECK-EMPTY:
73 // CHECK-NEXT: [[OMP_LOOP_AFTER]]:
74 // CHECK-NEXT: ret void
75 // CHECK-NEXT: }
76
workshareloop_unsigned_down(float * a)77 extern "C" void workshareloop_unsigned_down(float *a) {
78 #pragma omp for
79 for (unsigned i = 32000000; i > 33; i -= 7) {
80 a[i] = i;
81 }
82 }
83
84 #endif // HEADER
85 //
86 //
87 //
88 //
89 //
90
91 // CHECK-LABEL: define {{.*}}@__captured_stmt(
92 // CHECK-NEXT: [[ENTRY:.*]]:
93 // CHECK-NEXT: %[[DISTANCE_ADDR:.+]] = alloca i32*, align 8
94 // CHECK-NEXT: %[[__CONTEXT_ADDR:.+]] = alloca %struct.anon*, align 8
95 // CHECK-NEXT: %[[DOTSTART:.+]] = alloca i32, align 4
96 // CHECK-NEXT: %[[DOTSTOP:.+]] = alloca i32, align 4
97 // CHECK-NEXT: %[[DOTSTEP:.+]] = alloca i32, align 4
98 // CHECK-NEXT: store i32* %[[DISTANCE:.+]], i32** %[[DISTANCE_ADDR]], align 8
99 // CHECK-NEXT: store %struct.anon* %[[__CONTEXT:.+]], %struct.anon** %[[__CONTEXT_ADDR]], align 8
100 // CHECK-NEXT: %[[TMP0:.+]] = load %struct.anon*, %struct.anon** %[[__CONTEXT_ADDR]], align 8
101 // CHECK-NEXT: %[[TMP1:.+]] = getelementptr inbounds %struct.anon, %struct.anon* %[[TMP0]], i32 0, i32 0
102 // CHECK-NEXT: %[[TMP2:.+]] = load i32*, i32** %[[TMP1]], align 8
103 // CHECK-NEXT: %[[TMP3:.+]] = load i32, i32* %[[TMP2]], align 4
104 // CHECK-NEXT: store i32 %[[TMP3]], i32* %[[DOTSTART]], align 4
105 // CHECK-NEXT: store i32 33, i32* %[[DOTSTOP]], align 4
106 // CHECK-NEXT: store i32 -7, i32* %[[DOTSTEP]], align 4
107 // CHECK-NEXT: %[[TMP4:.+]] = load i32, i32* %[[DOTSTART]], align 4
108 // CHECK-NEXT: %[[TMP5:.+]] = load i32, i32* %[[DOTSTOP]], align 4
109 // CHECK-NEXT: %[[CMP:.+]] = icmp ugt i32 %[[TMP4]], %[[TMP5]]
110 // CHECK-NEXT: br i1 %[[CMP]], label %[[COND_TRUE:.+]], label %[[COND_FALSE:.+]]
111 // CHECK-EMPTY:
112 // CHECK-NEXT: [[COND_TRUE]]:
113 // CHECK-NEXT: %[[TMP6:.+]] = load i32, i32* %[[DOTSTART]], align 4
114 // CHECK-NEXT: %[[TMP7:.+]] = load i32, i32* %[[DOTSTOP]], align 4
115 // CHECK-NEXT: %[[SUB:.+]] = sub i32 %[[TMP6]], %[[TMP7]]
116 // CHECK-NEXT: %[[TMP8:.+]] = load i32, i32* %[[DOTSTEP]], align 4
117 // CHECK-NEXT: %[[SUB1:.+]] = sub nsw i32 0, %[[TMP8]]
118 // CHECK-NEXT: %[[SUB2:.+]] = sub i32 %[[SUB1]], 1
119 // CHECK-NEXT: %[[ADD:.+]] = add i32 %[[SUB]], %[[SUB2]]
120 // CHECK-NEXT: %[[TMP9:.+]] = load i32, i32* %[[DOTSTEP]], align 4
121 // CHECK-NEXT: %[[SUB3:.+]] = sub nsw i32 0, %[[TMP9]]
122 // CHECK-NEXT: %[[DIV:.+]] = udiv i32 %[[ADD]], %[[SUB3]]
123 // CHECK-NEXT: br label %[[COND_END:.+]]
124 // CHECK-EMPTY:
125 // CHECK-NEXT: [[COND_FALSE]]:
126 // CHECK-NEXT: br label %[[COND_END]]
127 // CHECK-EMPTY:
128 // CHECK-NEXT: [[COND_END]]:
129 // CHECK-NEXT: %[[COND:.+]] = phi i32 [ %[[DIV]], %[[COND_TRUE]] ], [ 0, %[[COND_FALSE]] ]
130 // CHECK-NEXT: %[[TMP10:.+]] = load i32*, i32** %[[DISTANCE_ADDR]], align 8
131 // CHECK-NEXT: store i32 %[[COND]], i32* %[[TMP10]], align 4
132 // CHECK-NEXT: ret void
133 // CHECK-NEXT: }
134
135
136 // CHECK-LABEL: define {{.*}}@__captured_stmt.1(
137 // CHECK-NEXT: [[ENTRY:.*]]:
138 // CHECK-NEXT: %[[LOOPVAR_ADDR:.+]] = alloca i32*, align 8
139 // CHECK-NEXT: %[[LOGICAL_ADDR:.+]] = alloca i32, align 4
140 // CHECK-NEXT: %[[__CONTEXT_ADDR:.+]] = alloca %struct.anon.0*, align 8
141 // CHECK-NEXT: store i32* %[[LOOPVAR:.+]], i32** %[[LOOPVAR_ADDR]], align 8
142 // CHECK-NEXT: store i32 %[[LOGICAL:.+]], i32* %[[LOGICAL_ADDR]], align 4
143 // CHECK-NEXT: store %struct.anon.0* %[[__CONTEXT:.+]], %struct.anon.0** %[[__CONTEXT_ADDR]], align 8
144 // CHECK-NEXT: %[[TMP0:.+]] = load %struct.anon.0*, %struct.anon.0** %[[__CONTEXT_ADDR]], align 8
145 // CHECK-NEXT: %[[TMP1:.+]] = getelementptr inbounds %struct.anon.0, %struct.anon.0* %[[TMP0]], i32 0, i32 0
146 // CHECK-NEXT: %[[TMP2:.+]] = load i32, i32* %[[TMP1]], align 4
147 // CHECK-NEXT: %[[TMP3:.+]] = load i32, i32* %[[LOGICAL_ADDR]], align 4
148 // CHECK-NEXT: %[[MUL:.+]] = mul i32 -7, %[[TMP3]]
149 // CHECK-NEXT: %[[ADD:.+]] = add i32 %[[TMP2]], %[[MUL]]
150 // CHECK-NEXT: %[[TMP4:.+]] = load i32*, i32** %[[LOOPVAR_ADDR]], align 8
151 // CHECK-NEXT: store i32 %[[ADD]], i32* %[[TMP4]], align 4
152 // CHECK-NEXT: ret void
153 // CHECK-NEXT: }
154
155
156 // CHECK: ![[META0:[0-9]+]] = !{i32 1, !"wchar_size", i32 4}
157 // CHECK: ![[META1:[0-9]+]] = !{i32 7, !"openmp", i32 45}
158 // CHECK: ![[META2:[0-9]+]] =
159