1 | // RUN: %clang_cc1 -verify -fopenmp -x c++ -triple x86_64-apple-darwin10 -emit-llvm %s -o - | FileCheck %s |
2 | // RUN: %clang_cc1 -fopenmp -x c++ -std=c++11 -triple x86_64-apple-darwin10 -emit-pch -o %t %s |
3 | // RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s |
4 | // RUN: %clang_cc1 -verify -fopenmp -x c++ -std=c++11 -DLAMBDA -triple x86_64-apple-darwin10 -emit-llvm %s -o - | FileCheck -check-prefix=LAMBDA %s |
5 | // RUN: %clang_cc1 -verify -fopenmp -x c++ -fblocks -DBLOCKS -triple x86_64-apple-darwin10 -emit-llvm %s -o - | FileCheck -check-prefix=BLOCKS %s |
6 | // RUN: %clang_cc1 -verify -fopenmp -x c++ -std=c++11 -DARRAY -triple x86_64-apple-darwin10 -emit-llvm %s -o - | FileCheck -check-prefix=ARRAY %s |
7 | |
8 | // RUN: %clang_cc1 -verify -fopenmp-simd -x c++ -triple x86_64-apple-darwin10 -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s |
9 | // RUN: %clang_cc1 -fopenmp-simd -x c++ -std=c++11 -triple x86_64-apple-darwin10 -emit-pch -o %t %s |
10 | // RUN: %clang_cc1 -fopenmp-simd -x c++ -triple x86_64-apple-darwin10 -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY0 %s |
11 | // RUN: %clang_cc1 -verify -fopenmp-simd -x c++ -std=c++11 -DLAMBDA -triple x86_64-apple-darwin10 -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s |
12 | // RUN: %clang_cc1 -verify -fopenmp-simd -x c++ -fblocks -DBLOCKS -triple x86_64-apple-darwin10 -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s |
13 | // RUN: %clang_cc1 -verify -fopenmp-simd -x c++ -std=c++11 -DARRAY -triple x86_64-apple-darwin10 -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s |
14 | // SIMD-ONLY0-NOT: {{__kmpc|__tgt}} |
15 | // expected-no-diagnostics |
16 | // It doesn't pass on win32. Investigating. |
17 | // REQUIRES: shell |
18 | |
// When ARRAY is not defined, the S/tmain/main part of the test is compiled;
// otherwise the array_func part after the matching #else is compiled instead.
19 | #ifndef ARRAY |
// HEADER guard: the file is also used as its own precompiled header in the
// -emit-pch / -include-pch RUN lines, so the body must only be seen once.
20 | #ifndef HEADER |
21 | #define HEADER |
22 | |
// Class template used as the non-trivial type of privatized variables.
// It wraps a single value of type T and has user-provided constructors and a
// user-provided destructor.
23 | template <class T> |
24 | struct S { |
// The only data member.
25 | T f; |
// Converting constructor: stores the argument in f.
26 | S(T a) : f(a) {} |
// Default constructor: value-initializes f.
27 | S() : f() {} |
// Conversion to T: returns a value-initialized T and does not read f.
28 | operator T() { return T(); } |
// User-provided destructor with an empty body.
29 | ~S() {} |
30 | }; |
31 | |
// Global written from the task regions in main (g = 1, g = 2, g += 1).
32 | volatile double g; |
33 | |
34 | // CHECK-DAG: [[KMP_TASK_T_TY:%.+]] = type { i8*, i32 (i32, i8*)*, i32, %union{{.+}}, %union{{.+}}, i64, i64, i64, i32, i8* } |
35 | // CHECK-DAG: [[S_DOUBLE_TY:%.+]] = type { double } |
36 | // CHECK-DAG: [[CAP_MAIN_TY:%.+]] = type { i8 } |
37 | // CHECK-DAG: [[PRIVATES_MAIN_TY:%.+]] = type {{.?}}{ [2 x [[S_DOUBLE_TY]]], [[S_DOUBLE_TY]], i32, [2 x i32] |
38 | // CHECK-DAG: [[KMP_TASK_MAIN_TY:%.+]] = type { [[KMP_TASK_T_TY]], [[PRIVATES_MAIN_TY]] } |
39 | // CHECK-DAG: [[S_INT_TY:%.+]] = type { i32 } |
40 | // CHECK-DAG: [[CAP_TMAIN_TY:%.+]] = type { i8 } |
41 | // CHECK-DAG: [[PRIVATES_TMAIN_TY:%.+]] = type { i32, [2 x i32], [2 x [[S_INT_TY]]], [[S_INT_TY]], [104 x i8] } |
42 | // CHECK-DAG: [[KMP_TASK_TMAIN_TY:%.+]] = type { [[KMP_TASK_T_TY]], [{{[0-9]+}} x i8], [[PRIVATES_TMAIN_TY]] } |
// Template counterpart of the default branch of main; main instantiates it as
// tmain<int>. It declares a set of locals and privatizes them on a
// `taskloop simd` construct. Returns a value-initialized T.
43 | template <typename T> |
44 | T tmain() { |
45 | S<T> test; |
// t_var is over-aligned to 128 bytes.
46 | T t_var __attribute__((aligned(128))) = T(); |
47 | T vec[] = {1, 2}; |
48 | S<T> s_arr[] = {1, 2}; |
49 | S<T> var(3); |
// s_arr and var each appear twice in the private clause
// (presumably to exercise duplicate list items - confirm).
50 | #pragma omp taskloop simd private(t_var, vec, s_arr, s_arr, var, var) |
51 | for (int i = 0; i < 10; ++i) { |
// Use every privatized variable inside the loop body.
52 | vec[0] = t_var; |
53 | s_arr[0] = var; |
54 | } |
55 | return T(); |
56 | } |
57 | |
// Test driver. Exactly one of three bodies is compiled, selected by the
// LAMBDA and BLOCKS macros; each body contains a `taskloop simd` loop with a
// `private` clause.
58 | int main() { |
// Static local that is privatized in every variant below.
59 | static int sivar; |
60 | #ifdef LAMBDA |
// Lambda variant: the taskloop simd region sits inside an outer lambda, and
// the loop body calls an inner lambda that writes g and sivar.
61 | // LAMBDA: [[G:@.+]] = global double |
62 | // LAMBDA-LABEL: @main |
63 | // LAMBDA: call{{( x86_thiscallcc)?}} void [[OUTER_LAMBDA:@.+]]( |
64 | [&]() { |
65 | // LAMBDA: define{{.*}} internal{{.*}} void [[OUTER_LAMBDA]]( |
66 | // LAMBDA: [[RES:%.+]] = call i8* @__kmpc_omp_task_alloc(%{{[^ ]+}} @{{[^,]+}}, i32 %{{[^,]+}}, i32 1, i64 96, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, %{{[^*]+}}*)* [[TASK_ENTRY:@[^ ]+]] to i32 (i32, i8*)*)) |
67 | // LAMBDA: [[PRIVATES:%.+]] = getelementptr inbounds %{{.+}}, %{{.+}}* %{{.+}}, i{{.+}} 0, i{{.+}} 1 |
68 | // LAMBDA: call void @__kmpc_taskloop(%{{.+}}* @{{.+}}, i32 %{{.+}}, i8* [[RES]], i32 1, i64* %{{.+}}, i64* %{{.+}}, i64 %{{.+}}, i32 1, i32 0, i64 0, i8* null) |
69 | // LAMBDA: ret |
70 | #pragma omp taskloop simd private(g, sivar) |
71 | for (int i = 0; i < 10; ++i) { |
72 | // LAMBDA: define {{.+}} void [[INNER_LAMBDA:@.+]](%{{.+}}* [[ARG_PTR:%.+]]) |
73 | // LAMBDA: store %{{.+}}* [[ARG_PTR]], %{{.+}}** [[ARG_PTR_REF:%.+]], |
74 | // LAMBDA: [[ARG_PTR:%.+]] = load %{{.+}}*, %{{.+}}** [[ARG_PTR_REF]] |
75 | // LAMBDA: [[G_PTR_REF:%.+]] = getelementptr inbounds %{{.+}}, %{{.+}}* [[ARG_PTR]], i{{[0-9]+}} 0, i{{[0-9]+}} 0 |
76 | // LAMBDA: [[G_REF:%.+]] = load double*, double** [[G_PTR_REF]] |
77 | // LAMBDA: store double 2.0{{.+}}, double* [[G_REF]] |
78 | // LAMBDA: [[SIVAR_PTR_REF:%.+]] = getelementptr inbounds %{{.+}}, %{{.+}}* [[ARG_PTR]], i{{[0-9]+}} 0, i{{[0-9]+}} 1 |
79 | // LAMBDA: [[SIVAR_REF:%.+]] = load i{{[0-9]+}}*, i{{[0-9]+}}** [[SIVAR_PTR_REF]] |
80 | // LAMBDA: store i{{[0-9]+}} 3, i{{[0-9]+}}* [[SIVAR_REF]] |
81 | |
82 | // LAMBDA: define internal i32 [[TASK_ENTRY]](i32, %{{.+}}* noalias) |
// The region writes 1 and 2; the inner lambda then writes 2 and 3. The
// directives above and below match these constants.
83 | g = 1; |
84 | sivar = 2; |
85 | // LAMBDA: store double 1.0{{.+}}, double* %{{.+}}, |
86 | // LAMBDA: store i{{[0-9]+}} 2, i{{[0-9]+}}* %{{.+}}, |
87 | // LAMBDA: call void [[INNER_LAMBDA]](% |
88 | // LAMBDA: ret |
89 | [&]() { |
90 | g = 2; |
91 | sivar = 3; |
92 | }(); |
93 | } |
94 | }(); |
95 | return 0; |
96 | #elif defined(BLOCKS) |
// Blocks variant: same shape as the lambda variant, using block literals.
// NOTE(review): the negative checks below refer to a SIVAR pattern variable,
// but no directive with this prefix visible in this file defines it - confirm
// whether a defining line is missing.
97 | // BLOCKS: [[G:@.+]] = global double |
98 | // BLOCKS-LABEL: @main |
99 | // BLOCKS: call void {{%.+}}(i8 |
100 | ^{ |
101 | // BLOCKS: define{{.*}} internal{{.*}} void {{.+}}(i8* |
102 | // BLOCKS: [[RES:%.+]] = call i8* @__kmpc_omp_task_alloc(%{{[^ ]+}} @{{[^,]+}}, i32 %{{[^,]+}}, i32 1, i64 96, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, %{{[^*]+}}*)* [[TASK_ENTRY:@[^ ]+]] to i32 (i32, i8*)*)) |
103 | // BLOCKS: [[PRIVATES:%.+]] = getelementptr inbounds %{{.+}}, %{{.+}}* %{{.+}}, i{{.+}} 0, i{{.+}} 1 |
104 | // BLOCKS: call void @__kmpc_taskloop(%{{.+}}* @{{.+}}, i32 %{{.+}}, i8* [[RES]], i32 1, i64* %{{.+}}, i64* %{{.+}}, i64 %{{.+}}, i32 1, i32 0, i64 0, i8* null) |
105 | // BLOCKS: ret |
106 | #pragma omp taskloop simd private(g, sivar) |
107 | for (int i = 0; i < 10; ++i) { |
108 | // BLOCKS: define {{.+}} void {{@.+}}(i8* |
109 | // BLOCKS-NOT: [[G]]{{[[^:word:]]}} |
110 | // BLOCKS: store double 2.0{{.+}}, double* |
111 | // BLOCKS-NOT: [[G]]{{[[^:word:]]}} |
112 | // BLOCKS-NOT: [[SIVAR]]{{[[^:word:]]}} |
113 | // BLOCKS: store i{{[0-9]+}} 4, i{{[0-9]+}}* |
114 | // BLOCKS-NOT: [[SIVAR]]{{[[^:word:]]}} |
115 | // BLOCKS: ret |
116 | |
117 | // BLOCKS: define internal i32 [[TASK_ENTRY]](i32, %{{.+}}* noalias) |
// The region writes 1 and 3; the inner block then writes 2 and 4.
118 | g = 1; |
119 | sivar = 3; |
120 | // BLOCKS: store double 1.0{{.+}}, double* %{{.+}}, |
121 | // BLOCKS-NOT: [[G]]{{[[^:word:]]}} |
122 | // BLOCKS: store i{{[0-9]+}} 3, i{{[0-9]+}}* %{{.+}}, |
123 | // BLOCKS-NOT: [[SIVAR]]{{[[^:word:]]}} |
124 | // BLOCKS: call void {{%.+}}(i8 |
125 | ^{ |
126 | g = 2; |
127 | sivar = 4; |
128 | }(); |
129 | } |
130 | }(); |
131 | return 0; |
132 | #else |
// Default variant: privatizes class objects, arrays, a scalar and the static
// local sivar, then runs a plain task that updates g, and finally returns the
// result of tmain<int>.
133 | S<double> test; |
134 | int t_var = 0; |
135 | int vec[] = {1, 2}; |
136 | S<double> s_arr[] = {1, 2}; |
137 | S<double> var(3); |
// var and s_arr each appear twice in the private clause.
138 | #pragma omp taskloop simd private(var, t_var, s_arr, vec, s_arr, var, sivar) |
139 | for (int i = 0; i < 10; ++i) { |
// Use every privatized variable inside the loop body.
140 | vec[0] = t_var; |
141 | s_arr[0] = var; |
142 | sivar = 8; |
143 | } |
144 | #pragma omp task |
145 | g+=1; |
146 | return tmain<int>(); |
147 | #endif |
148 | } |
149 | |
150 | // CHECK: define i{{[0-9]+}} @main() |
151 | // CHECK: [[TEST:%.+]] = alloca [[S_DOUBLE_TY]], |
152 | // CHECK: [[T_VAR_ADDR:%.+]] = alloca i32, |
153 | // CHECK: [[VEC_ADDR:%.+]] = alloca [2 x i32], |
154 | // CHECK: [[S_ARR_ADDR:%.+]] = alloca [2 x [[S_DOUBLE_TY]]], |
155 | // CHECK: [[VAR_ADDR:%.+]] = alloca [[S_DOUBLE_TY]], |
156 | // CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num([[LOC:%.+]]) |
157 | |
158 | // CHECK: call {{.*}} [[S_DOUBLE_TY_DEF_CONSTR:@.+]]([[S_DOUBLE_TY]]* [[TEST]]) |
159 | |
160 | // Do not store original variables in capture struct. |
161 | // CHECK-NOT: getelementptr inbounds [[CAP_MAIN_TY]], |
162 | |
163 | // Allocate task. |
164 | // Returns struct kmp_task_t { |
165 | // [[KMP_TASK_T_TY]] task_data; |
166 | // [[PRIVATES_MAIN_TY]] privates; |
167 | // }; |
168 | // CHECK: [[RES:%.+]] = call i8* @__kmpc_omp_task_alloc([[LOC]], i32 [[GTID]], i32 9, i64 120, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[KMP_TASK_MAIN_TY]]*)* [[TASK_ENTRY:@[^ ]+]] to i32 (i32, i8*)*)) |
169 | // CHECK: [[RES_KMP_TASK:%.+]] = bitcast i8* [[RES]] to [[KMP_TASK_MAIN_TY]]* |
170 | |
171 | // CHECK: [[TASK:%.+]] = getelementptr inbounds [[KMP_TASK_MAIN_TY]], [[KMP_TASK_MAIN_TY]]* [[RES_KMP_TASK]], i{{[0-9]+}} 0, i{{[0-9]+}} 0 |
172 | // Initialize kmp_task_t->privates with default values (no init for simple types, default constructors for classes). |
173 | // Also copy address of private copy to the corresponding shareds reference. |
174 | // CHECK: [[PRIVATES:%.+]] = getelementptr inbounds [[KMP_TASK_MAIN_TY]], [[KMP_TASK_MAIN_TY]]* [[RES_KMP_TASK]], i{{[0-9]+}} 0, i{{[0-9]+}} 1 |
175 | |
176 | // Constructors for s_arr and var. |
177 | // s_arr; |
178 | // CHECK: [[PRIVATE_S_ARR_REF:%.+]] = getelementptr inbounds [[PRIVATES_MAIN_TY]], [[PRIVATES_MAIN_TY]]* [[PRIVATES]], i{{[0-9]+}} 0, i{{[0-9]+}} 0 |
179 | // CHECK: getelementptr inbounds [2 x [[S_DOUBLE_TY]]], [2 x [[S_DOUBLE_TY]]]* [[PRIVATE_S_ARR_REF]], i{{.+}} 0, i{{.+}} 0 |
180 | // CHECK: getelementptr inbounds [[S_DOUBLE_TY]], [[S_DOUBLE_TY]]* %{{.+}}, i{{.+}} 2 |
181 | // CHECK: call void [[S_DOUBLE_TY_DEF_CONSTR]]([[S_DOUBLE_TY]]* [[S_ARR_CUR:%.+]]) |
182 | // CHECK: getelementptr inbounds [[S_DOUBLE_TY]], [[S_DOUBLE_TY]]* [[S_ARR_CUR]], i{{.+}} 1 |
183 | // CHECK: icmp eq |
184 | // CHECK: br i1 |
185 | |
186 | // var; |
187 | // CHECK: [[PRIVATE_VAR_REF:%.+]] = getelementptr inbounds [[PRIVATES_MAIN_TY]], [[PRIVATES_MAIN_TY]]* [[PRIVATES]], i{{.+}} 0, i{{.+}} 1 |
188 | // CHECK: call void [[S_DOUBLE_TY_DEF_CONSTR]]([[S_DOUBLE_TY]]* [[PRIVATE_VAR_REF:%.+]]) |
189 | |
190 | // Provide pointer to destructor function, which will destroy private variables at the end of the task. |
191 | // CHECK: [[DESTRUCTORS_REF:%.+]] = getelementptr inbounds [[KMP_TASK_T_TY]], [[KMP_TASK_T_TY]]* [[TASK]], i{{.+}} 0, i{{.+}} 3 |
192 | // CHECK: [[DESTRUCTORS_PTR:%.+]] = bitcast %union{{.+}}* [[DESTRUCTORS_REF]] to i32 (i32, i8*)** |
193 | // CHECK: store i32 (i32, i8*)* bitcast (i32 (i32, [[KMP_TASK_MAIN_TY]]*)* [[DESTRUCTORS:@.+]] to i32 (i32, i8*)*), i32 (i32, i8*)** [[DESTRUCTORS_PTR]], |
194 | |
195 | // Start task. |
196 | // CHECK: call void @__kmpc_taskloop([[LOC]], i32 [[GTID]], i8* [[RES]], i32 1, i64* %{{.+}}, i64* %{{.+}}, i64 %{{.+}}, i32 1, i32 0, i64 0, i8* bitcast (void ([[KMP_TASK_MAIN_TY]]*, [[KMP_TASK_MAIN_TY]]*, i32)* [[MAIN_DUP:@.+]] to i8*)) |
197 | // CHECK: call i32 @__kmpc_omp_task([[LOC]], i32 [[GTID]], i8* |
198 | |
199 | // CHECK: = call i{{.+}} [[TMAIN_INT:@.+]]() |
200 | |
201 | // No destructors must be called for private copies of s_arr and var. |
202 | // CHECK-NOT: getelementptr inbounds [[PRIVATES_MAIN_TY]], [[PRIVATES_MAIN_TY]]* [[PRIVATES]], i{{.+}} 0, i{{.+}} 2 |
203 | // CHECK-NOT: getelementptr inbounds [[PRIVATES_MAIN_TY]], [[PRIVATES_MAIN_TY]]* [[PRIVATES]], i{{.+}} 0, i{{.+}} 3 |
204 | // CHECK: call void [[S_DOUBLE_TY_DESTR:@.+]]([[S_DOUBLE_TY]]* |
205 | // CHECK-NOT: getelementptr inbounds [[PRIVATES_MAIN_TY]], [[PRIVATES_MAIN_TY]]* [[PRIVATES]], i{{.+}} 0, i{{.+}} 2 |
206 | // CHECK-NOT: getelementptr inbounds [[PRIVATES_MAIN_TY]], [[PRIVATES_MAIN_TY]]* [[PRIVATES]], i{{.+}} 0, i{{.+}} 3 |
207 | // CHECK: ret |
208 | // |
209 | |
210 | // CHECK: define internal void [[PRIVATES_MAP_FN:@.+]]([[PRIVATES_MAIN_TY]]* noalias, [[S_DOUBLE_TY]]** noalias, i32** noalias, [2 x [[S_DOUBLE_TY]]]** noalias, [2 x i32]** noalias, i32** noalias) |
211 | // CHECK: [[PRIVATES:%.+]] = load [[PRIVATES_MAIN_TY]]*, [[PRIVATES_MAIN_TY]]** |
212 | // CHECK: [[PRIV_S_VAR:%.+]] = getelementptr inbounds [[PRIVATES_MAIN_TY]], [[PRIVATES_MAIN_TY]]* [[PRIVATES]], i32 0, i32 0 |
213 | // CHECK: [[ARG3:%.+]] = load [2 x [[S_DOUBLE_TY]]]**, [2 x [[S_DOUBLE_TY]]]*** %{{.+}}, |
214 | // CHECK: store [2 x [[S_DOUBLE_TY]]]* [[PRIV_S_VAR]], [2 x [[S_DOUBLE_TY]]]** [[ARG3]], |
215 | // CHECK: [[PRIV_VAR:%.+]] = getelementptr inbounds [[PRIVATES_MAIN_TY]], [[PRIVATES_MAIN_TY]]* [[PRIVATES]], i32 0, i32 1 |
216 | // CHECK: [[ARG1:%.+]] = load [[S_DOUBLE_TY]]**, [[S_DOUBLE_TY]]*** {{.+}}, |
217 | // CHECK: store [[S_DOUBLE_TY]]* [[PRIV_VAR]], [[S_DOUBLE_TY]]** [[ARG1]], |
218 | // CHECK: [[PRIV_T_VAR:%.+]] = getelementptr inbounds [[PRIVATES_MAIN_TY]], [[PRIVATES_MAIN_TY]]* [[PRIVATES]], i32 0, i32 2 |
219 | // CHECK: [[ARG2:%.+]] = load i32**, i32*** %{{.+}}, |
220 | // CHECK: store i32* [[PRIV_T_VAR]], i32** [[ARG2]], |
221 | // CHECK: [[PRIV_VEC:%.+]] = getelementptr inbounds [[PRIVATES_MAIN_TY]], [[PRIVATES_MAIN_TY]]* [[PRIVATES]], i32 0, i32 3 |
222 | // CHECK: [[ARG4:%.+]] = load [2 x i32]**, [2 x i32]*** %{{.+}}, |
223 | // CHECK: store [2 x i32]* [[PRIV_VEC]], [2 x i32]** [[ARG4]], |
224 | // CHECK: ret void |
225 | |
226 | // CHECK: define internal i32 [[TASK_ENTRY]](i32, [[KMP_TASK_MAIN_TY]]* noalias) |
227 | |
228 | // CHECK: [[PRIV_VAR_ADDR:%.+]] = alloca [[S_DOUBLE_TY]]*, |
229 | // CHECK: [[PRIV_T_VAR_ADDR:%.+]] = alloca i32*, |
230 | // CHECK: [[PRIV_S_ARR_ADDR:%.+]] = alloca [2 x [[S_DOUBLE_TY]]]*, |
231 | // CHECK: [[PRIV_VEC_ADDR:%.+]] = alloca [2 x i32]*, |
232 | // CHECK: [[PRIV_SIVAR_ADDR:%.+]] = alloca i32*, |
233 | // CHECK: store void (i8*, ...)* bitcast (void ([[PRIVATES_MAIN_TY]]*, [[S_DOUBLE_TY]]**, i32**, [2 x [[S_DOUBLE_TY]]]**, [2 x i32]**, i32**)* [[PRIVATES_MAP_FN]] to void (i8*, ...)*), void (i8*, ...)** [[MAP_FN_ADDR:%.+]], |
234 | // CHECK: [[MAP_FN:%.+]] = load void (i8*, ...)*, void (i8*, ...)** [[MAP_FN_ADDR]], |
235 | // CHECK: call void (i8*, ...) [[MAP_FN]](i8* %{{.+}}, [[S_DOUBLE_TY]]** [[PRIV_VAR_ADDR]], i32** [[PRIV_T_VAR_ADDR]], [2 x [[S_DOUBLE_TY]]]** [[PRIV_S_ARR_ADDR]], [2 x i32]** [[PRIV_VEC_ADDR]], i32** [[PRIV_SIVAR_ADDR]]) |
236 | // CHECK: [[PRIV_VAR:%.+]] = load [[S_DOUBLE_TY]]*, [[S_DOUBLE_TY]]** [[PRIV_VAR_ADDR]], |
237 | // CHECK: [[PRIV_T_VAR:%.+]] = load i32*, i32** [[PRIV_T_VAR_ADDR]], |
238 | // CHECK: [[PRIV_S_ARR:%.+]] = load [2 x [[S_DOUBLE_TY]]]*, [2 x [[S_DOUBLE_TY]]]** [[PRIV_S_ARR_ADDR]], |
239 | // CHECK: [[PRIV_VEC:%.+]] = load [2 x i32]*, [2 x i32]** [[PRIV_VEC_ADDR]], |
240 | // CHECK: [[PRIV_SIVAR:%.+]] = load i32*, i32** [[PRIV_SIVAR_ADDR]], |
241 | |
242 | // Privates actually are used. |
243 | // CHECK-DAG: [[PRIV_VAR]] |
244 | // CHECK-DAG: [[PRIV_T_VAR]] |
245 | // CHECK-DAG: [[PRIV_S_ARR]] |
246 | // CHECK-DAG: [[PRIV_VEC]] |
247 | // CHECK-DAG: [[PRIV_SIVAR]] |
248 | |
249 | // CHECK: ret |
250 | |
251 | // CHECK: define internal void [[MAIN_DUP]]([[KMP_TASK_MAIN_TY]]*, [[KMP_TASK_MAIN_TY]]*, i32) |
252 | // CHECK: getelementptr inbounds [[KMP_TASK_MAIN_TY]], [[KMP_TASK_MAIN_TY]]* %{{.+}}, i32 0, i32 1 |
253 | // CHECK: getelementptr inbounds [[PRIVATES_MAIN_TY]], [[PRIVATES_MAIN_TY]]* %{{.+}}, i32 0, i32 0 |
254 | // CHECK: getelementptr inbounds [2 x [[S_DOUBLE_TY]]], [2 x [[S_DOUBLE_TY]]]* %{{.+}}, i32 0, i32 0 |
255 | // CHECK: getelementptr inbounds [[S_DOUBLE_TY]], [[S_DOUBLE_TY]]* %{{.+}}, i64 2 |
256 | // CHECK: br label % |
257 | |
258 | // CHECK: phi [[S_DOUBLE_TY]]* |
259 | // CHECK: call {{.*}} [[S_DOUBLE_TY_DEF_CONSTR]]([[S_DOUBLE_TY]]* |
260 | // CHECK: getelementptr inbounds [[S_DOUBLE_TY]], [[S_DOUBLE_TY]]* %{{.+}}, i64 1 |
261 | // CHECK: icmp eq [[S_DOUBLE_TY]]* % |
262 | // CHECK: br i1 % |
263 | |
264 | // CHECK: getelementptr inbounds [[PRIVATES_MAIN_TY]], [[PRIVATES_MAIN_TY]]* %{{.+}}, i32 0, i32 1 |
265 | // CHECK: call {{.*}} [[S_DOUBLE_TY_DEF_CONSTR]]([[S_DOUBLE_TY]]* |
266 | // CHECK: ret void |
267 | |
268 | // CHECK: define internal i32 [[DESTRUCTORS]](i32, [[KMP_TASK_MAIN_TY]]* noalias) |
269 | // CHECK: [[PRIVATES:%.+]] = getelementptr inbounds [[KMP_TASK_MAIN_TY]], [[KMP_TASK_MAIN_TY]]* [[RES_KMP_TASK:%.+]], i{{[0-9]+}} 0, i{{[0-9]+}} 1 |
270 | // CHECK: [[PRIVATE_S_ARR_REF:%.+]] = getelementptr inbounds [[PRIVATES_MAIN_TY]], [[PRIVATES_MAIN_TY]]* [[PRIVATES]], i{{.+}} 0, i{{.+}} 0 |
271 | // CHECK: [[PRIVATE_VAR_REF:%.+]] = getelementptr inbounds [[PRIVATES_MAIN_TY]], [[PRIVATES_MAIN_TY]]* [[PRIVATES]], i{{.+}} 0, i{{.+}} 1 |
272 | // CHECK: call void [[S_DOUBLE_TY_DESTR]]([[S_DOUBLE_TY]]* [[PRIVATE_VAR_REF]]) |
273 | // CHECK: getelementptr inbounds [2 x [[S_DOUBLE_TY]]], [2 x [[S_DOUBLE_TY]]]* [[PRIVATE_S_ARR_REF]], i{{.+}} 0, i{{.+}} 0 |
274 | // CHECK: getelementptr inbounds [[S_DOUBLE_TY]], [[S_DOUBLE_TY]]* %{{.+}}, i{{.+}} 2 |
275 | // CHECK: [[PRIVATE_S_ARR_ELEM_REF:%.+]] = getelementptr inbounds [[S_DOUBLE_TY]], [[S_DOUBLE_TY]]* %{{.+}}, i{{.+}} -1 |
276 | // CHECK: call void [[S_DOUBLE_TY_DESTR]]([[S_DOUBLE_TY]]* [[PRIVATE_S_ARR_ELEM_REF]]) |
277 | // CHECK: icmp eq |
278 | // CHECK: br i1 |
279 | // CHECK: ret i32 |
280 | |
281 | // CHECK: define {{.*}} i{{[0-9]+}} [[TMAIN_INT]]() |
282 | // CHECK: [[TEST:%.+]] = alloca [[S_INT_TY]], |
283 | // CHECK: [[T_VAR_ADDR:%.+]] = alloca i32, |
284 | // CHECK: [[VEC_ADDR:%.+]] = alloca [2 x i32], |
285 | // CHECK: [[S_ARR_ADDR:%.+]] = alloca [2 x [[S_INT_TY]]], |
286 | // CHECK: [[VAR_ADDR:%.+]] = alloca [[S_INT_TY]], |
287 | // CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num([[LOC:%.+]]) |
288 | |
289 | // CHECK: call {{.*}} [[S_INT_TY_DEF_CONSTR:@.+]]([[S_INT_TY]]* [[TEST]]) |
290 | |
291 | // Do not store original variables in capture struct. |
292 | // CHECK-NOT: getelementptr inbounds [[CAP_TMAIN_TY]], |
293 | |
294 | // Allocate task. |
295 | // Returns struct kmp_task_t { |
296 | // [[KMP_TASK_T_TY]] task_data; |
297 | // [[PRIVATES_TMAIN_TY]] privates; |
298 | // }; |
299 | // CHECK: [[RES:%.+]] = call i8* @__kmpc_omp_task_alloc([[LOC]], i32 [[GTID]], i32 9, i64 256, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[KMP_TASK_TMAIN_TY]]*)* [[TASK_ENTRY:@[^ ]+]] to i32 (i32, i8*)*)) |
300 | // CHECK: [[RES_KMP_TASK:%.+]] = bitcast i8* [[RES]] to [[KMP_TASK_TMAIN_TY]]* |
301 | |
302 | // CHECK: [[TASK:%.+]] = getelementptr inbounds [[KMP_TASK_TMAIN_TY]], [[KMP_TASK_TMAIN_TY]]* [[RES_KMP_TASK]], i{{[0-9]+}} 0, i{{[0-9]+}} 0 |
303 | |
304 | // Initialize kmp_task_t->privates with default values (no init for simple types, default constructors for classes). |
305 | // CHECK: [[PRIVATES:%.+]] = getelementptr inbounds [[KMP_TASK_TMAIN_TY]], [[KMP_TASK_TMAIN_TY]]* [[RES_KMP_TASK]], i{{[0-9]+}} 0, i{{[0-9]+}} 2 |
306 | |
307 | // Constructors for s_arr and var. |
308 | // s_arr; |
309 | // CHECK: [[PRIVATE_S_ARR_REF:%.+]] = getelementptr inbounds [[PRIVATES_TMAIN_TY]], [[PRIVATES_TMAIN_TY]]* [[PRIVATES]], i{{[0-9]+}} 0, i{{[0-9]+}} 2 |
310 | // CHECK: getelementptr inbounds [2 x [[S_INT_TY]]], [2 x [[S_INT_TY]]]* [[PRIVATE_S_ARR_REF]], i{{.+}} 0, i{{.+}} 0 |
311 | // CHECK: getelementptr inbounds [[S_INT_TY]], [[S_INT_TY]]* %{{.+}}, i{{.+}} 2 |
312 | // CHECK: call void [[S_INT_TY_DEF_CONSTR]]([[S_INT_TY]]* [[S_ARR_CUR:%.+]]) |
313 | // CHECK: getelementptr inbounds [[S_INT_TY]], [[S_INT_TY]]* [[S_ARR_CUR]], i{{.+}} 1 |
314 | // CHECK: icmp eq |
315 | // CHECK: br i1 |
316 | |
317 | // var; |
318 | // CHECK: [[PRIVATE_VAR_REF:%.+]] = getelementptr inbounds [[PRIVATES_TMAIN_TY]], [[PRIVATES_TMAIN_TY]]* [[PRIVATES]], i{{.+}} 0, i{{.+}} 3 |
319 | // CHECK: call void [[S_INT_TY_DEF_CONSTR]]([[S_INT_TY]]* [[PRIVATE_VAR_REF:%.+]]) |
320 | |
321 | // Provide pointer to destructor function, which will destroy private variables at the end of the task. |
322 | // CHECK: [[DESTRUCTORS_REF:%.+]] = getelementptr inbounds [[KMP_TASK_T_TY]], [[KMP_TASK_T_TY]]* [[TASK]], i{{.+}} 0, i{{.+}} 3 |
323 | // CHECK: [[DESTRUCTORS_PTR:%.+]] = bitcast %union{{.+}}* [[DESTRUCTORS_REF]] to i32 (i32, i8*)** |
324 | // CHECK: store i32 (i32, i8*)* bitcast (i32 (i32, [[KMP_TASK_TMAIN_TY]]*)* [[DESTRUCTORS:@.+]] to i32 (i32, i8*)*), i32 (i32, i8*)** [[DESTRUCTORS_PTR]], |
325 | |
326 | // Start task. |
327 | // CHECK: call void @__kmpc_taskloop([[LOC]], i32 [[GTID]], i8* [[RES]], i32 1, i64* %{{.+}}, i64* %{{.+}}, i64 %{{.+}}, i32 1, i32 0, i64 0, i8* bitcast (void ([[KMP_TASK_TMAIN_TY]]*, [[KMP_TASK_TMAIN_TY]]*, i32)* [[TMAIN_DUP:@.+]] to i8*)) |
328 | |
329 | // No destructors must be called for private copies of s_arr and var. |
330 | // CHECK-NOT: getelementptr inbounds [[PRIVATES_TMAIN_TY]], [[PRIVATES_TMAIN_TY]]* [[PRIVATES]], i{{.+}} 0, i{{.+}} 2 |
331 | // CHECK-NOT: getelementptr inbounds [[PRIVATES_TMAIN_TY]], [[PRIVATES_TMAIN_TY]]* [[PRIVATES]], i{{.+}} 0, i{{.+}} 3 |
332 | // CHECK: call void [[S_INT_TY_DESTR:@.+]]([[S_INT_TY]]* |
333 | // CHECK-NOT: getelementptr inbounds [[PRIVATES_TMAIN_TY]], [[PRIVATES_TMAIN_TY]]* [[PRIVATES]], i{{.+}} 0, i{{.+}} 2 |
334 | // CHECK-NOT: getelementptr inbounds [[PRIVATES_TMAIN_TY]], [[PRIVATES_TMAIN_TY]]* [[PRIVATES]], i{{.+}} 0, i{{.+}} 3 |
335 | // CHECK: ret |
336 | // |
337 | |
338 | // CHECK: define internal void [[PRIVATES_MAP_FN:@.+]]([[PRIVATES_TMAIN_TY]]* noalias, i32** noalias, [2 x i32]** noalias, [2 x [[S_INT_TY]]]** noalias, [[S_INT_TY]]** noalias) |
339 | // CHECK: [[PRIVATES:%.+]] = load [[PRIVATES_TMAIN_TY]]*, [[PRIVATES_TMAIN_TY]]** |
340 | // CHECK: [[PRIV_T_VAR:%.+]] = getelementptr inbounds [[PRIVATES_TMAIN_TY]], [[PRIVATES_TMAIN_TY]]* [[PRIVATES]], i32 0, i32 0 |
341 | // CHECK: [[ARG1:%.+]] = load i32**, i32*** %{{.+}}, |
342 | // CHECK: store i32* [[PRIV_T_VAR]], i32** [[ARG1]], |
343 | // CHECK: [[PRIV_VEC:%.+]] = getelementptr inbounds [[PRIVATES_TMAIN_TY]], [[PRIVATES_TMAIN_TY]]* [[PRIVATES]], i32 0, i32 1 |
344 | // CHECK: [[ARG2:%.+]] = load [2 x i32]**, [2 x i32]*** %{{.+}}, |
345 | // CHECK: store [2 x i32]* [[PRIV_VEC]], [2 x i32]** [[ARG2]], |
346 | // CHECK: [[PRIV_S_VAR:%.+]] = getelementptr inbounds [[PRIVATES_TMAIN_TY]], [[PRIVATES_TMAIN_TY]]* [[PRIVATES]], i32 0, i32 2 |
347 | // CHECK: [[ARG3:%.+]] = load [2 x [[S_INT_TY]]]**, [2 x [[S_INT_TY]]]*** %{{.+}}, |
348 | // CHECK: store [2 x [[S_INT_TY]]]* [[PRIV_S_VAR]], [2 x [[S_INT_TY]]]** [[ARG3]], |
349 | // CHECK: [[PRIV_VAR:%.+]] = getelementptr inbounds [[PRIVATES_TMAIN_TY]], [[PRIVATES_TMAIN_TY]]* [[PRIVATES]], i32 0, i32 3 |
350 | // CHECK: [[ARG4:%.+]] = load [[S_INT_TY]]**, [[S_INT_TY]]*** {{.+}}, |
351 | // CHECK: store [[S_INT_TY]]* [[PRIV_VAR]], [[S_INT_TY]]** [[ARG4]], |
352 | // CHECK: ret void |
353 | |
354 | // CHECK: define internal i32 [[TASK_ENTRY]](i32, [[KMP_TASK_TMAIN_TY]]* noalias) |
355 | |
356 | // CHECK: alloca i32*, |
357 | // CHECK-DAG: [[PRIV_T_VAR_ADDR:%.+]] = alloca i32*, |
358 | // CHECK-DAG: [[PRIV_VEC_ADDR:%.+]] = alloca [2 x i32]*, |
359 | // CHECK-DAG: [[PRIV_S_ARR_ADDR:%.+]] = alloca [2 x [[S_INT_TY]]]*, |
360 | // CHECK-DAG: [[PRIV_VAR_ADDR:%.+]] = alloca [[S_INT_TY]]*, |
361 | // CHECK: store void (i8*, ...)* bitcast (void ([[PRIVATES_TMAIN_TY]]*, i32**, [2 x i32]**, [2 x [[S_INT_TY]]]**, [[S_INT_TY]]**)* [[PRIVATES_MAP_FN]] to void (i8*, ...)*), void (i8*, ...)** [[MAP_FN_ADDR:%.+]], |
362 | // CHECK: [[MAP_FN:%.+]] = load void (i8*, ...)*, void (i8*, ...)** [[MAP_FN_ADDR]], |
363 | // CHECK: call void (i8*, ...) [[MAP_FN]](i8* %{{.+}}, i32** [[PRIV_T_VAR_ADDR]], [2 x i32]** [[PRIV_VEC_ADDR]], [2 x [[S_INT_TY]]]** [[PRIV_S_ARR_ADDR]], [[S_INT_TY]]** [[PRIV_VAR_ADDR]]) |
364 | // CHECK: [[PRIV_T_VAR:%.+]] = load i32*, i32** [[PRIV_T_VAR_ADDR]], |
365 | // CHECK: [[PRIV_VEC:%.+]] = load [2 x i32]*, [2 x i32]** [[PRIV_VEC_ADDR]], |
366 | // CHECK: [[PRIV_S_ARR:%.+]] = load [2 x [[S_INT_TY]]]*, [2 x [[S_INT_TY]]]** [[PRIV_S_ARR_ADDR]], |
367 | // CHECK: [[PRIV_VAR:%.+]] = load [[S_INT_TY]]*, [[S_INT_TY]]** [[PRIV_VAR_ADDR]], |
368 | |
369 | // Privates actually are used. |
370 | // CHECK-DAG: [[PRIV_VAR]] |
371 | // CHECK-DAG: [[PRIV_T_VAR]] |
372 | // CHECK-DAG: [[PRIV_S_ARR]] |
373 | // CHECK-DAG: [[PRIV_VEC]] |
374 | |
375 | // CHECK: ret |
376 | |
377 | // CHECK: define internal void [[TMAIN_DUP]]([[KMP_TASK_TMAIN_TY]]*, [[KMP_TASK_TMAIN_TY]]*, i32) |
378 | // CHECK: getelementptr inbounds [[KMP_TASK_TMAIN_TY]], [[KMP_TASK_TMAIN_TY]]* %{{.+}}, i32 0, i32 2 |
379 | // CHECK: getelementptr inbounds [[PRIVATES_TMAIN_TY]], [[PRIVATES_TMAIN_TY]]* %{{.+}}, i32 0, i32 2 |
380 | // CHECK: getelementptr inbounds [2 x [[S_INT_TY]]], [2 x [[S_INT_TY]]]* %{{.+}}, i32 0, i32 0 |
381 | // CHECK: getelementptr inbounds [[S_INT_TY]], [[S_INT_TY]]* %{{.+}}, i64 2 |
382 | // CHECK: br label % |
383 | |
384 | // CHECK: phi [[S_INT_TY]]* |
385 | // CHECK: call {{.*}} [[S_INT_TY_DEF_CONSTR]]([[S_INT_TY]]* |
386 | // CHECK: getelementptr inbounds [[S_INT_TY]], [[S_INT_TY]]* %{{.+}}, i64 1 |
387 | // CHECK: icmp eq [[S_INT_TY]]* % |
388 | // CHECK: br i1 % |
389 | |
390 | // CHECK: getelementptr inbounds [[PRIVATES_TMAIN_TY]], [[PRIVATES_TMAIN_TY]]* %{{.+}}, i32 0, i32 3 |
391 | // CHECK: call {{.*}} [[S_INT_TY_DEF_CONSTR]]([[S_INT_TY]]* |
392 | // CHECK: ret void |
393 | |
394 | // CHECK: define internal i32 [[DESTRUCTORS]](i32, [[KMP_TASK_TMAIN_TY]]* noalias) |
395 | // CHECK: [[PRIVATES:%.+]] = getelementptr inbounds [[KMP_TASK_TMAIN_TY]], [[KMP_TASK_TMAIN_TY]]* [[RES_KMP_TASK:%.+]], i{{[0-9]+}} 0, i{{[0-9]+}} 2 |
396 | // CHECK: [[PRIVATE_S_ARR_REF:%.+]] = getelementptr inbounds [[PRIVATES_TMAIN_TY]], [[PRIVATES_TMAIN_TY]]* [[PRIVATES]], i{{.+}} 0, i{{.+}} 2 |
397 | // CHECK: [[PRIVATE_VAR_REF:%.+]] = getelementptr inbounds [[PRIVATES_TMAIN_TY]], [[PRIVATES_TMAIN_TY]]* [[PRIVATES]], i{{.+}} 0, i{{.+}} 3 |
398 | // CHECK: call void [[S_INT_TY_DESTR]]([[S_INT_TY]]* [[PRIVATE_VAR_REF]]) |
399 | // CHECK: getelementptr inbounds [2 x [[S_INT_TY]]], [2 x [[S_INT_TY]]]* [[PRIVATE_S_ARR_REF]], i{{.+}} 0, i{{.+}} 0 |
400 | // CHECK: getelementptr inbounds [[S_INT_TY]], [[S_INT_TY]]* %{{.+}}, i{{.+}} 2 |
401 | // CHECK: [[PRIVATE_S_ARR_ELEM_REF:%.+]] = getelementptr inbounds [[S_INT_TY]], [[S_INT_TY]]* %{{.+}}, i{{.+}} -1 |
402 | // CHECK: call void [[S_INT_TY_DESTR]]([[S_INT_TY]]* [[PRIVATE_S_ARR_ELEM_REF]]) |
403 | // CHECK: icmp eq |
404 | // CHECK: br i1 |
405 | // CHECK: ret i32 |
406 | |
// Closes the HEADER guard.
407 | #endif |
// Alternative branch of the outer ARRAY conditional: compiled only when ARRAY
// is defined.
408 | #else |
409 | // ARRAY-LABEL: array_func |
// Class type with user-provided default constructor, copy assignment and
// destructor; used as the element type of the `s` parameter of array_func.
410 | struct St { |
411 | int a, b; |
// Zero-initializes both members.
412 | St() : a(0), b(0) {} |
// Copy assignment that ignores its argument and leaves *this unchanged.
413 | St &operator=(const St &) { return *this; }; |
// User-provided destructor with an empty body.
414 | ~St() {} |
415 | }; |
416 | |
// Privatizes two array-typed parameters on a `taskloop simd` construct with an
// empty loop body. `a` is declared with the variable bound n and `s` with a
// constant bound; the directives inside expect both to be stored through
// pointer-to-pointer slots (float** and %struct.St**).
417 | void array_func(int n, float a[n], St s[2]) { |
418 | // ARRAY: call i8* @__kmpc_omp_task_alloc( |
419 | // ARRAY: call void @__kmpc_taskloop( |
420 | // ARRAY: store float** %{{.+}}, float*** %{{.+}}, |
421 | // ARRAY: store %struct.St** %{{.+}}, %struct.St*** %{{.+}}, |
422 | #pragma omp taskloop simd private(a, s) |
423 | for (int i = 0; i < 10; ++i) |
424 | ; |
425 | } |
// Closes the outer ARRAY conditional.
426 | #endif |
427 | |
428 | |