1 | // RUN: %clang_cc1 %s -emit-llvm -o - -triple=armv5-unknown-freebsd -std=c11 | FileCheck %s |
2 | |
3 | // Test that we are generating atomicrmw instructions, rather than |
4 | // compare-exchange loops for common atomic ops. This makes a big difference |
5 | // on RISC platforms, where the compare-exchange loop becomes a ll/sc pair for |
6 | // the load and then another ll/sc in the loop, expanding to about 30 |
7 | // instructions when it should be only 4. It has a smaller, but still |
8 | // noticeable, impact on platforms like x86 and RISC-V, where there are atomic |
9 | // RMW instructions. |
10 | // |
11 | // We currently emit cmpxchg loops for most operations on _Bools, because |
12 | // they're sufficiently rare that it's not worth making sure that the semantics |
13 | // are correct. |
14 | |
15 | struct elem; |
16 | |
17 | struct ptr { |
18 | struct elem *ptr; |
19 | }; |
20 | // CHECK-DAG: %struct.ptr = type { %struct.elem* } |
21 | |
22 | struct elem { |
23 | _Atomic(struct ptr) link; |
24 | }; |
25 | // CHECK-DAG: %struct.elem = type { %struct.ptr } |
26 | |
27 | struct ptr object; |
28 | // CHECK-DAG: @object = common global %struct.ptr zeroinitializer |
29 | |
30 | // CHECK-DAG: @testStructGlobal = global {{.*}} { i16 1, i16 2, i16 3, i16 4 } |
31 | // CHECK-DAG: @testPromotedStructGlobal = global {{.*}} { %{{.*}} { i16 1, i16 2, i16 3 }, [2 x i8] zeroinitializer } |
32 | |
33 | |
34 | typedef int __attribute__((vector_size(16))) vector; |
35 | |
36 | _Atomic(_Bool) b; |
37 | _Atomic(int) i; |
38 | _Atomic(long long) l; |
39 | _Atomic(short) s; |
40 | _Atomic(char*) p; |
41 | _Atomic(float) f; |
42 | _Atomic(vector) v; |
43 | |
44 | // CHECK: testinc |
45 | void testinc(void) |
46 | { |
47 | // Special case for suffix bool++, sets to true and returns the old value. |
48 | // CHECK: atomicrmw xchg i8* @b, i8 1 seq_cst |
49 | b++; |
50 | // CHECK: atomicrmw add i32* @i, i32 1 seq_cst |
51 | i++; |
52 | // CHECK: atomicrmw add i64* @l, i64 1 seq_cst |
53 | l++; |
54 | // CHECK: atomicrmw add i16* @s, i16 1 seq_cst |
55 | s++; |
56 | // Prefix increment |
57 | // Special case for bool: set to true and return true |
58 | // CHECK: store atomic i8 1, i8* @b seq_cst, align 1 |
59 | ++b; |
60 | // Currently, we have no variant of atomicrmw that returns the new value, so |
61 | // we have to generate an atomic add, which returns the old value, and then a |
62 | // non-atomic add. |
63 | // CHECK: atomicrmw add i32* @i, i32 1 seq_cst |
64 | // CHECK: add i32 |
65 | ++i; |
66 | // CHECK: atomicrmw add i64* @l, i64 1 seq_cst |
67 | // CHECK: add i64 |
68 | ++l; |
69 | // CHECK: atomicrmw add i16* @s, i16 1 seq_cst |
70 | // CHECK: add i16 |
71 | ++s; |
72 | } |
73 | // CHECK: testdec |
74 | void testdec(void) |
75 | { |
76 | // CHECK: call arm_aapcscc zeroext i1 @__atomic_compare_exchange(i32 1, i8* @b |
77 | b--; |
78 | // CHECK: atomicrmw sub i32* @i, i32 1 seq_cst |
79 | i--; |
80 | // CHECK: atomicrmw sub i64* @l, i64 1 seq_cst |
81 | l--; |
82 | // CHECK: atomicrmw sub i16* @s, i16 1 seq_cst |
83 | s--; |
84 | // CHECK: call arm_aapcscc zeroext i1 @__atomic_compare_exchange(i32 1, i8* @b |
85 | --b; |
86 | // CHECK: atomicrmw sub i32* @i, i32 1 seq_cst |
87 | // CHECK: sub i32 |
88 | --i; |
89 | // CHECK: atomicrmw sub i64* @l, i64 1 seq_cst |
90 | // CHECK: sub i64 |
91 | --l; |
92 | // CHECK: atomicrmw sub i16* @s, i16 1 seq_cst |
93 | // CHECK: sub i16 |
94 | --s; |
95 | } |
96 | // CHECK: testaddeq |
97 | void testaddeq(void) |
98 | { |
99 | // CHECK: call arm_aapcscc zeroext i1 @__atomic_compare_exchange(i32 1, i8* @b |
100 | // CHECK: atomicrmw add i32* @i, i32 42 seq_cst |
101 | // CHECK: atomicrmw add i64* @l, i64 42 seq_cst |
102 | // CHECK: atomicrmw add i16* @s, i16 42 seq_cst |
103 | b += 42; |
104 | i += 42; |
105 | l += 42; |
106 | s += 42; |
107 | } |
108 | // CHECK: testsubeq |
109 | void testsubeq(void) |
110 | { |
111 | // CHECK: call arm_aapcscc zeroext i1 @__atomic_compare_exchange(i32 1, i8* @b |
112 | // CHECK: atomicrmw sub i32* @i, i32 42 seq_cst |
113 | // CHECK: atomicrmw sub i64* @l, i64 42 seq_cst |
114 | // CHECK: atomicrmw sub i16* @s, i16 42 seq_cst |
115 | b -= 42; |
116 | i -= 42; |
117 | l -= 42; |
118 | s -= 42; |
119 | } |
120 | // CHECK: testxoreq |
121 | void testxoreq(void) |
122 | { |
123 | // CHECK: call arm_aapcscc zeroext i1 @__atomic_compare_exchange(i32 1, i8* @b |
124 | // CHECK: atomicrmw xor i32* @i, i32 42 seq_cst |
125 | // CHECK: atomicrmw xor i64* @l, i64 42 seq_cst |
126 | // CHECK: atomicrmw xor i16* @s, i16 42 seq_cst |
127 | b ^= 42; |
128 | i ^= 42; |
129 | l ^= 42; |
130 | s ^= 42; |
131 | } |
132 | // CHECK: testoreq |
133 | void testoreq(void) |
134 | { |
135 | // CHECK: call arm_aapcscc zeroext i1 @__atomic_compare_exchange(i32 1, i8* @b |
136 | // CHECK: atomicrmw or i32* @i, i32 42 seq_cst |
137 | // CHECK: atomicrmw or i64* @l, i64 42 seq_cst |
138 | // CHECK: atomicrmw or i16* @s, i16 42 seq_cst |
139 | b |= 42; |
140 | i |= 42; |
141 | l |= 42; |
142 | s |= 42; |
143 | } |
144 | // CHECK: testandeq |
145 | void testandeq(void) |
146 | { |
147 | // CHECK: call arm_aapcscc zeroext i1 @__atomic_compare_exchange(i32 1, i8* @b |
148 | // CHECK: atomicrmw and i32* @i, i32 42 seq_cst |
149 | // CHECK: atomicrmw and i64* @l, i64 42 seq_cst |
150 | // CHECK: atomicrmw and i16* @s, i16 42 seq_cst |
151 | b &= 42; |
152 | i &= 42; |
153 | l &= 42; |
154 | s &= 42; |
155 | } |
156 | |
157 | // CHECK-LABEL: define arm_aapcscc void @testFloat(float* |
158 | void testFloat(_Atomic(float) *fp) { |
159 | // CHECK: [[FP:%.*]] = alloca float* |
160 | // CHECK-NEXT: [[X:%.*]] = alloca float |
161 | // CHECK-NEXT: [[F:%.*]] = alloca float |
162 | // CHECK-NEXT: [[TMP0:%.*]] = alloca float |
163 | // CHECK-NEXT: [[TMP1:%.*]] = alloca float |
164 | // CHECK-NEXT: store float* {{%.*}}, float** [[FP]] |
165 | |
166 | // CHECK-NEXT: [[T0:%.*]] = load float*, float** [[FP]] |
167 | // CHECK-NEXT: store float 1.000000e+00, float* [[T0]], align 4 |
168 | __c11_atomic_init(fp, 1.0f); |
169 | |
170 | // CHECK-NEXT: store float 2.000000e+00, float* [[X]], align 4 |
171 | _Atomic(float) x = 2.0f; |
172 | |
173 | // CHECK-NEXT: [[T0:%.*]] = load float*, float** [[FP]] |
174 | // CHECK-NEXT: [[T1:%.*]] = bitcast float* [[T0]] to i8* |
175 | // CHECK-NEXT: [[T2:%.*]] = bitcast float* [[TMP0]] to i8* |
176 | // CHECK-NEXT: call arm_aapcscc void @__atomic_load(i32 4, i8* [[T1]], i8* [[T2]], i32 5) |
177 | // CHECK-NEXT: [[T3:%.*]] = load float, float* [[TMP0]], align 4 |
178 | // CHECK-NEXT: store float [[T3]], float* [[F]] |
179 | float f = *fp; |
180 | |
181 | // CHECK-NEXT: [[T0:%.*]] = load float, float* [[F]], align 4 |
182 | // CHECK-NEXT: [[T1:%.*]] = load float*, float** [[FP]], align 4 |
183 | // CHECK-NEXT: store float [[T0]], float* [[TMP1]], align 4 |
184 | // CHECK-NEXT: [[T2:%.*]] = bitcast float* [[T1]] to i8* |
185 | // CHECK-NEXT: [[T3:%.*]] = bitcast float* [[TMP1]] to i8* |
186 | // CHECK-NEXT: call arm_aapcscc void @__atomic_store(i32 4, i8* [[T2]], i8* [[T3]], i32 5) |
187 | *fp = f; |
188 | |
189 | // CHECK-NEXT: ret void |
190 | } |
191 | |
192 | // CHECK: define arm_aapcscc void @testComplexFloat([[CF:{ float, float }]]* |
193 | void testComplexFloat(_Atomic(_Complex float) *fp) { |
194 | // CHECK: [[FP:%.*]] = alloca [[CF]]*, align 4 |
195 | // CHECK-NEXT: [[X:%.*]] = alloca [[CF]], align 8 |
196 | // CHECK-NEXT: [[F:%.*]] = alloca [[CF]], align 4 |
197 | // CHECK-NEXT: [[TMP0:%.*]] = alloca [[CF]], align 8 |
198 | // CHECK-NEXT: [[TMP1:%.*]] = alloca [[CF]], align 8 |
199 | // CHECK-NEXT: store [[CF]]* |
200 | |
201 | // CHECK-NEXT: [[P:%.*]] = load [[CF]]*, [[CF]]** [[FP]] |
202 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]], [[CF]]* [[P]], i32 0, i32 0 |
203 | // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[CF]], [[CF]]* [[P]], i32 0, i32 1 |
204 | // CHECK-NEXT: store float 1.000000e+00, float* [[T0]] |
205 | // CHECK-NEXT: store float 0.000000e+00, float* [[T1]] |
206 | __c11_atomic_init(fp, 1.0f); |
207 | |
208 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]], [[CF]]* [[X]], i32 0, i32 0 |
209 | // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[CF]], [[CF]]* [[X]], i32 0, i32 1 |
210 | // CHECK-NEXT: store float 2.000000e+00, float* [[T0]] |
211 | // CHECK-NEXT: store float 0.000000e+00, float* [[T1]] |
212 | _Atomic(_Complex float) x = 2.0f; |
213 | |
214 | // CHECK-NEXT: [[T0:%.*]] = load [[CF]]*, [[CF]]** [[FP]] |
215 | // CHECK-NEXT: [[T1:%.*]] = bitcast [[CF]]* [[T0]] to i8* |
216 | // CHECK-NEXT: [[T2:%.*]] = bitcast [[CF]]* [[TMP0]] to i8* |
217 | // CHECK-NEXT: call arm_aapcscc void @__atomic_load(i32 8, i8* [[T1]], i8* [[T2]], i32 5) |
218 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]], [[CF]]* [[TMP0]], i32 0, i32 0 |
219 | // CHECK-NEXT: [[R:%.*]] = load float, float* [[T0]] |
220 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]], [[CF]]* [[TMP0]], i32 0, i32 1 |
221 | // CHECK-NEXT: [[I:%.*]] = load float, float* [[T0]] |
222 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]], [[CF]]* [[F]], i32 0, i32 0 |
223 | // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[CF]], [[CF]]* [[F]], i32 0, i32 1 |
224 | // CHECK-NEXT: store float [[R]], float* [[T0]] |
225 | // CHECK-NEXT: store float [[I]], float* [[T1]] |
226 | _Complex float f = *fp; |
227 | |
228 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]], [[CF]]* [[F]], i32 0, i32 0 |
229 | // CHECK-NEXT: [[R:%.*]] = load float, float* [[T0]] |
230 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]], [[CF]]* [[F]], i32 0, i32 1 |
231 | // CHECK-NEXT: [[I:%.*]] = load float, float* [[T0]] |
232 | // CHECK-NEXT: [[DEST:%.*]] = load [[CF]]*, [[CF]]** [[FP]], align 4 |
233 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]], [[CF]]* [[TMP1]], i32 0, i32 0 |
234 | // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[CF]], [[CF]]* [[TMP1]], i32 0, i32 1 |
235 | // CHECK-NEXT: store float [[R]], float* [[T0]] |
236 | // CHECK-NEXT: store float [[I]], float* [[T1]] |
237 | // CHECK-NEXT: [[T0:%.*]] = bitcast [[CF]]* [[DEST]] to i8* |
238 | // CHECK-NEXT: [[T1:%.*]] = bitcast [[CF]]* [[TMP1]] to i8* |
239 | // CHECK-NEXT: call arm_aapcscc void @__atomic_store(i32 8, i8* [[T0]], i8* [[T1]], i32 5) |
240 | *fp = f; |
241 | |
242 | // CHECK-NEXT: ret void |
243 | } |
244 | |
245 | typedef struct { short x, y, z, w; } S; |
246 | _Atomic S testStructGlobal = (S){1, 2, 3, 4}; |
247 | // CHECK: define arm_aapcscc void @testStruct([[S:.*]]* |
248 | void testStruct(_Atomic(S) *fp) { |
249 | // CHECK: [[FP:%.*]] = alloca [[S]]*, align 4 |
250 | // CHECK-NEXT: [[X:%.*]] = alloca [[S]], align 8 |
251 | // CHECK-NEXT: [[F:%.*]] = alloca [[S:%.*]], align 2 |
252 | // CHECK-NEXT: [[TMP0:%.*]] = alloca [[S]], align 8 |
253 | // CHECK-NEXT: store [[S]]* |
254 | |
255 | // CHECK-NEXT: [[P:%.*]] = load [[S]]*, [[S]]** [[FP]] |
256 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]], [[S]]* [[P]], i32 0, i32 0 |
257 | // CHECK-NEXT: store i16 1, i16* [[T0]], align 8 |
258 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]], [[S]]* [[P]], i32 0, i32 1 |
259 | // CHECK-NEXT: store i16 2, i16* [[T0]], align 2 |
260 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]], [[S]]* [[P]], i32 0, i32 2 |
261 | // CHECK-NEXT: store i16 3, i16* [[T0]], align 4 |
262 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]], [[S]]* [[P]], i32 0, i32 3 |
263 | // CHECK-NEXT: store i16 4, i16* [[T0]], align 2 |
264 | __c11_atomic_init(fp, (S){1,2,3,4}); |
265 | |
266 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]], [[S]]* [[X]], i32 0, i32 0 |
267 | // CHECK-NEXT: store i16 1, i16* [[T0]], align 8 |
268 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]], [[S]]* [[X]], i32 0, i32 1 |
269 | // CHECK-NEXT: store i16 2, i16* [[T0]], align 2 |
270 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]], [[S]]* [[X]], i32 0, i32 2 |
271 | // CHECK-NEXT: store i16 3, i16* [[T0]], align 4 |
272 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]], [[S]]* [[X]], i32 0, i32 3 |
273 | // CHECK-NEXT: store i16 4, i16* [[T0]], align 2 |
274 | _Atomic(S) x = (S){1,2,3,4}; |
275 | |
276 | // CHECK-NEXT: [[T0:%.*]] = load [[S]]*, [[S]]** [[FP]] |
277 | // CHECK-NEXT: [[T1:%.*]] = bitcast [[S]]* [[T0]] to i8* |
278 | // CHECK-NEXT: [[T2:%.*]] = bitcast [[S]]* [[F]] to i8* |
279 | // CHECK-NEXT: call arm_aapcscc void @__atomic_load(i32 8, i8* [[T1]], i8* [[T2]], i32 5) |
280 | S f = *fp; |
281 | |
282 | // CHECK-NEXT: [[T0:%.*]] = load [[S]]*, [[S]]** [[FP]] |
283 | // CHECK-NEXT: [[T1:%.*]] = bitcast [[S]]* [[TMP0]] to i8* |
284 | // CHECK-NEXT: [[T2:%.*]] = bitcast [[S]]* [[F]] to i8* |
285 | // CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 8 [[T1]], i8* align 2 [[T2]], i32 8, i1 false) |
286 | // CHECK-NEXT: [[T3:%.*]] = bitcast [[S]]* [[T0]] to i8* |
287 | // CHECK-NEXT: [[T4:%.*]] = bitcast [[S]]* [[TMP0]] to i8* |
288 | // CHECK-NEXT: call arm_aapcscc void @__atomic_store(i32 8, i8* [[T3]], i8* [[T4]], i32 5) |
289 | *fp = f; |
290 | |
291 | // CHECK-NEXT: ret void |
292 | } |
293 | |
294 | typedef struct { short x, y, z; } PS; |
295 | _Atomic PS testPromotedStructGlobal = (PS){1, 2, 3}; |
296 | // CHECK: define arm_aapcscc void @testPromotedStruct([[APS:.*]]* |
297 | void testPromotedStruct(_Atomic(PS) *fp) { |
298 | // CHECK: [[FP:%.*]] = alloca [[APS]]*, align 4 |
299 | // CHECK-NEXT: [[X:%.*]] = alloca [[APS]], align 8 |
300 | // CHECK-NEXT: [[F:%.*]] = alloca [[PS:%.*]], align 2 |
301 | // CHECK-NEXT: [[TMP0:%.*]] = alloca [[APS]], align 8 |
302 | // CHECK-NEXT: [[TMP1:%.*]] = alloca [[APS]], align 8 |
303 | // CHECK-NEXT: [[A:%.*]] = alloca i32, align 4 |
304 | // CHECK-NEXT: [[TMP2:%.*]] = alloca %struct.PS, align 2 |
305 | // CHECK-NEXT: [[TMP3:%.*]] = alloca [[APS]], align 8 |
306 | // CHECK-NEXT: store [[APS]]* |
307 | |
308 | // CHECK-NEXT: [[P:%.*]] = load [[APS]]*, [[APS]]** [[FP]] |
309 | // CHECK-NEXT: [[T0:%.*]] = bitcast [[APS]]* [[P]] to i8* |
310 | // CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* align 8 [[T0]], i8 0, i64 8, i1 false) |
311 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[APS]], [[APS]]* [[P]], i32 0, i32 0 |
312 | // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[PS]], [[PS]]* [[T0]], i32 0, i32 0 |
313 | // CHECK-NEXT: store i16 1, i16* [[T1]], align 8 |
314 | // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[PS]], [[PS]]* [[T0]], i32 0, i32 1 |
315 | // CHECK-NEXT: store i16 2, i16* [[T1]], align 2 |
316 | // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[PS]], [[PS]]* [[T0]], i32 0, i32 2 |
317 | // CHECK-NEXT: store i16 3, i16* [[T1]], align 4 |
318 | __c11_atomic_init(fp, (PS){1,2,3}); |
319 | |
320 | // CHECK-NEXT: [[T0:%.*]] = bitcast [[APS]]* [[X]] to i8* |
321 | // CHECK-NEXT: call void @llvm.memset.p0i8.i32(i8* align 8 [[T0]], i8 0, i32 8, i1 false) |
322 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[APS]], [[APS]]* [[X]], i32 0, i32 0 |
323 | // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[PS]], [[PS]]* [[T0]], i32 0, i32 0 |
324 | // CHECK-NEXT: store i16 1, i16* [[T1]], align 8 |
325 | // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[PS]], [[PS]]* [[T0]], i32 0, i32 1 |
326 | // CHECK-NEXT: store i16 2, i16* [[T1]], align 2 |
327 | // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[PS]], [[PS]]* [[T0]], i32 0, i32 2 |
328 | // CHECK-NEXT: store i16 3, i16* [[T1]], align 4 |
329 | _Atomic(PS) x = (PS){1,2,3}; |
330 | |
331 | // CHECK-NEXT: [[T0:%.*]] = load [[APS]]*, [[APS]]** [[FP]] |
332 | // CHECK-NEXT: [[T1:%.*]] = bitcast [[APS]]* [[T0]] to i8* |
333 | // CHECK-NEXT: [[T2:%.*]] = bitcast [[APS]]* [[TMP0]] to i8* |
334 | // CHECK-NEXT: call arm_aapcscc void @__atomic_load(i32 8, i8* [[T1]], i8* [[T2]], i32 5) |
335 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[APS]], [[APS]]* [[TMP0]], i32 0, i32 0 |
336 | // CHECK-NEXT: [[T1:%.*]] = bitcast [[PS]]* [[F]] to i8* |
337 | // CHECK-NEXT: [[T2:%.*]] = bitcast [[PS]]* [[T0]] to i8* |
338 | // CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 2 [[T1]], i8* align 8 [[T2]], i32 6, i1 false) |
339 | PS f = *fp; |
340 | |
341 | // CHECK-NEXT: [[T0:%.*]] = load [[APS]]*, [[APS]]** [[FP]] |
342 | // CHECK-NEXT: [[T1:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[TMP1]] to i8* |
343 | // CHECK-NEXT: call void @llvm.memset.p0i8.i32(i8* align 8 [[T1]], i8 0, i32 8, i1 false) |
344 | // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[APS]], [[APS]]* [[TMP1]], i32 0, i32 0 |
345 | // CHECK-NEXT: [[T2:%.*]] = bitcast [[PS]]* [[T1]] to i8* |
346 | // CHECK-NEXT: [[T3:%.*]] = bitcast [[PS]]* [[F]] to i8* |
347 | // CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 8 [[T2]], i8* align 2 [[T3]], i32 6, i1 false) |
348 | // CHECK-NEXT: [[T4:%.*]] = bitcast [[APS]]* [[T0]] to i8* |
349 | // CHECK-NEXT: [[T5:%.*]] = bitcast [[APS]]* [[TMP1]] to i8* |
350 | // CHECK-NEXT: call arm_aapcscc void @__atomic_store(i32 8, i8* [[T4]], i8* [[T5]], i32 5) |
351 | *fp = f; |
352 | |
353 | // CHECK-NEXT: [[T0:%.*]] = load [[APS]]*, [[APS]]** [[FP]], align 4 |
354 | // CHECK-NEXT: [[T1:%.*]] = bitcast [[APS]]* [[T0]] to i8* |
355 | // CHECK-NEXT: [[T2:%.*]] = bitcast [[APS]]* [[TMP3]] to i8* |
356 | // CHECK-NEXT: call arm_aapcscc void @__atomic_load(i32 8, i8* [[T1]], i8* [[T2]], i32 5) |
357 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[APS]], [[APS]]* [[TMP3]], i32 0, i32 0 |
358 | // CHECK-NEXT: [[T1:%.*]] = bitcast %struct.PS* [[TMP2]] to i8* |
359 | // CHECK-NEXT: [[T2:%.*]] = bitcast %struct.PS* [[T0]] to i8* |
360 | // CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 2 [[T1]], i8* align 8 [[T2]], i32 6, i1 false) |
361 | // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds %struct.PS, %struct.PS* [[TMP2]], i32 0, i32 0 |
362 | // CHECK-NEXT: [[T1:%.*]] = load i16, i16* [[T0]], align 2 |
363 | // CHECK-NEXT: [[T2:%.*]] = sext i16 [[T1]] to i32 |
364 | // CHECK-NEXT: store i32 [[T2]], i32* [[A]], align 4 |
365 | int a = ((PS)*fp).x; |
366 | |
367 | // CHECK-NEXT: ret void |
368 | } |
369 | |
370 | PS test_promoted_load(_Atomic(PS) *addr) { |
371 | // CHECK-LABEL: @test_promoted_load(%struct.PS* noalias sret %agg.result, { %struct.PS, [2 x i8] }* %addr) |
372 | // CHECK: [[ADDR_ARG:%.*]] = alloca { %struct.PS, [2 x i8] }*, align 4 |
373 | // CHECK: [[ATOMIC_RES:%.*]] = alloca { %struct.PS, [2 x i8] }, align 8 |
374 | // CHECK: store { %struct.PS, [2 x i8] }* %addr, { %struct.PS, [2 x i8] }** [[ADDR_ARG]], align 4 |
375 | // CHECK: [[ADDR:%.*]] = load { %struct.PS, [2 x i8] }*, { %struct.PS, [2 x i8] }** [[ADDR_ARG]], align 4 |
376 | // CHECK: [[ADDR64:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[ADDR]] to i64* |
377 | // CHECK: [[ATOMIC_RES64:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[ATOMIC_RES]] to i64* |
378 | // CHECK: [[ADDR8:%.*]] = bitcast i64* [[ADDR64]] to i8* |
379 | // CHECK: [[RES:%.*]] = call arm_aapcscc i64 @__atomic_load_8(i8* [[ADDR8]], i32 5) |
380 | // CHECK: store i64 [[RES]], i64* [[ATOMIC_RES64]], align 8 |
381 | // CHECK: [[ATOMIC_RES_STRUCT:%.*]] = bitcast i64* [[ATOMIC_RES64]] to %struct.PS* |
382 | // CHECK: [[AGG_RESULT8:%.*]] = bitcast %struct.PS* %agg.result to i8* |
383 | // CHECK: [[ATOMIC_RES8:%.*]] = bitcast %struct.PS* [[ATOMIC_RES_STRUCT]] to i8* |
384 | // CHECK: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 2 [[AGG_RESULT8]], i8* align 8 [[ATOMIC_RES8]], i32 6, i1 false) |
385 | |
386 | return __c11_atomic_load(addr, 5); |
387 | } |
388 | |
389 | void test_promoted_store(_Atomic(PS) *addr, PS *val) { |
390 | // CHECK-LABEL: @test_promoted_store({ %struct.PS, [2 x i8] }* %addr, %struct.PS* %val) |
391 | // CHECK: [[ADDR_ARG:%.*]] = alloca { %struct.PS, [2 x i8] }*, align 4 |
392 | // CHECK: [[VAL_ARG:%.*]] = alloca %struct.PS*, align 4 |
393 | // CHECK: [[NONATOMIC_TMP:%.*]] = alloca %struct.PS, align 2 |
394 | // CHECK: [[ATOMIC_VAL:%.*]] = alloca { %struct.PS, [2 x i8] }, align 8 |
395 | // CHECK: store { %struct.PS, [2 x i8] }* %addr, { %struct.PS, [2 x i8] }** [[ADDR_ARG]], align 4 |
396 | // CHECK: store %struct.PS* %val, %struct.PS** [[VAL_ARG]], align 4 |
397 | // CHECK: [[ADDR:%.*]] = load { %struct.PS, [2 x i8] }*, { %struct.PS, [2 x i8] }** [[ADDR_ARG]], align 4 |
398 | // CHECK: [[VAL:%.*]] = load %struct.PS*, %struct.PS** [[VAL_ARG]], align 4 |
399 | // CHECK: [[NONATOMIC_TMP8:%.*]] = bitcast %struct.PS* [[NONATOMIC_TMP]] to i8* |
400 | // CHECK: [[VAL8:%.*]] = bitcast %struct.PS* [[VAL]] to i8* |
401 | // CHECK: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 2 [[NONATOMIC_TMP8]], i8* align 2 [[VAL8]], i32 6, i1 false) |
402 | // CHECK: [[ADDR64:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[ADDR]] to i64* |
403 | // CHECK: [[ATOMIC_VAL8:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[ATOMIC_VAL]] to i8* |
404 | // CHECK: [[NONATOMIC_TMP8:%.*]] = bitcast %struct.PS* [[NONATOMIC_TMP]] to i8* |
405 | // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 8 [[ATOMIC_VAL8]], i8* align 2 [[NONATOMIC_TMP8]], i64 6, i1 false) |
406 | // CHECK: [[ATOMIC_VAL64:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[ATOMIC_VAL]] to i64* |
407 | // CHECK: [[ADDR8:%.*]] = bitcast i64* [[ADDR64]] to i8* |
408 | // CHECK: [[VAL64:%.*]] = load i64, i64* [[ATOMIC_VAL64]], align 2 |
409 | // CHECK: call arm_aapcscc void @__atomic_store_8(i8* [[ADDR8]], i64 [[VAL64]], i32 5) |
410 | __c11_atomic_store(addr, *val, 5); |
411 | } |
412 | |
413 | PS test_promoted_exchange(_Atomic(PS) *addr, PS *val) { |
414 | // CHECK-LABEL: @test_promoted_exchange(%struct.PS* noalias sret %agg.result, { %struct.PS, [2 x i8] }* %addr, %struct.PS* %val) |
415 | // CHECK: [[ADDR_ARG:%.*]] = alloca { %struct.PS, [2 x i8] }*, align 4 |
416 | // CHECK: [[VAL_ARG:%.*]] = alloca %struct.PS*, align 4 |
417 | // CHECK: [[NONATOMIC_TMP:%.*]] = alloca %struct.PS, align 2 |
418 | // CHECK: [[ATOMIC_VAL:%.*]] = alloca { %struct.PS, [2 x i8] }, align 8 |
419 | // CHECK: [[ATOMIC_RES:%.*]] = alloca { %struct.PS, [2 x i8] }, align 8 |
420 | // CHECK: store { %struct.PS, [2 x i8] }* %addr, { %struct.PS, [2 x i8] }** [[ADDR_ARG]], align 4 |
421 | // CHECK: store %struct.PS* %val, %struct.PS** [[VAL_ARG]], align 4 |
422 | // CHECK: [[ADDR:%.*]] = load { %struct.PS, [2 x i8] }*, { %struct.PS, [2 x i8] }** [[ADDR_ARG]], align 4 |
423 | // CHECK: [[VAL:%.*]] = load %struct.PS*, %struct.PS** [[VAL_ARG]], align 4 |
424 | // CHECK: [[NONATOMIC_TMP8:%.*]] = bitcast %struct.PS* [[NONATOMIC_TMP]] to i8* |
425 | // CHECK: [[VAL8:%.*]] = bitcast %struct.PS* [[VAL]] to i8* |
426 | // CHECK: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 2 [[NONATOMIC_TMP8]], i8* align 2 [[VAL8]], i32 6, i1 false) |
427 | // CHECK: [[ADDR64:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[ADDR]] to i64* |
428 | // CHECK: [[ATOMIC_VAL8:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[ATOMIC_VAL]] to i8* |
429 | // CHECK: [[NONATOMIC_TMP8:%.*]] = bitcast %struct.PS* [[NONATOMIC_TMP]] to i8* |
430 | // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 8 [[ATOMIC_VAL8]], i8* align 2 [[NONATOMIC_TMP8]], i64 6, i1 false) |
431 | // CHECK: [[ATOMIC_VAL64:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[ATOMIC_VAL]] to i64* |
432 | // CHECK: [[ATOMIC_RES64:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[ATOMIC_RES]] to i64* |
433 | // CHECK: [[ADDR8:%.*]] = bitcast i64* [[ADDR64]] to i8* |
434 | // CHECK: [[VAL64:%.*]] = load i64, i64* [[ATOMIC_VAL64]], align 2 |
435 | // CHECK: [[RES:%.*]] = call arm_aapcscc i64 @__atomic_exchange_8(i8* [[ADDR8]], i64 [[VAL64]], i32 5) |
436 | // CHECK: store i64 [[RES]], i64* [[ATOMIC_RES64]], align 8 |
437 | // CHECK: [[ATOMIC_RES_STRUCT:%.*]] = bitcast i64* [[ATOMIC_RES64]] to %struct.PS* |
438 | // CHECK: [[AGG_RESULT8:%.*]] = bitcast %struct.PS* %agg.result to i8* |
439 | // CHECK: [[ATOMIC_RES8:%.*]] = bitcast %struct.PS* [[ATOMIC_RES_STRUCT]] to i8* |
440 | // CHECK: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 2 [[AGG_RESULT8]], i8* align 8 [[ATOMIC_RES8]], i32 6, i1 false) |
441 | return __c11_atomic_exchange(addr, *val, 5); |
442 | } |
443 | |
444 | _Bool test_promoted_cmpxchg(_Atomic(PS) *addr, PS *desired, PS *new) { |
445 | // CHECK-LABEL: i1 @test_promoted_cmpxchg({ %struct.PS, [2 x i8] }* %addr, %struct.PS* %desired, %struct.PS* %new) #0 { |
446 | // CHECK: [[ADDR_ARG:%.*]] = alloca { %struct.PS, [2 x i8] }*, align 4 |
447 | // CHECK: [[DESIRED_ARG:%.*]] = alloca %struct.PS*, align 4 |
448 | // CHECK: [[NEW_ARG:%.*]] = alloca %struct.PS*, align 4 |
449 | // CHECK: [[NONATOMIC_TMP:%.*]] = alloca %struct.PS, align 2 |
450 | // CHECK: [[ATOMIC_DESIRED:%.*]] = alloca { %struct.PS, [2 x i8] }, align 8 |
451 | // CHECK: [[ATOMIC_NEW:%.*]] = alloca { %struct.PS, [2 x i8] }, align 8 |
452 | // CHECK: store { %struct.PS, [2 x i8] }* %addr, { %struct.PS, [2 x i8] }** [[ADDR_ARG]], align 4 |
453 | // CHECK: store %struct.PS* %desired, %struct.PS** [[DESIRED_ARG]], align 4 |
454 | // CHECK: store %struct.PS* %new, %struct.PS** [[NEW_ARG]], align 4 |
455 | // CHECK: [[ADDR:%.*]] = load { %struct.PS, [2 x i8] }*, { %struct.PS, [2 x i8] }** [[ADDR_ARG]], align 4 |
456 | // CHECK: [[DESIRED:%.*]]= load %struct.PS*, %struct.PS** [[DESIRED_ARG]], align 4 |
457 | // CHECK: [[NEW:%.*]] = load %struct.PS*, %struct.PS** [[NEW_ARG]], align 4 |
458 | // CHECK: [[NONATOMIC_TMP8:%.*]] = bitcast %struct.PS* [[NONATOMIC_TMP]] to i8* |
459 | // CHECK: [[NEW8:%.*]] = bitcast %struct.PS* [[NEW]] to i8* |
460 | // CHECK: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 2 [[NONATOMIC_TMP8]], i8* align 2 [[NEW8]], i32 6, i1 false) |
461 | // CHECK: [[ADDR64:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[ADDR]] to i64* |
462 | // CHECK: [[ATOMIC_DESIRED8:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[ATOMIC_DESIRED]] to i8* |
463 | // CHECK: [[DESIRED8:%.*]] = bitcast %struct.PS* [[DESIRED]]to i8* |
464 | // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 8 [[ATOMIC_DESIRED8]], i8* align 2 [[DESIRED8]], i64 6, i1 false) |
465 | // CHECK: [[ATOMIC_DESIRED64:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[ATOMIC_DESIRED]] to i64* |
466 | // CHECK: [[ATOMIC_NEW8:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[ATOMIC_NEW]] to i8* |
467 | // CHECK: [[NONATOMIC_TMP8:%.*]] = bitcast %struct.PS* [[NONATOMIC_TMP]] to i8* |
468 | // CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 8 [[ATOMIC_NEW8]], i8* align 2 [[NONATOMIC_TMP8]], i64 6, i1 false) |
469 | // CHECK: [[ATOMIC_NEW64:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[ATOMIC_NEW]] to i64* |
470 | // CHECK: [[ADDR8:%.*]] = bitcast i64* [[ADDR64]] to i8* |
471 | // CHECK: [[ATOMIC_DESIRED8:%.*]] = bitcast i64* [[ATOMIC_DESIRED64]] to i8* |
472 | // CHECK: [[NEW64:%.*]] = load i64, i64* [[ATOMIC_NEW64]], align 2 |
473 | // CHECK: [[RES:%.*]] = call arm_aapcscc zeroext i1 @__atomic_compare_exchange_8(i8* [[ADDR8]], i8* [[ATOMIC_DESIRED8]], i64 [[NEW64]], i32 5, i32 5) |
474 | // CHECK: ret i1 [[RES]] |
475 | return __c11_atomic_compare_exchange_strong(addr, desired, *new, 5, 5); |
476 | } |
477 | |
478 | struct Empty {}; |
479 | |
480 | struct Empty test_empty_struct_load(_Atomic(struct Empty)* empty) { |
481 | // CHECK-LABEL: @test_empty_struct_load( |
482 | // CHECK: call arm_aapcscc zeroext i8 @__atomic_load_1(i8* %{{.*}}, i32 5) |
483 | return __c11_atomic_load(empty, 5); |
484 | } |
485 | |
486 | void test_empty_struct_store(_Atomic(struct Empty)* empty, struct Empty value) { |
487 | // CHECK-LABEL: @test_empty_struct_store( |
488 | // CHECK: call arm_aapcscc void @__atomic_store_1(i8* %{{.*}}, i8 zeroext %{{.*}}, i32 5) |
489 | __c11_atomic_store(empty, value, 5); |
490 | } |
491 | |