// RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp -x c -emit-llvm %s -o - | FileCheck %s
// RUN: %clang_cc1 -fopenmp -x c -triple x86_64-apple-darwin10 -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp -x c -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s
// expected-no-diagnostics
// REQUIRES: x86-registered-target
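// The test body is compiled twice: once directly and once through the
// precompiled header built by the second RUN line; both IR outputs are
// verified against the same patterns below.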
#ifndef HEADER
#define HEADER

_Bool bv, bx;
char cv, cx;
unsigned char ucv, ucx;
short sv, sx;
unsigned short usv, usx;
int iv, ix;
unsigned int uiv, uix;
long lv, lx;
unsigned long ulv, ulx;
long long llv, llx;
unsigned long long ullv, ullx;
float fv, fx;
double dv, dx;
long double ldv, ldx;
_Complex int civ, cix;
_Complex float cfv, cfx;
_Complex double cdv, cdx;

typedef int int4 __attribute__((__vector_size__(16)));
int4 int4x;

struct BitFields {
  int : 32;
  int a : 31;
} bfx;

struct BitFields_packed {
  int : 32;
  int a : 31;
} __attribute__ ((__packed__)) bfx_packed;

struct BitFields2 {
  int : 31;
  int a : 1;
} bfx2;

struct BitFields2_packed {
  int : 31;
  int a : 1;
} __attribute__ ((__packed__)) bfx2_packed;

struct BitFields3 {
  int : 11;
  int a : 14;
} bfx3;

struct BitFields3_packed {
  int : 11;
  int a : 14;
} __attribute__ ((__packed__)) bfx3_packed;

struct BitFields4 {
  short : 16;
  int a: 1;
  long b : 7;
} bfx4;

struct BitFields4_packed {
  short : 16;
  int a: 1;
  long b : 7;
} __attribute__ ((__packed__)) bfx4_packed;
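// Each bit-field layout above is paired with a __packed__ variant; depending
// on the size and alignment of the resulting access, the writes below are
// expected to use either an inline cmpxchg loop or the __atomic_* libcalls.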

typedef float float2 __attribute__((ext_vector_type(2)));
float2 float2x;

// Register "0" is currently an invalid register for global register variables.
// Use "esp" instead of "0".
// register int rix __asm__("0");
register int rix __asm__("esp");
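// main() performs an '#pragma omp atomic write' for each of the declarations
// above; the patterns below verify the IR emitted for every store.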

int main() {
// CHECK: load i8, i8*
// CHECK: store atomic i8
#pragma omp atomic write
  bx = bv;
// CHECK: load i8, i8*
// CHECK: store atomic i8
#pragma omp atomic write
  cx = cv;
// CHECK: load i8, i8*
// CHECK: store atomic i8
#pragma omp atomic write
  ucx = ucv;
// CHECK: load i16, i16*
// CHECK: store atomic i16
#pragma omp atomic write
  sx = sv;
// CHECK: load i16, i16*
// CHECK: store atomic i16
#pragma omp atomic write
  usx = usv;
// CHECK: load i32, i32*
// CHECK: store atomic i32
#pragma omp atomic write
  ix = iv;
// CHECK: load i32, i32*
// CHECK: store atomic i32
#pragma omp atomic write
  uix = uiv;
// CHECK: load i64, i64*
// CHECK: store atomic i64
#pragma omp atomic write
  lx = lv;
// CHECK: load i64, i64*
// CHECK: store atomic i64
#pragma omp atomic write
  ulx = ulv;
// CHECK: load i64, i64*
// CHECK: store atomic i64
#pragma omp atomic write
  llx = llv;
// CHECK: load i64, i64*
// CHECK: store atomic i64
#pragma omp atomic write
  ullx = ullv;
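// float and double targets are stored through a bitcast to a same-width
// integer so a native atomic store can be used.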
// CHECK: load float, float*
// CHECK: bitcast float {{.*}} to i32
// CHECK: store atomic i32 {{.*}}, i32* bitcast (float*
#pragma omp atomic write
  fx = fv;
// CHECK: load double, double*
// CHECK: bitcast double {{.*}} to i64
// CHECK: store atomic i64 {{.*}}, i64* bitcast (double*
#pragma omp atomic write
  dx = dv;
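// long double (x86_fp80) occupies 16 bytes on this target: the temporary is
// zero-filled with memset, the value is stored into it, and the whole slot is
// written back as an atomic i128.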
// CHECK: [[LD:%.+]] = load x86_fp80, x86_fp80*
// CHECK: [[BITCAST:%.+]] = bitcast x86_fp80* [[LDTEMP:%.*]] to i8*
// CHECK: call void @llvm.memset.p0i8.i64(i8* [[BITCAST]], i8 0, i64 16, i32 16, i1 false)
// CHECK: store x86_fp80 [[LD]], x86_fp80* [[LDTEMP]]
// CHECK: [[BITCAST:%.+]] = bitcast x86_fp80* [[LDTEMP:%.*]] to i128*
// CHECK: [[LD:%.+]] = load i128, i128* [[BITCAST]]
// CHECK: store atomic i128 [[LD]], i128* bitcast (x86_fp80*
#pragma omp atomic write
  ldx = ldv;
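// Complex values do not fit a native atomic store and are written through the
// __atomic_store libcall; the seq_cst form additionally calls __kmpc_flush.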
// CHECK: [[REAL_VAL:%.+]] = load i32, i32* getelementptr inbounds ({ i32, i32 }, { i32, i32 }* @{{.*}}, i32 0, i32 0)
// CHECK: [[IMG_VAL:%.+]] = load i32, i32* getelementptr inbounds ({ i32, i32 }, { i32, i32 }* @{{.*}}, i32 0, i32 1)
// CHECK: [[TEMP_REAL_REF:%.+]] = getelementptr inbounds { i32, i32 }, { i32, i32 }* [[TEMP:%.+]], i32 0, i32 0
// CHECK: [[TEMP_IMG_REF:%.+]] = getelementptr inbounds { i32, i32 }, { i32, i32 }* [[TEMP]], i32 0, i32 1
// CHECK: store i32 [[REAL_VAL]], i32* [[TEMP_REAL_REF]]
// CHECK: store i32 [[IMG_VAL]], i32* [[TEMP_IMG_REF]]
// CHECK: [[BITCAST:%.+]] = bitcast { i32, i32 }* [[TEMP]] to i8*
// CHECK: call void @__atomic_store(i64 8, i8* bitcast ({ i32, i32 }* @{{.*}} to i8*), i8* [[BITCAST]], i32 0)
#pragma omp atomic write
  cix = civ;
// CHECK: [[REAL_VAL:%.+]] = load float, float* getelementptr inbounds ({ float, float }, { float, float }* @{{.*}}, i32 0, i32 0)
// CHECK: [[IMG_VAL:%.+]] = load float, float* getelementptr inbounds ({ float, float }, { float, float }* @{{.*}}, i32 0, i32 1)
// CHECK: [[TEMP_REAL_REF:%.+]] = getelementptr inbounds { float, float }, { float, float }* [[TEMP:%.+]], i32 0, i32 0
// CHECK: [[TEMP_IMG_REF:%.+]] = getelementptr inbounds { float, float }, { float, float }* [[TEMP]], i32 0, i32 1
// CHECK: store float [[REAL_VAL]], float* [[TEMP_REAL_REF]]
// CHECK: store float [[IMG_VAL]], float* [[TEMP_IMG_REF]]
// CHECK: [[BITCAST:%.+]] = bitcast { float, float }* [[TEMP]] to i8*
// CHECK: call void @__atomic_store(i64 8, i8* bitcast ({ float, float }* @{{.*}} to i8*), i8* [[BITCAST]], i32 0)
#pragma omp atomic write
  cfx = cfv;
// CHECK: [[REAL_VAL:%.+]] = load double, double* getelementptr inbounds ({ double, double }, { double, double }* @{{.*}}, i32 0, i32 0)
// CHECK: [[IMG_VAL:%.+]] = load double, double* getelementptr inbounds ({ double, double }, { double, double }* @{{.*}}, i32 0, i32 1)
// CHECK: [[TEMP_REAL_REF:%.+]] = getelementptr inbounds { double, double }, { double, double }* [[TEMP:%.+]], i32 0, i32 0
// CHECK: [[TEMP_IMG_REF:%.+]] = getelementptr inbounds { double, double }, { double, double }* [[TEMP]], i32 0, i32 1
// CHECK: store double [[REAL_VAL]], double* [[TEMP_REAL_REF]]
// CHECK: store double [[IMG_VAL]], double* [[TEMP_IMG_REF]]
// CHECK: [[BITCAST:%.+]] = bitcast { double, double }* [[TEMP]] to i8*
// CHECK: call void @__atomic_store(i64 16, i8* bitcast ({ double, double }* @{{.*}} to i8*), i8* [[BITCAST]], i32 5)
// CHECK: call{{.*}} @__kmpc_flush(
#pragma omp atomic seq_cst write
  cdx = cdv;
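// The following cases check that the RHS is first converted to the type of
// the LHS; a 'seq_cst' clause, in any clause order, also emits __kmpc_flush.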
// CHECK: load i8, i8*
// CHECK: store atomic i64
#pragma omp atomic write
  ulx = bv;
// CHECK: load i8, i8*
// CHECK: store atomic i8
#pragma omp atomic write
  bx = cv;
// CHECK: load i8, i8*
// CHECK: store atomic i8
// CHECK: call{{.*}} @__kmpc_flush(
#pragma omp atomic write, seq_cst
  cx = ucv;
// CHECK: load i16, i16*
// CHECK: store atomic i64
#pragma omp atomic write
  ulx = sv;
// CHECK: load i16, i16*
// CHECK: store atomic i64
#pragma omp atomic write
  lx = usv;
// CHECK: load i32, i32*
// CHECK: store atomic i32
// CHECK: call{{.*}} @__kmpc_flush(
#pragma omp atomic seq_cst, write
  uix = iv;
// CHECK: load i32, i32*
// CHECK: store atomic i32
#pragma omp atomic write
  ix = uiv;
// CHECK: load i64, i64*
// CHECK: [[VAL:%.+]] = trunc i64 %{{.*}} to i32
// CHECK: [[TEMP_REAL_REF:%.+]] = getelementptr inbounds { i32, i32 }, { i32, i32 }* [[TEMP:%.+]], i32 0, i32 0
// CHECK: [[TEMP_IMG_REF:%.+]] = getelementptr inbounds { i32, i32 }, { i32, i32 }* [[TEMP]], i32 0, i32 1
// CHECK: store i32 [[VAL]], i32* [[TEMP_REAL_REF]]
// CHECK: store i32 0, i32* [[TEMP_IMG_REF]]
// CHECK: [[BITCAST:%.+]] = bitcast { i32, i32 }* [[TEMP]] to i8*
// CHECK: call void @__atomic_store(i64 8, i8* bitcast ({ i32, i32 }* @{{.+}} to i8*), i8* [[BITCAST]], i32 0)
#pragma omp atomic write
  cix = lv;
// CHECK: load i64, i64*
// CHECK: store atomic i32 %{{.+}}, i32* bitcast (float*
#pragma omp atomic write
  fx = ulv;
// CHECK: load i64, i64*
// CHECK: store atomic i64 %{{.+}}, i64* bitcast (double*
#pragma omp atomic write
  dx = llv;
// CHECK: load i64, i64*
// CHECK: [[VAL:%.+]] = uitofp i64 %{{.+}} to x86_fp80
// CHECK: [[BITCAST:%.+]] = bitcast x86_fp80* [[TEMP:%.+]] to i8*
// CHECK: call void @llvm.memset.p0i8.i64(i8* [[BITCAST]], i8 0, i64 16, i32 16, i1 false)
// CHECK: store x86_fp80 [[VAL]], x86_fp80* [[TEMP]]
// CHECK: [[BITCAST:%.+]] = bitcast x86_fp80* [[TEMP]] to i128*
// CHECK: [[VAL:%.+]] = load i128, i128* [[BITCAST]]
// CHECK: store atomic i128 [[VAL]], i128* bitcast (x86_fp80*
#pragma omp atomic write
  ldx = ullv;
// CHECK: load float, float*
// CHECK: [[VAL:%.+]] = fptosi float %{{.*}} to i32
// CHECK: [[TEMP_REAL_REF:%.+]] = getelementptr inbounds { i32, i32 }, { i32, i32 }* [[TEMP:%.+]], i32 0, i32 0
// CHECK: [[TEMP_IMG_REF:%.+]] = getelementptr inbounds { i32, i32 }, { i32, i32 }* [[TEMP]], i32 0, i32 1
// CHECK: store i32 [[VAL]], i32* [[TEMP_REAL_REF]]
// CHECK: store i32 0, i32* [[TEMP_IMG_REF]]
// CHECK: [[BITCAST:%.+]] = bitcast { i32, i32 }* [[TEMP]] to i8*
// CHECK: call void @__atomic_store(i64 8, i8* bitcast ({ i32, i32 }* @{{.+}} to i8*), i8* [[BITCAST]], i32 0)
#pragma omp atomic write
  cix = fv;
// CHECK: load double, double*
// CHECK: store atomic i16
#pragma omp atomic write
  sx = dv;
// CHECK: load x86_fp80, x86_fp80*
// CHECK: store atomic i8
#pragma omp atomic write
  bx = ldv;
// CHECK: load i32, i32* getelementptr inbounds ({ i32, i32 }, { i32, i32 }* @{{.+}}, i32 0, i32 0)
// CHECK: load i32, i32* getelementptr inbounds ({ i32, i32 }, { i32, i32 }* @{{.+}}, i32 0, i32 1)
// CHECK: icmp ne i32 %{{.+}}, 0
// CHECK: icmp ne i32 %{{.+}}, 0
// CHECK: or i1
// CHECK: store atomic i8
#pragma omp atomic write
  bx = civ;
// CHECK: load float, float* getelementptr inbounds ({ float, float }, { float, float }* @{{.*}}, i32 0, i32 0)
// CHECK: store atomic i16
#pragma omp atomic write
  usx = cfv;
// CHECK: load double, double* getelementptr inbounds ({ double, double }, { double, double }* @{{.+}}, i32 0, i32 0)
// CHECK: store atomic i64
#pragma omp atomic write
  llx = cdv;
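// Writing a single element of a 16-byte vector cannot be done with a plain
// atomic store, so it is lowered to a cmpxchg loop over the whole vector
// viewed as an i128.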
// CHECK-DAG: [[IDX:%.+]] = load i16, i16* @{{.+}}
// CHECK-DAG: load i8, i8*
// CHECK-DAG: [[VEC_ITEM_VAL:%.+]] = zext i1 %{{.+}} to i32
// CHECK: [[I128VAL:%.+]] = load atomic i128, i128* bitcast (<4 x i32>* [[DEST:@.+]] to i128*) monotonic
// CHECK: br label %[[CONT:.+]]
// CHECK: [[CONT]]
// CHECK: [[OLD_I128:%.+]] = phi i128 [ [[I128VAL]], %{{.+}} ], [ [[FAILED_I128_OLD_VAL:%.+]], %[[CONT]] ]
// CHECK: [[BITCAST:%.+]] = bitcast <4 x i32>* [[LDTEMP:%.+]] to i128*
// CHECK: store i128 [[OLD_I128]], i128* [[BITCAST]],
// CHECK: [[VEC_VAL:%.+]] = load <4 x i32>, <4 x i32>* [[LDTEMP]]
// CHECK: [[NEW_VEC_VAL:%.+]] = insertelement <4 x i32> [[VEC_VAL]], i32 [[VEC_ITEM_VAL]], i16 [[IDX]]
// CHECK: store <4 x i32> [[NEW_VEC_VAL]], <4 x i32>* [[LDTEMP]]
// CHECK: [[NEW_I128:%.+]] = load i128, i128* [[BITCAST]]
// CHECK: [[RES:%.+]] = cmpxchg i128* bitcast (<4 x i32>* [[DEST]] to i128*), i128 [[OLD_I128]], i128 [[NEW_I128]] monotonic monotonic
// CHECK: [[FAILED_I128_OLD_VAL:%.+]] = extractvalue { i128, i1 } [[RES]], 0
// CHECK: [[FAIL_SUCCESS:%.+]] = extractvalue { i128, i1 } [[RES]], 1
// CHECK: br i1 [[FAIL_SUCCESS]], label %[[EXIT:.+]], label %[[CONT]]
// CHECK: [[EXIT]]
#pragma omp atomic write
  int4x[sv] = bv;
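// Bit-field writes are read-modify-write: the enclosing storage unit is
// loaded, the field bits are spliced in with and/shl/or, and the result is
// committed via cmpxchg, or via the __atomic_* libcalls when the access is
// presumably too misaligned or oddly sized to be handled inline (e.g. the
// packed 3-byte case further down).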
// CHECK: load x86_fp80, x86_fp80* @{{.+}}
// CHECK: [[NEW_VAL:%.+]] = fptosi x86_fp80 %{{.+}} to i32
// CHECK: [[PREV_VALUE:%.+]] = load atomic i32, i32* bitcast (i8* getelementptr (i8, i8* bitcast (%struct.BitFields* @{{.+}} to i8*), i64 4) to i32*) monotonic
// CHECK: br label %[[CONT:.+]]
// CHECK: [[CONT]]
// CHECK: [[OLD_BF_VALUE:%.+]] = phi i32 [ [[PREV_VALUE]], %[[EXIT]] ], [ [[FAILED_OLD_VAL:%.+]], %[[CONT]] ]
// CHECK: [[BF_VALUE:%.+]] = and i32 [[NEW_VAL]], 2147483647
// CHECK: [[BF_CLEAR:%.+]] = and i32 %{{.+}}, -2147483648
// CHECK: or i32 [[BF_CLEAR]], [[BF_VALUE]]
// CHECK: store i32 %{{.+}}, i32* [[LDTEMP:%.+]]
// CHECK: [[NEW_BF_VALUE:%.+]] = load i32, i32* [[LDTEMP]]
// CHECK: [[RES:%.+]] = cmpxchg i32* bitcast (i8* getelementptr (i8, i8* bitcast (%struct.BitFields* @{{.+}} to i8*), i64 4) to i32*), i32 [[OLD_BF_VALUE]], i32 [[NEW_BF_VALUE]] monotonic monotonic
// CHECK: [[FAILED_OLD_VAL]] = extractvalue { i32, i1 } [[RES]], 0
// CHECK: [[FAIL_SUCCESS:%.+]] = extractvalue { i32, i1 } [[RES]], 1
// CHECK: br i1 [[FAIL_SUCCESS]], label %[[EXIT:.+]], label %[[CONT]]
// CHECK: [[EXIT]]
#pragma omp atomic write
  bfx.a = ldv;
// CHECK: load x86_fp80, x86_fp80* @{{.+}}
// CHECK: [[NEW_VAL:%.+]] = fptosi x86_fp80 %{{.+}} to i32
// CHECK: [[BITCAST:%.+]] = bitcast i32* [[LDTEMP:%.+]] to i8*
// CHECK: call void @__atomic_load(i64 4, i8* getelementptr (i8, i8* bitcast (%struct.BitFields_packed* @{{.+}} to i8*), i64 4), i8* [[BITCAST]], i32 0)
// CHECK: br label %[[CONT:.+]]
// CHECK: [[CONT]]
// CHECK: [[OLD_BF_VALUE:%.+]] = load i32, i32* [[LDTEMP]],
// CHECK: store i32 [[OLD_BF_VALUE]], i32* [[LDTEMP1:%.+]],
// CHECK: [[OLD_BF_VALUE:%.+]] = load i32, i32* [[LDTEMP1]],
// CHECK: [[BF_VALUE:%.+]] = and i32 [[NEW_VAL]], 2147483647
// CHECK: [[BF_CLEAR:%.+]] = and i32 [[OLD_BF_VALUE]], -2147483648
// CHECK: or i32 [[BF_CLEAR]], [[BF_VALUE]]
// CHECK: store i32 %{{.+}}, i32* [[LDTEMP1]]
// CHECK: [[BITCAST_TEMP_OLD_BF_ADDR:%.+]] = bitcast i32* [[LDTEMP]] to i8*
// CHECK: [[BITCAST_TEMP_NEW_BF_ADDR:%.+]] = bitcast i32* [[LDTEMP1]] to i8*
// CHECK: [[FAIL_SUCCESS:%.+]] = call zeroext i1 @__atomic_compare_exchange(i64 4, i8* getelementptr (i8, i8* bitcast (%struct.BitFields_packed* @{{.+}} to i8*), i64 4), i8* [[BITCAST_TEMP_OLD_BF_ADDR]], i8* [[BITCAST_TEMP_NEW_BF_ADDR]], i32 0, i32 0)
// CHECK: br i1 [[FAIL_SUCCESS]], label %[[EXIT:.+]], label %[[CONT]]
// CHECK: [[EXIT]]
#pragma omp atomic write
  bfx_packed.a = ldv;
// CHECK: load x86_fp80, x86_fp80* @{{.+}}
// CHECK: [[NEW_VAL:%.+]] = fptosi x86_fp80 %{{.+}} to i32
// CHECK: [[PREV_VALUE:%.+]] = load atomic i32, i32* getelementptr inbounds (%struct.BitFields2, %struct.BitFields2* @{{.+}}, i32 0, i32 0) monotonic
// CHECK: br label %[[CONT:.+]]
// CHECK: [[CONT]]
// CHECK: [[OLD_BF_VALUE:%.+]] = phi i32 [ [[PREV_VALUE]], %[[EXIT]] ], [ [[FAILED_OLD_VAL:%.+]], %[[CONT]] ]
// CHECK: [[BF_AND:%.+]] = and i32 [[NEW_VAL]], 1
// CHECK: [[BF_VALUE:%.+]] = shl i32 [[BF_AND]], 31
// CHECK: [[BF_CLEAR:%.+]] = and i32 %{{.+}}, 2147483647
// CHECK: or i32 [[BF_CLEAR]], [[BF_VALUE]]
// CHECK: store i32 %{{.+}}, i32* [[LDTEMP:%.+]]
// CHECK: [[NEW_BF_VALUE:%.+]] = load i32, i32* [[LDTEMP]]
// CHECK: [[RES:%.+]] = cmpxchg i32* getelementptr inbounds (%struct.BitFields2, %struct.BitFields2* @{{.+}}, i32 0, i32 0), i32 [[OLD_BF_VALUE]], i32 [[NEW_BF_VALUE]] monotonic monotonic
// CHECK: [[FAILED_OLD_VAL]] = extractvalue { i32, i1 } [[RES]], 0
// CHECK: [[FAIL_SUCCESS:%.+]] = extractvalue { i32, i1 } [[RES]], 1
// CHECK: br i1 [[FAIL_SUCCESS]], label %[[EXIT:.+]], label %[[CONT]]
// CHECK: [[EXIT]]
#pragma omp atomic write
  bfx2.a = ldv;
// CHECK: load x86_fp80, x86_fp80* @{{.+}}
// CHECK: [[NEW_VAL:%.+]] = fptosi x86_fp80 %{{.+}} to i32
// CHECK: [[PREV_VALUE:%.+]] = load atomic i8, i8* getelementptr (i8, i8* bitcast (%struct.BitFields2_packed* @{{.+}} to i8*), i64 3) monotonic
// CHECK: br label %[[CONT:.+]]
// CHECK: [[CONT]]
// CHECK: [[OLD_BF_VALUE:%.+]] = phi i8 [ [[PREV_VALUE]], %[[EXIT]] ], [ [[FAILED_OLD_VAL:%.+]], %[[CONT]] ]
// CHECK: [[TRUNC:%.+]] = trunc i32 [[NEW_VAL]] to i8
// CHECK: [[BF_AND:%.+]] = and i8 [[TRUNC]], 1
// CHECK: [[BF_VALUE:%.+]] = shl i8 [[BF_AND]], 7
// CHECK: [[BF_CLEAR:%.+]] = and i8 %{{.+}}, 127
// CHECK: or i8 [[BF_CLEAR]], [[BF_VALUE]]
// CHECK: store i8 %{{.+}}, i8* [[LDTEMP:%.+]]
// CHECK: [[NEW_BF_VALUE:%.+]] = load i8, i8* [[LDTEMP]]
// CHECK: [[RES:%.+]] = cmpxchg i8* getelementptr (i8, i8* bitcast (%struct.BitFields2_packed* @{{.+}} to i8*), i64 3), i8 [[OLD_BF_VALUE]], i8 [[NEW_BF_VALUE]] monotonic monotonic
// CHECK: [[FAILED_OLD_VAL]] = extractvalue { i8, i1 } [[RES]], 0
// CHECK: [[FAIL_SUCCESS:%.+]] = extractvalue { i8, i1 } [[RES]], 1
// CHECK: br i1 [[FAIL_SUCCESS]], label %[[EXIT:.+]], label %[[CONT]]
// CHECK: [[EXIT]]
#pragma omp atomic write
  bfx2_packed.a = ldv;
// CHECK: load x86_fp80, x86_fp80* @{{.+}}
// CHECK: [[NEW_VAL:%.+]] = fptosi x86_fp80 %{{.+}} to i32
// CHECK: [[PREV_VALUE:%.+]] = load atomic i32, i32* getelementptr inbounds (%struct.BitFields3, %struct.BitFields3* @{{.+}}, i32 0, i32 0) monotonic
// CHECK: br label %[[CONT:.+]]
// CHECK: [[CONT]]
// CHECK: [[OLD_BF_VALUE:%.+]] = phi i32 [ [[PREV_VALUE]], %[[EXIT]] ], [ [[FAILED_OLD_VAL:%.+]], %[[CONT]] ]
// CHECK: [[BF_AND:%.+]] = and i32 [[NEW_VAL]], 16383
// CHECK: [[BF_VALUE:%.+]] = shl i32 [[BF_AND]], 11
// CHECK: [[BF_CLEAR:%.+]] = and i32 %{{.+}}, -33552385
// CHECK: or i32 [[BF_CLEAR]], [[BF_VALUE]]
// CHECK: store i32 %{{.+}}, i32* [[LDTEMP:%.+]]
// CHECK: [[NEW_BF_VALUE:%.+]] = load i32, i32* [[LDTEMP]]
// CHECK: [[RES:%.+]] = cmpxchg i32* getelementptr inbounds (%struct.BitFields3, %struct.BitFields3* @{{.+}}, i32 0, i32 0), i32 [[OLD_BF_VALUE]], i32 [[NEW_BF_VALUE]] monotonic monotonic
// CHECK: [[FAILED_OLD_VAL]] = extractvalue { i32, i1 } [[RES]], 0
// CHECK: [[FAIL_SUCCESS:%.+]] = extractvalue { i32, i1 } [[RES]], 1
// CHECK: br i1 [[FAIL_SUCCESS]], label %[[EXIT:.+]], label %[[CONT]]
// CHECK: [[EXIT]]
#pragma omp atomic write
  bfx3.a = ldv;
// CHECK: load x86_fp80, x86_fp80* @{{.+}}
// CHECK: [[NEW_VAL:%.+]] = fptosi x86_fp80 %{{.+}} to i32
// CHECK: [[LDTEMP:%.+]] = bitcast i32* %{{.+}} to i24*
// CHECK: [[BITCAST:%.+]] = bitcast i24* %{{.+}} to i8*
// CHECK: call void @__atomic_load(i64 3, i8* getelementptr (i8, i8* bitcast (%struct.BitFields3_packed* @{{.+}} to i8*), i64 1), i8* [[BITCAST]], i32 0)
// CHECK: br label %[[CONT:.+]]
// CHECK: [[CONT]]
// CHECK: [[OLD_VAL:%.+]] = load i24, i24* %{{.+}},
// CHECK: store i24 [[OLD_VAL]], i24* [[TEMP:%.+]],
// CHECK: [[TRUNC:%.+]] = trunc i32 [[NEW_VAL]] to i24
// CHECK: [[BF_AND:%.+]] = and i24 [[TRUNC]], 16383
// CHECK: [[BF_VALUE:%.+]] = shl i24 [[BF_AND]], 3
// CHECK: [[BF_CLEAR:%.+]] = and i24 %{{.+}}, -131065
// CHECK: or i24 [[BF_CLEAR]], [[BF_VALUE]]
// CHECK: store i24 %{{.+}}, i24* [[TEMP]]
// CHECK: [[BITCAST_TEMP_OLD_BF_ADDR:%.+]] = bitcast i24* [[LDTEMP]] to i8*
// CHECK: [[BITCAST_TEMP_NEW_BF_ADDR:%.+]] = bitcast i24* [[TEMP]] to i8*
// CHECK: [[FAIL_SUCCESS:%.+]] = call zeroext i1 @__atomic_compare_exchange(i64 3, i8* getelementptr (i8, i8* bitcast (%struct.BitFields3_packed* @{{.+}} to i8*), i64 1), i8* [[BITCAST_TEMP_OLD_BF_ADDR]], i8* [[BITCAST_TEMP_NEW_BF_ADDR]], i32 0, i32 0)
// CHECK: br i1 [[FAIL_SUCCESS]], label %[[EXIT:.+]], label %[[CONT]]
// CHECK: [[EXIT]]
#pragma omp atomic write
  bfx3_packed.a = ldv;
// CHECK: load x86_fp80, x86_fp80* @{{.+}}
// CHECK: [[NEW_VAL:%.+]] = fptosi x86_fp80 %{{.+}} to i32
// CHECK: [[PREV_VALUE:%.+]] = load atomic i64, i64* bitcast (%struct.BitFields4* @{{.+}} to i64*) monotonic
// CHECK: br label %[[CONT:.+]]
// CHECK: [[CONT]]
// CHECK: [[OLD_BF_VALUE:%.+]] = phi i64 [ [[PREV_VALUE]], %[[EXIT]] ], [ [[FAILED_OLD_VAL:%.+]], %[[CONT]] ]
// CHECK: [[ZEXT:%.+]] = zext i32 [[NEW_VAL]] to i64
// CHECK: [[BF_AND:%.+]] = and i64 [[ZEXT]], 1
// CHECK: [[BF_VALUE:%.+]] = shl i64 [[BF_AND]], 16
// CHECK: [[BF_CLEAR:%.+]] = and i64 %{{.+}}, -65537
// CHECK: or i64 [[BF_CLEAR]], [[BF_VALUE]]
// CHECK: store i64 %{{.+}}, i64* [[LDTEMP:%.+]]
// CHECK: [[NEW_BF_VALUE:%.+]] = load i64, i64* [[LDTEMP]]
// CHECK: [[RES:%.+]] = cmpxchg i64* bitcast (%struct.BitFields4* @{{.+}} to i64*), i64 [[OLD_BF_VALUE]], i64 [[NEW_BF_VALUE]] monotonic monotonic
// CHECK: [[FAILED_OLD_VAL]] = extractvalue { i64, i1 } [[RES]], 0
// CHECK: [[FAIL_SUCCESS:%.+]] = extractvalue { i64, i1 } [[RES]], 1
// CHECK: br i1 [[FAIL_SUCCESS]], label %[[EXIT:.+]], label %[[CONT]]
// CHECK: [[EXIT]]
#pragma omp atomic write
  bfx4.a = ldv;
// CHECK: load x86_fp80, x86_fp80* @{{.+}}
// CHECK: [[NEW_VAL:%.+]] = fptosi x86_fp80 %{{.+}} to i32
// CHECK: [[PREV_VALUE:%.+]] = load atomic i8, i8* getelementptr inbounds (%struct.BitFields4_packed, %struct.BitFields4_packed* @{{.+}}, i32 0, i32 0, i64 2) monotonic
// CHECK: br label %[[CONT:.+]]
// CHECK: [[CONT]]
// CHECK: [[OLD_BF_VALUE:%.+]] = phi i8 [ [[PREV_VALUE]], %[[EXIT]] ], [ [[FAILED_OLD_VAL:%.+]], %[[CONT]] ]
// CHECK: [[TRUNC:%.+]] = trunc i32 [[NEW_VAL]] to i8
// CHECK: [[BF_VALUE:%.+]] = and i8 [[TRUNC]], 1
// CHECK: [[BF_CLEAR:%.+]] = and i8 %{{.+}}, -2
// CHECK: or i8 [[BF_CLEAR]], [[BF_VALUE]]
// CHECK: store i8 %{{.+}}, i8* [[LDTEMP:%.+]]
// CHECK: [[NEW_BF_VALUE:%.+]] = load i8, i8* [[LDTEMP]]
// CHECK: [[RES:%.+]] = cmpxchg i8* getelementptr inbounds (%struct.BitFields4_packed, %struct.BitFields4_packed* @{{.+}}, i32 0, i32 0, i64 2), i8 [[OLD_BF_VALUE]], i8 [[NEW_BF_VALUE]] monotonic monotonic
// CHECK: [[FAILED_OLD_VAL]] = extractvalue { i8, i1 } [[RES]], 0
// CHECK: [[FAIL_SUCCESS:%.+]] = extractvalue { i8, i1 } [[RES]], 1
// CHECK: br i1 [[FAIL_SUCCESS]], label %[[EXIT:.+]], label %[[CONT]]
// CHECK: [[EXIT]]
#pragma omp atomic write
  bfx4_packed.a = ldv;
// CHECK: load x86_fp80, x86_fp80* @{{.+}}
// CHECK: [[NEW_VAL:%.+]] = fptosi x86_fp80 %{{.+}} to i64
// CHECK: [[PREV_VALUE:%.+]] = load atomic i64, i64* bitcast (%struct.BitFields4* @{{.+}} to i64*) monotonic
// CHECK: br label %[[CONT:.+]]
// CHECK: [[CONT]]
// CHECK: [[OLD_BF_VALUE:%.+]] = phi i64 [ [[PREV_VALUE]], %[[EXIT]] ], [ [[FAILED_OLD_VAL:%.+]], %[[CONT]] ]
// CHECK: [[BF_AND:%.+]] = and i64 [[NEW_VAL]], 127
// CHECK: [[BF_VALUE:%.+]] = shl i64 [[BF_AND]], 17
// CHECK: [[BF_CLEAR:%.+]] = and i64 %{{.+}}, -16646145
// CHECK: or i64 [[BF_CLEAR]], [[BF_VALUE]]
// CHECK: store i64 %{{.+}}, i64* [[LDTEMP:%.+]]
// CHECK: [[NEW_BF_VALUE:%.+]] = load i64, i64* [[LDTEMP]]
// CHECK: [[RES:%.+]] = cmpxchg i64* bitcast (%struct.BitFields4* @{{.+}} to i64*), i64 [[OLD_BF_VALUE]], i64 [[NEW_BF_VALUE]] monotonic monotonic
// CHECK: [[FAILED_OLD_VAL]] = extractvalue { i64, i1 } [[RES]], 0
// CHECK: [[FAIL_SUCCESS:%.+]] = extractvalue { i64, i1 } [[RES]], 1
// CHECK: br i1 [[FAIL_SUCCESS]], label %[[EXIT:.+]], label %[[CONT]]
// CHECK: [[EXIT]]
#pragma omp atomic write
  bfx4.b = ldv;
// CHECK: load x86_fp80, x86_fp80* @{{.+}}
// CHECK: [[NEW_VAL:%.+]] = fptosi x86_fp80 %{{.+}} to i64
// CHECK: [[PREV_VALUE:%.+]] = load atomic i8, i8* getelementptr inbounds (%struct.BitFields4_packed, %struct.BitFields4_packed* @{{.+}}, i32 0, i32 0, i64 2) monotonic
// CHECK: br label %[[CONT:.+]]
// CHECK: [[CONT]]
// CHECK: [[OLD_BF_VALUE:%.+]] = phi i8 [ [[PREV_VALUE]], %[[EXIT]] ], [ [[FAILED_OLD_VAL:%.+]], %[[CONT]] ]
// CHECK: [[TRUNC:%.+]] = trunc i64 [[NEW_VAL]] to i8
// CHECK: [[BF_AND:%.+]] = and i8 [[TRUNC]], 127
// CHECK: [[BF_VALUE:%.+]] = shl i8 [[BF_AND]], 1
// CHECK: [[BF_CLEAR:%.+]] = and i8 %{{.+}}, 1
// CHECK: or i8 [[BF_CLEAR]], [[BF_VALUE]]
// CHECK: store i8 %{{.+}}, i8* [[LDTEMP:%.+]]
// CHECK: [[NEW_BF_VALUE:%.+]] = load i8, i8* [[LDTEMP]]
// CHECK: [[RES:%.+]] = cmpxchg i8* getelementptr inbounds (%struct.BitFields4_packed, %struct.BitFields4_packed* @{{.+}}, i32 0, i32 0, i64 2), i8 [[OLD_BF_VALUE]], i8 [[NEW_BF_VALUE]] monotonic monotonic
// CHECK: [[FAILED_OLD_VAL]] = extractvalue { i8, i1 } [[RES]], 0
// CHECK: [[FAIL_SUCCESS:%.+]] = extractvalue { i8, i1 } [[RES]], 1
// CHECK: br i1 [[FAIL_SUCCESS]], label %[[EXIT:.+]], label %[[CONT]]
// CHECK: [[EXIT]]
#pragma omp atomic write
  bfx4_packed.b = ldv;
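// An ext_vector element write follows the same scheme: a cmpxchg loop over
// the 8-byte vector, with insertelement updating the selected lane.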
// CHECK: load i64, i64*
// CHECK: [[VEC_ITEM_VAL:%.+]] = uitofp i64 %{{.+}} to float
// CHECK: [[I64VAL:%.+]] = load atomic i64, i64* bitcast (<2 x float>* [[DEST:@.+]] to i64*) monotonic
// CHECK: br label %[[CONT:.+]]
// CHECK: [[CONT]]
// CHECK: [[OLD_I64:%.+]] = phi i64 [ [[I64VAL]], %{{.+}} ], [ [[FAILED_I64_OLD_VAL:%.+]], %[[CONT]] ]
// CHECK: [[BITCAST:%.+]] = bitcast <2 x float>* [[LDTEMP:%.+]] to i64*
// CHECK: store i64 [[OLD_I64]], i64* [[BITCAST]],
// CHECK: [[VEC_VAL:%.+]] = load <2 x float>, <2 x float>* [[LDTEMP]]
// CHECK: [[NEW_VEC_VAL:%.+]] = insertelement <2 x float> [[VEC_VAL]], float [[VEC_ITEM_VAL]], i64 0
// CHECK: store <2 x float> [[NEW_VEC_VAL]], <2 x float>* [[LDTEMP]]
// CHECK: [[NEW_I64:%.+]] = load i64, i64* [[BITCAST]]
// CHECK: [[RES:%.+]] = cmpxchg i64* bitcast (<2 x float>* [[DEST]] to i64*), i64 [[OLD_I64]], i64 [[NEW_I64]] monotonic monotonic
// CHECK: [[FAILED_I64_OLD_VAL:%.+]] = extractvalue { i64, i1 } [[RES]], 0
// CHECK: [[FAIL_SUCCESS:%.+]] = extractvalue { i64, i1 } [[RES]], 1
// CHECK: br i1 [[FAIL_SUCCESS]], label %[[EXIT:.+]], label %[[CONT]]
// CHECK: [[EXIT]]
#pragma omp atomic write
  float2x.x = ulv;
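// The global register variable is read through llvm.read_register, converted
// to double, and stored atomically; the seq_cst clause again emits
// __kmpc_flush.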
// CHECK: call i32 @llvm.read_register.i32(
// CHECK: sitofp i32 %{{.+}} to double
// CHECK: bitcast double %{{.+}} to i64
// CHECK: store atomic i64 %{{.+}}, i64* bitcast (double* @{{.+}} to i64*) seq_cst
// CHECK: call{{.*}} @__kmpc_flush(
#pragma omp atomic write seq_cst
  dv = rix;
  return 0;
}

#endif