1 /*
2  * Distributed under the Boost Software License, Version 1.0.
3  * (See accompanying file LICENSE_1_0.txt or copy at
4  * http://www.boost.org/LICENSE_1_0.txt)
5  *
6  * Copyright (c) 2009 Helge Bahmann
7  * Copyright (c) 2012 Tim Blechmann
8  * Copyright (c) 2014 Andrey Semashev
9  */
10 /*!
11  * \file   atomic/detail/core_arch_ops_gcc_x86.hpp
12  *
13  * This header contains implementation of the \c core_arch_operations template.
14  */
15 
16 #ifndef BOOST_ATOMIC_DETAIL_CORE_ARCH_OPS_GCC_X86_HPP_INCLUDED_
17 #define BOOST_ATOMIC_DETAIL_CORE_ARCH_OPS_GCC_X86_HPP_INCLUDED_
18 
19 #include <cstddef>
20 #include <boost/memory_order.hpp>
21 #include <boost/atomic/detail/config.hpp>
22 #include <boost/atomic/detail/storage_traits.hpp>
23 #include <boost/atomic/detail/core_arch_operations_fwd.hpp>
24 #include <boost/atomic/detail/capabilities.hpp>
25 #if defined(BOOST_ATOMIC_DETAIL_X86_HAS_CMPXCHG8B) || defined(BOOST_ATOMIC_DETAIL_X86_HAS_CMPXCHG16B)
26 #include <boost/cstdint.hpp>
27 #include <boost/atomic/detail/intptr.hpp>
28 #include <boost/atomic/detail/string_ops.hpp>
29 #include <boost/atomic/detail/core_ops_cas_based.hpp>
30 #endif
31 #include <boost/atomic/detail/header.hpp>
32 
33 #ifdef BOOST_HAS_PRAGMA_ONCE
34 #pragma once
35 #endif
36 
37 namespace boost {
38 namespace atomics {
39 namespace detail {
40 
41 struct core_arch_operations_gcc_x86_base
42 {
43     static BOOST_CONSTEXPR_OR_CONST bool full_cas_based = false;
44     static BOOST_CONSTEXPR_OR_CONST bool is_always_lock_free = true;
45 
fence_beforeboost::atomics::detail::core_arch_operations_gcc_x86_base46     static BOOST_FORCEINLINE void fence_before(memory_order order) BOOST_NOEXCEPT
47     {
48         if ((static_cast< unsigned int >(order) & static_cast< unsigned int >(memory_order_release)) != 0u)
49             __asm__ __volatile__ ("" ::: "memory");
50     }
51 
fence_afterboost::atomics::detail::core_arch_operations_gcc_x86_base52     static BOOST_FORCEINLINE void fence_after(memory_order order) BOOST_NOEXCEPT
53     {
54         if ((static_cast< unsigned int >(order) & (static_cast< unsigned int >(memory_order_consume) | static_cast< unsigned int >(memory_order_acquire))) != 0u)
55             __asm__ __volatile__ ("" ::: "memory");
56     }
57 };
58 
59 template< std::size_t Size, bool Signed, bool Interprocess, typename Derived >
60 struct core_arch_operations_gcc_x86 :
61     public core_arch_operations_gcc_x86_base
62 {
63     typedef typename storage_traits< Size >::type storage_type;
64 
65     static BOOST_CONSTEXPR_OR_CONST std::size_t storage_size = Size;
66     static BOOST_CONSTEXPR_OR_CONST std::size_t storage_alignment = Size;
67     static BOOST_CONSTEXPR_OR_CONST bool is_signed = Signed;
68     static BOOST_CONSTEXPR_OR_CONST bool is_interprocess = Interprocess;
69 
storeboost::atomics::detail::core_arch_operations_gcc_x8670     static BOOST_FORCEINLINE void store(storage_type volatile& storage, storage_type v, memory_order order) BOOST_NOEXCEPT
71     {
72         if (order != memory_order_seq_cst)
73         {
74             fence_before(order);
75             storage = v;
76             fence_after(order);
77         }
78         else
79         {
80             Derived::exchange(storage, v, order);
81         }
82     }
83 
loadboost::atomics::detail::core_arch_operations_gcc_x8684     static BOOST_FORCEINLINE storage_type load(storage_type const volatile& storage, memory_order order) BOOST_NOEXCEPT
85     {
86         storage_type v = storage;
87         fence_after(order);
88         return v;
89     }
90 
fetch_subboost::atomics::detail::core_arch_operations_gcc_x8691     static BOOST_FORCEINLINE storage_type fetch_sub(storage_type volatile& storage, storage_type v, memory_order order) BOOST_NOEXCEPT
92     {
93         return Derived::fetch_add(storage, -v, order);
94     }
95 
compare_exchange_weakboost::atomics::detail::core_arch_operations_gcc_x8696     static BOOST_FORCEINLINE bool compare_exchange_weak(
97         storage_type volatile& storage, storage_type& expected, storage_type desired, memory_order success_order, memory_order failure_order) BOOST_NOEXCEPT
98     {
99         return Derived::compare_exchange_strong(storage, expected, desired, success_order, failure_order);
100     }
101 
test_and_setboost::atomics::detail::core_arch_operations_gcc_x86102     static BOOST_FORCEINLINE bool test_and_set(storage_type volatile& storage, memory_order order) BOOST_NOEXCEPT
103     {
104         return !!Derived::exchange(storage, (storage_type)1, order);
105     }
106 
clearboost::atomics::detail::core_arch_operations_gcc_x86107     static BOOST_FORCEINLINE void clear(storage_type volatile& storage, memory_order order) BOOST_NOEXCEPT
108     {
109         store(storage, (storage_type)0, order);
110     }
111 };
112 
113 template< bool Signed, bool Interprocess >
114 struct core_arch_operations< 1u, Signed, Interprocess > :
115     public core_arch_operations_gcc_x86< 1u, Signed, Interprocess, core_arch_operations< 1u, Signed, Interprocess > >
116 {
117     typedef core_arch_operations_gcc_x86< 1u, Signed, Interprocess, core_arch_operations< 1u, Signed, Interprocess > > base_type;
118     typedef typename base_type::storage_type storage_type;
119     typedef typename storage_traits< 4u >::type temp_storage_type;
120 
fetch_addboost::atomics::detail::core_arch_operations121     static BOOST_FORCEINLINE storage_type fetch_add(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
122     {
123         __asm__ __volatile__
124         (
125             "lock; xaddb %0, %1"
126             : "+q" (v), "+m" (storage)
127             :
128             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
129         );
130         return v;
131     }
132 
exchangeboost::atomics::detail::core_arch_operations133     static BOOST_FORCEINLINE storage_type exchange(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
134     {
135         __asm__ __volatile__
136         (
137             "xchgb %0, %1"
138             : "+q" (v), "+m" (storage)
139             :
140             : "memory"
141         );
142         return v;
143     }
144 
compare_exchange_strongboost::atomics::detail::core_arch_operations145     static BOOST_FORCEINLINE bool compare_exchange_strong(
146         storage_type volatile& storage, storage_type& expected, storage_type desired, memory_order, memory_order) BOOST_NOEXCEPT
147     {
148         storage_type previous = expected;
149         bool success;
150 #if defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
151         __asm__ __volatile__
152         (
153             "lock; cmpxchgb %3, %1"
154             : "+a" (previous), "+m" (storage), "=@ccz" (success)
155             : "q" (desired)
156             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
157         );
158 #else // defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
159         __asm__ __volatile__
160         (
161             "lock; cmpxchgb %3, %1\n\t"
162             "sete %2"
163             : "+a" (previous), "+m" (storage), "=q" (success)
164             : "q" (desired)
165             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
166         );
167 #endif // defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
168         expected = previous;
169         return success;
170     }
171 
172 #define BOOST_ATOMIC_DETAIL_CAS_LOOP(op, argument, result)\
173     temp_storage_type new_val;\
174     __asm__ __volatile__\
175     (\
176         ".align 16\n\t"\
177         "1: mov %[arg], %2\n\t"\
178         op " %%al, %b2\n\t"\
179         "lock; cmpxchgb %b2, %[storage]\n\t"\
180         "jne 1b"\
181         : [res] "+a" (result), [storage] "+m" (storage), "=&q" (new_val)\
182         : [arg] "ir" ((temp_storage_type)argument)\
183         : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"\
184     )
185 
fetch_andboost::atomics::detail::core_arch_operations186     static BOOST_FORCEINLINE storage_type fetch_and(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
187     {
188         storage_type res = storage;
189         BOOST_ATOMIC_DETAIL_CAS_LOOP("andb", v, res);
190         return res;
191     }
192 
fetch_orboost::atomics::detail::core_arch_operations193     static BOOST_FORCEINLINE storage_type fetch_or(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
194     {
195         storage_type res = storage;
196         BOOST_ATOMIC_DETAIL_CAS_LOOP("orb", v, res);
197         return res;
198     }
199 
fetch_xorboost::atomics::detail::core_arch_operations200     static BOOST_FORCEINLINE storage_type fetch_xor(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
201     {
202         storage_type res = storage;
203         BOOST_ATOMIC_DETAIL_CAS_LOOP("xorb", v, res);
204         return res;
205     }
206 
207 #undef BOOST_ATOMIC_DETAIL_CAS_LOOP
208 };
209 
210 template< bool Signed, bool Interprocess >
211 struct core_arch_operations< 2u, Signed, Interprocess > :
212     public core_arch_operations_gcc_x86< 2u, Signed, Interprocess, core_arch_operations< 2u, Signed, Interprocess > >
213 {
214     typedef core_arch_operations_gcc_x86< 2u, Signed, Interprocess, core_arch_operations< 2u, Signed, Interprocess > > base_type;
215     typedef typename base_type::storage_type storage_type;
216     typedef typename storage_traits< 4u >::type temp_storage_type;
217 
fetch_addboost::atomics::detail::core_arch_operations218     static BOOST_FORCEINLINE storage_type fetch_add(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
219     {
220         __asm__ __volatile__
221         (
222             "lock; xaddw %0, %1"
223             : "+q" (v), "+m" (storage)
224             :
225             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
226         );
227         return v;
228     }
229 
exchangeboost::atomics::detail::core_arch_operations230     static BOOST_FORCEINLINE storage_type exchange(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
231     {
232         __asm__ __volatile__
233         (
234             "xchgw %0, %1"
235             : "+q" (v), "+m" (storage)
236             :
237             : "memory"
238         );
239         return v;
240     }
241 
compare_exchange_strongboost::atomics::detail::core_arch_operations242     static BOOST_FORCEINLINE bool compare_exchange_strong(
243         storage_type volatile& storage, storage_type& expected, storage_type desired, memory_order, memory_order) BOOST_NOEXCEPT
244     {
245         storage_type previous = expected;
246         bool success;
247 #if defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
248         __asm__ __volatile__
249         (
250             "lock; cmpxchgw %3, %1"
251             : "+a" (previous), "+m" (storage), "=@ccz" (success)
252             : "q" (desired)
253             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
254         );
255 #else // defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
256         __asm__ __volatile__
257         (
258             "lock; cmpxchgw %3, %1\n\t"
259             "sete %2"
260             : "+a" (previous), "+m" (storage), "=q" (success)
261             : "q" (desired)
262             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
263         );
264 #endif // defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
265         expected = previous;
266         return success;
267     }
268 
269 #define BOOST_ATOMIC_DETAIL_CAS_LOOP(op, argument, result)\
270     temp_storage_type new_val;\
271     __asm__ __volatile__\
272     (\
273         ".align 16\n\t"\
274         "1: mov %[arg], %2\n\t"\
275         op " %%ax, %w2\n\t"\
276         "lock; cmpxchgw %w2, %[storage]\n\t"\
277         "jne 1b"\
278         : [res] "+a" (result), [storage] "+m" (storage), "=&q" (new_val)\
279         : [arg] "ir" ((temp_storage_type)argument)\
280         : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"\
281     )
282 
fetch_andboost::atomics::detail::core_arch_operations283     static BOOST_FORCEINLINE storage_type fetch_and(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
284     {
285         storage_type res = storage;
286         BOOST_ATOMIC_DETAIL_CAS_LOOP("andw", v, res);
287         return res;
288     }
289 
fetch_orboost::atomics::detail::core_arch_operations290     static BOOST_FORCEINLINE storage_type fetch_or(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
291     {
292         storage_type res = storage;
293         BOOST_ATOMIC_DETAIL_CAS_LOOP("orw", v, res);
294         return res;
295     }
296 
fetch_xorboost::atomics::detail::core_arch_operations297     static BOOST_FORCEINLINE storage_type fetch_xor(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
298     {
299         storage_type res = storage;
300         BOOST_ATOMIC_DETAIL_CAS_LOOP("xorw", v, res);
301         return res;
302     }
303 
304 #undef BOOST_ATOMIC_DETAIL_CAS_LOOP
305 };
306 
307 template< bool Signed, bool Interprocess >
308 struct core_arch_operations< 4u, Signed, Interprocess > :
309     public core_arch_operations_gcc_x86< 4u, Signed, Interprocess, core_arch_operations< 4u, Signed, Interprocess > >
310 {
311     typedef core_arch_operations_gcc_x86< 4u, Signed, Interprocess, core_arch_operations< 4u, Signed, Interprocess > > base_type;
312     typedef typename base_type::storage_type storage_type;
313 
fetch_addboost::atomics::detail::core_arch_operations314     static BOOST_FORCEINLINE storage_type fetch_add(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
315     {
316         __asm__ __volatile__
317         (
318             "lock; xaddl %0, %1"
319             : "+r" (v), "+m" (storage)
320             :
321             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
322         );
323         return v;
324     }
325 
exchangeboost::atomics::detail::core_arch_operations326     static BOOST_FORCEINLINE storage_type exchange(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
327     {
328         __asm__ __volatile__
329         (
330             "xchgl %0, %1"
331             : "+r" (v), "+m" (storage)
332             :
333             : "memory"
334         );
335         return v;
336     }
337 
compare_exchange_strongboost::atomics::detail::core_arch_operations338     static BOOST_FORCEINLINE bool compare_exchange_strong(
339         storage_type volatile& storage, storage_type& expected, storage_type desired, memory_order, memory_order) BOOST_NOEXCEPT
340     {
341         storage_type previous = expected;
342         bool success;
343 #if defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
344         __asm__ __volatile__
345         (
346             "lock; cmpxchgl %3, %1"
347             : "+a" (previous), "+m" (storage), "=@ccz" (success)
348             : "r" (desired)
349             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
350         );
351 #else // defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
352         __asm__ __volatile__
353         (
354             "lock; cmpxchgl %3, %1\n\t"
355             "sete %2"
356             : "+a" (previous), "+m" (storage), "=q" (success)
357             : "r" (desired)
358             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
359         );
360 #endif // defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
361         expected = previous;
362         return success;
363     }
364 
365 #define BOOST_ATOMIC_DETAIL_CAS_LOOP(op, argument, result)\
366     storage_type new_val;\
367     __asm__ __volatile__\
368     (\
369         ".align 16\n\t"\
370         "1: mov %[arg], %[new_val]\n\t"\
371         op " %%eax, %[new_val]\n\t"\
372         "lock; cmpxchgl %[new_val], %[storage]\n\t"\
373         "jne 1b"\
374         : [res] "+a" (result), [storage] "+m" (storage), [new_val] "=&r" (new_val)\
375         : [arg] "ir" (argument)\
376         : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"\
377     )
378 
fetch_andboost::atomics::detail::core_arch_operations379     static BOOST_FORCEINLINE storage_type fetch_and(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
380     {
381         storage_type res = storage;
382         BOOST_ATOMIC_DETAIL_CAS_LOOP("andl", v, res);
383         return res;
384     }
385 
fetch_orboost::atomics::detail::core_arch_operations386     static BOOST_FORCEINLINE storage_type fetch_or(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
387     {
388         storage_type res = storage;
389         BOOST_ATOMIC_DETAIL_CAS_LOOP("orl", v, res);
390         return res;
391     }
392 
fetch_xorboost::atomics::detail::core_arch_operations393     static BOOST_FORCEINLINE storage_type fetch_xor(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
394     {
395         storage_type res = storage;
396         BOOST_ATOMIC_DETAIL_CAS_LOOP("xorl", v, res);
397         return res;
398     }
399 
400 #undef BOOST_ATOMIC_DETAIL_CAS_LOOP
401 };
402 
403 #if defined(BOOST_ATOMIC_DETAIL_X86_HAS_CMPXCHG8B)
404 
405 // Note: In the 32-bit PIC code guarded with BOOST_ATOMIC_DETAIL_X86_ASM_PRESERVE_EBX below we have to avoid using memory
406 // operand constraints because the compiler may choose to use ebx as the base register for that operand. At least, clang
407 // is known to do that. For this reason we have to pre-compute a pointer to storage and pass it in edi. For the same reason
408 // we cannot save ebx to the stack with a mov instruction, so we use esi as a scratch register and restore it afterwards.
409 // Alternatively, we could push/pop the register to the stack, but exchanging the registers is faster.
410 // The need to pass a pointer in edi is a bit wasteful because normally the memory operand would use a base pointer
411 // with an offset (e.g. `this` + offset). But unfortunately, there seems to be no way around it.
412 
413 template< bool Signed, bool Interprocess >
414 struct gcc_dcas_x86
415 {
416     typedef typename storage_traits< 8u >::type storage_type;
417     typedef uint32_t BOOST_ATOMIC_DETAIL_MAY_ALIAS aliasing_uint32_t;
418 
419     static BOOST_CONSTEXPR_OR_CONST std::size_t storage_size = 8u;
420     static BOOST_CONSTEXPR_OR_CONST std::size_t storage_alignment = 8u;
421     static BOOST_CONSTEXPR_OR_CONST bool is_signed = Signed;
422     static BOOST_CONSTEXPR_OR_CONST bool is_interprocess = Interprocess;
423     static BOOST_CONSTEXPR_OR_CONST bool full_cas_based = true;
424     static BOOST_CONSTEXPR_OR_CONST bool is_always_lock_free = true;
425 
storeboost::atomics::detail::gcc_dcas_x86426     static BOOST_FORCEINLINE void store(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
427     {
428         if (BOOST_LIKELY((((uintptr_t)&storage) & 0x00000007) == 0u))
429         {
430 #if defined(__SSE__)
431             typedef float xmm_t __attribute__((__vector_size__(16)));
432             xmm_t xmm_scratch;
433             __asm__ __volatile__
434             (
435 #if defined(__AVX__)
436                 "vmovq %[value], %[xmm_scratch]\n\t"
437                 "vmovq %[xmm_scratch], %[storage]\n\t"
438 #elif defined(__SSE2__)
439                 "movq %[value], %[xmm_scratch]\n\t"
440                 "movq %[xmm_scratch], %[storage]\n\t"
441 #else
442                 "xorps %[xmm_scratch], %[xmm_scratch]\n\t"
443                 "movlps %[value], %[xmm_scratch]\n\t"
444                 "movlps %[xmm_scratch], %[storage]\n\t"
445 #endif
446                 : [storage] "=m" (storage), [xmm_scratch] "=x" (xmm_scratch)
447                 : [value] "m" (v)
448                 : "memory"
449             );
450 #else
451             __asm__ __volatile__
452             (
453                 "fildll %[value]\n\t"
454                 "fistpll %[storage]\n\t"
455                 : [storage] "=m" (storage)
456                 : [value] "m" (v)
457                 : "memory"
458             );
459 #endif
460         }
461         else
462         {
463 #if defined(BOOST_ATOMIC_DETAIL_X86_ASM_PRESERVE_EBX)
464             __asm__ __volatile__
465             (
466                 "xchgl %%ebx, %%esi\n\t"
467                 "movl %%eax, %%ebx\n\t"
468                 "movl (%[dest]), %%eax\n\t"
469                 "movl 4(%[dest]), %%edx\n\t"
470                 ".align 16\n\t"
471                 "1: lock; cmpxchg8b (%[dest])\n\t"
472                 "jne 1b\n\t"
473                 "xchgl %%ebx, %%esi\n\t"
474                 :
475                 : "a" ((uint32_t)v), "c" ((uint32_t)(v >> 32)), [dest] "D" (&storage)
476                 : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "edx", "memory"
477             );
478 #else // defined(BOOST_ATOMIC_DETAIL_X86_ASM_PRESERVE_EBX)
479             __asm__ __volatile__
480             (
481                 "movl %[dest_lo], %%eax\n\t"
482                 "movl %[dest_hi], %%edx\n\t"
483                 ".align 16\n\t"
484                 "1: lock; cmpxchg8b %[dest_lo]\n\t"
485                 "jne 1b\n\t"
486                 : [dest_lo] "=m" (storage), [dest_hi] "=m" (reinterpret_cast< volatile aliasing_uint32_t* >(&storage)[1])
487                 : [value_lo] "b" ((uint32_t)v), "c" ((uint32_t)(v >> 32))
488                 : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "eax", "edx", "memory"
489             );
490 #endif // defined(BOOST_ATOMIC_DETAIL_X86_ASM_PRESERVE_EBX)
491         }
492     }
493 
loadboost::atomics::detail::gcc_dcas_x86494     static BOOST_FORCEINLINE storage_type load(storage_type const volatile& storage, memory_order) BOOST_NOEXCEPT
495     {
496         storage_type value;
497 
498         if (BOOST_LIKELY((((uintptr_t)&storage) & 0x00000007) == 0u))
499         {
500 #if defined(__SSE__)
501             typedef float xmm_t __attribute__((__vector_size__(16)));
502             xmm_t xmm_scratch;
503             __asm__ __volatile__
504             (
505 #if defined(__AVX__)
506                 "vmovq %[storage], %[xmm_scratch]\n\t"
507                 "vmovq %[xmm_scratch], %[value]\n\t"
508 #elif defined(__SSE2__)
509                 "movq %[storage], %[xmm_scratch]\n\t"
510                 "movq %[xmm_scratch], %[value]\n\t"
511 #else
512                 "xorps %[xmm_scratch], %[xmm_scratch]\n\t"
513                 "movlps %[storage], %[xmm_scratch]\n\t"
514                 "movlps %[xmm_scratch], %[value]\n\t"
515 #endif
516                 : [value] "=m" (value), [xmm_scratch] "=x" (xmm_scratch)
517                 : [storage] "m" (storage)
518                 : "memory"
519             );
520 #else
521             __asm__ __volatile__
522             (
523                 "fildll %[storage]\n\t"
524                 "fistpll %[value]\n\t"
525                 : [value] "=m" (value)
526                 : [storage] "m" (storage)
527                 : "memory"
528             );
529 #endif
530         }
531         else
532         {
533             // Note that despite const qualification cmpxchg8b below may issue a store to the storage. The storage value
534             // will not change, but this prevents the storage to reside in read-only memory.
535 
536 #if defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
537 
538             uint32_t value_bits[2];
539 
540             // We don't care for comparison result here; the previous value will be stored into value anyway.
541             // Also we don't care for ebx and ecx values, they just have to be equal to eax and edx before cmpxchg8b.
542             __asm__ __volatile__
543             (
544                 "movl %%ebx, %%eax\n\t"
545                 "movl %%ecx, %%edx\n\t"
546                 "lock; cmpxchg8b %[storage]\n\t"
547                 : "=&a" (value_bits[0]), "=&d" (value_bits[1])
548                 : [storage] "m" (storage)
549                 : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
550             );
551             BOOST_ATOMIC_DETAIL_MEMCPY(&value, value_bits, sizeof(value));
552 
553 #else // defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
554 
555             // We don't care for comparison result here; the previous value will be stored into value anyway.
556             // Also we don't care for ebx and ecx values, they just have to be equal to eax and edx before cmpxchg8b.
557             __asm__ __volatile__
558             (
559                 "movl %%ebx, %%eax\n\t"
560                 "movl %%ecx, %%edx\n\t"
561                 "lock; cmpxchg8b %[storage]\n\t"
562                 : "=&A" (value)
563                 : [storage] "m" (storage)
564                 : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
565             );
566 
567 #endif // defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
568         }
569 
570         return value;
571     }
572 
compare_exchange_strongboost::atomics::detail::gcc_dcas_x86573     static BOOST_FORCEINLINE bool compare_exchange_strong(
574         storage_type volatile& storage, storage_type& expected, storage_type desired, memory_order, memory_order) BOOST_NOEXCEPT
575     {
576 #if defined(__clang__)
577 
578         // Clang cannot allocate eax:edx register pairs but it has sync intrinsics
579         storage_type old_expected = expected;
580         expected = __sync_val_compare_and_swap(&storage, old_expected, desired);
581         return expected == old_expected;
582 
583 #elif defined(BOOST_ATOMIC_DETAIL_X86_ASM_PRESERVE_EBX)
584 
585         bool success;
586 
587 #if defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
588         __asm__ __volatile__
589         (
590             "xchgl %%ebx, %%esi\n\t"
591             "lock; cmpxchg8b (%[dest])\n\t"
592             "xchgl %%ebx, %%esi\n\t"
593             : "+A" (expected), [success] "=@ccz" (success)
594             : "S" ((uint32_t)desired), "c" ((uint32_t)(desired >> 32)), [dest] "D" (&storage)
595             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
596         );
597 #else // defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
598         __asm__ __volatile__
599         (
600             "xchgl %%ebx, %%esi\n\t"
601             "lock; cmpxchg8b (%[dest])\n\t"
602             "xchgl %%ebx, %%esi\n\t"
603             "sete %[success]\n\t"
604             : "+A" (expected), [success] "=qm" (success)
605             : "S" ((uint32_t)desired), "c" ((uint32_t)(desired >> 32)), [dest] "D" (&storage)
606             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
607         );
608 #endif // defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
609 
610         return success;
611 
612 #else // defined(BOOST_ATOMIC_DETAIL_X86_ASM_PRESERVE_EBX)
613 
614         bool success;
615 
616 #if defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
617         __asm__ __volatile__
618         (
619             "lock; cmpxchg8b %[dest]\n\t"
620             : "+A" (expected), [dest] "+m" (storage), [success] "=@ccz" (success)
621             : "b" ((uint32_t)desired), "c" ((uint32_t)(desired >> 32))
622             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
623         );
624 #else // defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
625         __asm__ __volatile__
626         (
627             "lock; cmpxchg8b %[dest]\n\t"
628             "sete %[success]\n\t"
629             : "+A" (expected), [dest] "+m" (storage), [success] "=qm" (success)
630             : "b" ((uint32_t)desired), "c" ((uint32_t)(desired >> 32))
631             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
632         );
633 #endif // defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
634 
635         return success;
636 
637 #endif // defined(BOOST_ATOMIC_DETAIL_X86_ASM_PRESERVE_EBX)
638     }
639 
compare_exchange_weakboost::atomics::detail::gcc_dcas_x86640     static BOOST_FORCEINLINE bool compare_exchange_weak(
641         storage_type volatile& storage, storage_type& expected, storage_type desired, memory_order success_order, memory_order failure_order) BOOST_NOEXCEPT
642     {
643         return compare_exchange_strong(storage, expected, desired, success_order, failure_order);
644     }
645 
exchangeboost::atomics::detail::gcc_dcas_x86646     static BOOST_FORCEINLINE storage_type exchange(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
647     {
648 #if defined(BOOST_ATOMIC_DETAIL_X86_ASM_PRESERVE_EBX)
649 #if defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
650 
651         uint32_t old_bits[2];
652         __asm__ __volatile__
653         (
654             "xchgl %%ebx, %%esi\n\t"
655             "movl (%[dest]), %%eax\n\t"
656             "movl 4(%[dest]), %%edx\n\t"
657             ".align 16\n\t"
658             "1: lock; cmpxchg8b (%[dest])\n\t"
659             "jne 1b\n\t"
660             "xchgl %%ebx, %%esi\n\t"
661             : "=a" (old_bits[0]), "=d" (old_bits[1])
662             : "S" ((uint32_t)v), "c" ((uint32_t)(v >> 32)), [dest] "D" (&storage)
663             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
664         );
665 
666         storage_type old_value;
667         BOOST_ATOMIC_DETAIL_MEMCPY(&old_value, old_bits, sizeof(old_value));
668         return old_value;
669 
670 #else // defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
671 
672         storage_type old_value;
673         __asm__ __volatile__
674         (
675             "xchgl %%ebx, %%esi\n\t"
676             "movl (%[dest]), %%eax\n\t"
677             "movl 4(%[dest]), %%edx\n\t"
678             ".align 16\n\t"
679             "1: lock; cmpxchg8b (%[dest])\n\t"
680             "jne 1b\n\t"
681             "xchgl %%ebx, %%esi\n\t"
682             : "=A" (old_value)
683             : "S" ((uint32_t)v), "c" ((uint32_t)(v >> 32)), [dest] "D" (&storage)
684             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
685         );
686         return old_value;
687 
688 #endif // defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
689 #else // defined(BOOST_ATOMIC_DETAIL_X86_ASM_PRESERVE_EBX)
690 #if defined(__MINGW32__) && ((__GNUC__+0) * 100 + (__GNUC_MINOR__+0)) < 407
691 
692         // MinGW gcc up to 4.6 has problems with allocating registers in the asm blocks below
693         uint32_t old_bits[2];
694         __asm__ __volatile__
695         (
696             "movl (%[dest]), %%eax\n\t"
697             "movl 4(%[dest]), %%edx\n\t"
698             ".align 16\n\t"
699             "1: lock; cmpxchg8b (%[dest])\n\t"
700             "jne 1b\n\t"
701             : "=&a" (old_bits[0]), "=&d" (old_bits[1])
702             : "b" ((uint32_t)v), "c" ((uint32_t)(v >> 32)), [dest] "DS" (&storage)
703             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
704         );
705 
706         storage_type old_value;
707         BOOST_ATOMIC_DETAIL_MEMCPY(&old_value, old_bits, sizeof(old_value));
708         return old_value;
709 
710 #elif defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
711 
712         uint32_t old_bits[2];
713         __asm__ __volatile__
714         (
715             "movl %[dest_lo], %%eax\n\t"
716             "movl %[dest_hi], %%edx\n\t"
717             ".align 16\n\t"
718             "1: lock; cmpxchg8b %[dest_lo]\n\t"
719             "jne 1b\n\t"
720             : "=&a" (old_bits[0]), "=&d" (old_bits[1]), [dest_lo] "+m" (storage), [dest_hi] "+m" (reinterpret_cast< volatile aliasing_uint32_t* >(&storage)[1])
721             : "b" ((uint32_t)v), "c" ((uint32_t)(v >> 32))
722             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
723         );
724 
725         storage_type old_value;
726         BOOST_ATOMIC_DETAIL_MEMCPY(&old_value, old_bits, sizeof(old_value));
727         return old_value;
728 
729 #else // defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
730 
731         storage_type old_value;
732         __asm__ __volatile__
733         (
734             "movl %[dest_lo], %%eax\n\t"
735             "movl %[dest_hi], %%edx\n\t"
736             ".align 16\n\t"
737             "1: lock; cmpxchg8b %[dest_lo]\n\t"
738             "jne 1b\n\t"
739             : "=&A" (old_value), [dest_lo] "+m" (storage), [dest_hi] "+m" (reinterpret_cast< volatile aliasing_uint32_t* >(&storage)[1])
740             : "b" ((uint32_t)v), "c" ((uint32_t)(v >> 32))
741             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
742         );
743         return old_value;
744 
745 #endif // defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
746 #endif // defined(BOOST_ATOMIC_DETAIL_X86_ASM_PRESERVE_EBX)
747     }
748 };
749 
750 template< bool Signed, bool Interprocess >
751 struct core_arch_operations< 8u, Signed, Interprocess > :
752     public core_operations_cas_based< gcc_dcas_x86< Signed, Interprocess > >
753 {
754 };
755 
756 #elif defined(__x86_64__)
757 
758 template< bool Signed, bool Interprocess >
759 struct core_arch_operations< 8u, Signed, Interprocess > :
760     public core_arch_operations_gcc_x86< 8u, Signed, Interprocess, core_arch_operations< 8u, Signed, Interprocess > >
761 {
762     typedef core_arch_operations_gcc_x86< 8u, Signed, Interprocess, core_arch_operations< 8u, Signed, Interprocess > > base_type;
763     typedef typename base_type::storage_type storage_type;
764 
fetch_addboost::atomics::detail::core_arch_operations765     static BOOST_FORCEINLINE storage_type fetch_add(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
766     {
767         __asm__ __volatile__
768         (
769             "lock; xaddq %0, %1"
770             : "+r" (v), "+m" (storage)
771             :
772             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
773         );
774         return v;
775     }
776 
exchangeboost::atomics::detail::core_arch_operations777     static BOOST_FORCEINLINE storage_type exchange(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
778     {
779         __asm__ __volatile__
780         (
781             "xchgq %0, %1"
782             : "+r" (v), "+m" (storage)
783             :
784             : "memory"
785         );
786         return v;
787     }
788 
compare_exchange_strongboost::atomics::detail::core_arch_operations789     static BOOST_FORCEINLINE bool compare_exchange_strong(
790         storage_type volatile& storage, storage_type& expected, storage_type desired, memory_order, memory_order) BOOST_NOEXCEPT
791     {
792         storage_type previous = expected;
793         bool success;
794 #if defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
795         __asm__ __volatile__
796         (
797             "lock; cmpxchgq %3, %1"
798             : "+a" (previous), "+m" (storage), "=@ccz" (success)
799             : "r" (desired)
800             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
801         );
802 #else // defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
803         __asm__ __volatile__
804         (
805             "lock; cmpxchgq %3, %1\n\t"
806             "sete %2"
807             : "+a" (previous), "+m" (storage), "=q" (success)
808             : "r" (desired)
809             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
810         );
811 #endif // defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
812         expected = previous;
813         return success;
814     }
815 
816 #define BOOST_ATOMIC_DETAIL_CAS_LOOP(op, argument, result)\
817     storage_type new_val;\
818     __asm__ __volatile__\
819     (\
820         ".align 16\n\t"\
821         "1: movq %[arg], %[new_val]\n\t"\
822         op " %%rax, %[new_val]\n\t"\
823         "lock; cmpxchgq %[new_val], %[storage]\n\t"\
824         "jne 1b"\
825         : [res] "+a" (result), [storage] "+m" (storage), [new_val] "=&r" (new_val)\
826         : [arg] "r" (argument)\
827         : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"\
828     )
829 
fetch_andboost::atomics::detail::core_arch_operations830     static BOOST_FORCEINLINE storage_type fetch_and(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
831     {
832         storage_type res = storage;
833         BOOST_ATOMIC_DETAIL_CAS_LOOP("andq", v, res);
834         return res;
835     }
836 
fetch_orboost::atomics::detail::core_arch_operations837     static BOOST_FORCEINLINE storage_type fetch_or(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
838     {
839         storage_type res = storage;
840         BOOST_ATOMIC_DETAIL_CAS_LOOP("orq", v, res);
841         return res;
842     }
843 
fetch_xorboost::atomics::detail::core_arch_operations844     static BOOST_FORCEINLINE storage_type fetch_xor(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
845     {
846         storage_type res = storage;
847         BOOST_ATOMIC_DETAIL_CAS_LOOP("xorq", v, res);
848         return res;
849     }
850 
851 #undef BOOST_ATOMIC_DETAIL_CAS_LOOP
852 };
853 
854 #endif
855 
856 #if defined(BOOST_ATOMIC_DETAIL_X86_HAS_CMPXCHG16B)
857 
858 template< bool Signed, bool Interprocess >
859 struct gcc_dcas_x86_64
860 {
861     typedef typename storage_traits< 16u >::type storage_type;
862     typedef uint64_t BOOST_ATOMIC_DETAIL_MAY_ALIAS aliasing_uint64_t;
863 
864     static BOOST_CONSTEXPR_OR_CONST std::size_t storage_size = 16u;
865     static BOOST_CONSTEXPR_OR_CONST std::size_t storage_alignment = 16u;
866     static BOOST_CONSTEXPR_OR_CONST bool is_signed = Signed;
867     static BOOST_CONSTEXPR_OR_CONST bool is_interprocess = Interprocess;
868     static BOOST_CONSTEXPR_OR_CONST bool full_cas_based = true;
869     static BOOST_CONSTEXPR_OR_CONST bool is_always_lock_free = true;
870 
storeboost::atomics::detail::gcc_dcas_x86_64871     static BOOST_FORCEINLINE void store(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
872     {
873         __asm__ __volatile__
874         (
875             "movq %[dest_lo], %%rax\n\t"
876             "movq %[dest_hi], %%rdx\n\t"
877             ".align 16\n\t"
878             "1: lock; cmpxchg16b %[dest_lo]\n\t"
879             "jne 1b\n\t"
880             : [dest_lo] "=m" (storage), [dest_hi] "=m" (reinterpret_cast< volatile aliasing_uint64_t* >(&storage)[1])
881             : "b" (reinterpret_cast< const aliasing_uint64_t* >(&v)[0]), "c" (reinterpret_cast< const aliasing_uint64_t* >(&v)[1])
882             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "rax", "rdx", "memory"
883         );
884     }
885 
loadboost::atomics::detail::gcc_dcas_x86_64886     static BOOST_FORCEINLINE storage_type load(storage_type const volatile& storage, memory_order) BOOST_NOEXCEPT
887     {
888         // Note that despite const qualification cmpxchg16b below may issue a store to the storage. The storage value
889         // will not change, but this prevents the storage to reside in read-only memory.
890 
891 #if defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
892 
893         uint64_t value_bits[2];
894 
895         // We don't care for comparison result here; the previous value will be stored into value anyway.
896         // Also we don't care for rbx and rcx values, they just have to be equal to rax and rdx before cmpxchg16b.
897         __asm__ __volatile__
898         (
899             "movq %%rbx, %%rax\n\t"
900             "movq %%rcx, %%rdx\n\t"
901             "lock; cmpxchg16b %[storage]\n\t"
902             : "=&a" (value_bits[0]), "=&d" (value_bits[1])
903             : [storage] "m" (storage)
904             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
905         );
906 
907         storage_type value;
908         BOOST_ATOMIC_DETAIL_MEMCPY(&value, value_bits, sizeof(value));
909         return value;
910 
911 #else // defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
912 
913         storage_type value;
914 
915         // We don't care for comparison result here; the previous value will be stored into value anyway.
916         // Also we don't care for rbx and rcx values, they just have to be equal to rax and rdx before cmpxchg16b.
917         __asm__ __volatile__
918         (
919             "movq %%rbx, %%rax\n\t"
920             "movq %%rcx, %%rdx\n\t"
921             "lock; cmpxchg16b %[storage]\n\t"
922             : "=&A" (value)
923             : [storage] "m" (storage)
924             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
925         );
926 
927         return value;
928 
929 #endif // defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
930     }
931 
compare_exchange_strongboost::atomics::detail::gcc_dcas_x86_64932     static BOOST_FORCEINLINE bool compare_exchange_strong(
933         storage_type volatile& storage, storage_type& expected, storage_type desired, memory_order, memory_order) BOOST_NOEXCEPT
934     {
935 #if defined(__clang__)
936 
937         // Clang cannot allocate rax:rdx register pairs but it has sync intrinsics
938         storage_type old_expected = expected;
939         expected = __sync_val_compare_and_swap(&storage, old_expected, desired);
940         return expected == old_expected;
941 
942 #elif defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
943 
944         // Some compilers can't allocate rax:rdx register pair either but also don't support 128-bit __sync_val_compare_and_swap
945         bool success;
946         __asm__ __volatile__
947         (
948             "lock; cmpxchg16b %[dest]\n\t"
949             "sete %[success]\n\t"
950             : [dest] "+m" (storage), "+a" (reinterpret_cast< aliasing_uint64_t* >(&expected)[0]), "+d" (reinterpret_cast< aliasing_uint64_t* >(&expected)[1]), [success] "=q" (success)
951             : "b" (reinterpret_cast< const aliasing_uint64_t* >(&desired)[0]), "c" (reinterpret_cast< const aliasing_uint64_t* >(&desired)[1])
952             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
953         );
954 
955         return success;
956 
957 #else // defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
958 
959         bool success;
960 
961 #if defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
962         __asm__ __volatile__
963         (
964             "lock; cmpxchg16b %[dest]\n\t"
965             : "+A" (expected), [dest] "+m" (storage), "=@ccz" (success)
966             : "b" (reinterpret_cast< const aliasing_uint64_t* >(&desired)[0]), "c" (reinterpret_cast< const aliasing_uint64_t* >(&desired)[1])
967             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
968         );
969 #else // defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
970         __asm__ __volatile__
971         (
972             "lock; cmpxchg16b %[dest]\n\t"
973             "sete %[success]\n\t"
974             : "+A" (expected), [dest] "+m" (storage), [success] "=qm" (success)
975             : "b" (reinterpret_cast< const aliasing_uint64_t* >(&desired)[0]), "c" (reinterpret_cast< const aliasing_uint64_t* >(&desired)[1])
976             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
977         );
978 #endif // defined(BOOST_ATOMIC_DETAIL_ASM_HAS_FLAG_OUTPUTS)
979 
980         return success;
981 
982 #endif // defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
983     }
984 
compare_exchange_weakboost::atomics::detail::gcc_dcas_x86_64985     static BOOST_FORCEINLINE bool compare_exchange_weak(
986         storage_type volatile& storage, storage_type& expected, storage_type desired, memory_order success_order, memory_order failure_order) BOOST_NOEXCEPT
987     {
988         return compare_exchange_strong(storage, expected, desired, success_order, failure_order);
989     }
990 
exchangeboost::atomics::detail::gcc_dcas_x86_64991     static BOOST_FORCEINLINE storage_type exchange(storage_type volatile& storage, storage_type v, memory_order) BOOST_NOEXCEPT
992     {
993 #if defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
994         uint64_t old_bits[2];
995         __asm__ __volatile__
996         (
997             "movq %[dest_lo], %%rax\n\t"
998             "movq %[dest_hi], %%rdx\n\t"
999             ".align 16\n\t"
1000             "1: lock; cmpxchg16b %[dest_lo]\n\t"
1001             "jne 1b\n\t"
1002             : [dest_lo] "+m" (storage), [dest_hi] "+m" (reinterpret_cast< volatile aliasing_uint64_t* >(&storage)[1]), "=&a" (old_bits[0]), "=&d" (old_bits[1])
1003             : "b" (reinterpret_cast< const aliasing_uint64_t* >(&v)[0]), "c" (reinterpret_cast< const aliasing_uint64_t* >(&v)[1])
1004             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
1005         );
1006 
1007         storage_type old_value;
1008         BOOST_ATOMIC_DETAIL_MEMCPY(&old_value, old_bits, sizeof(old_value));
1009         return old_value;
1010 #else // defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
1011         storage_type old_value;
1012         __asm__ __volatile__
1013         (
1014             "movq %[dest_lo], %%rax\n\t"
1015             "movq %[dest_hi], %%rdx\n\t"
1016             ".align 16\n\t"
1017             "1: lock; cmpxchg16b %[dest_lo]\n\t"
1018             "jne 1b\n\t"
1019             : "=&A" (old_value), [dest_lo] "+m" (storage), [dest_hi] "+m" (reinterpret_cast< volatile aliasing_uint64_t* >(&storage)[1])
1020             : "b" (reinterpret_cast< const aliasing_uint64_t* >(&v)[0]), "c" (reinterpret_cast< const aliasing_uint64_t* >(&v)[1])
1021             : BOOST_ATOMIC_DETAIL_ASM_CLOBBER_CC_COMMA "memory"
1022         );
1023 
1024         return old_value;
1025 #endif // defined(BOOST_ATOMIC_DETAIL_X86_NO_ASM_AX_DX_PAIRS)
1026     }
1027 };
1028 
1029 template< bool Signed, bool Interprocess >
1030 struct core_arch_operations< 16u, Signed, Interprocess > :
1031     public core_operations_cas_based< gcc_dcas_x86_64< Signed, Interprocess > >
1032 {
1033 };
1034 
1035 #endif // defined(BOOST_ATOMIC_DETAIL_X86_HAS_CMPXCHG16B)
1036 
1037 } // namespace detail
1038 } // namespace atomics
1039 } // namespace boost
1040 
1041 #include <boost/atomic/detail/footer.hpp>
1042 
1043 #endif // BOOST_ATOMIC_DETAIL_CORE_ARCH_OPS_GCC_X86_HPP_INCLUDED_
1044