Blame - runtime/atomic.h - platform/art

blob: 0faa3c69c6cf292e347fccc586d5fee37699d577 [file] [log] [blame]

Elliott Hughes	5ea047b	2011-09-13 14:38:18 -0700	[diff] [blame]	1	/*
				2	* Copyright (C) 2008 The Android Open Source Project
				3	*
				4	* Licensed under the Apache License, Version 2.0 (the "License");
				5	* you may not use this file except in compliance with the License.
				6	* You may obtain a copy of the License at
				7	*
				8	* http://www.apache.org/licenses/LICENSE-2.0
				9	*
				10	* Unless required by applicable law or agreed to in writing, software
				11	* distributed under the License is distributed on an "AS IS" BASIS,
				12	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
				13	* See the License for the specific language governing permissions and
				14	* limitations under the License.
				15	*/
				16
Brian Carlstrom	fc0e321	2013-07-17 14:40:12 -0700	[diff] [blame]	17	#ifndef ART_RUNTIME_ATOMIC_H_
				18	#define ART_RUNTIME_ATOMIC_H_
Elliott Hughes	5ea047b	2011-09-13 14:38:18 -0700	[diff] [blame]	19
Elliott Hughes	7c6169d	2012-05-02 16:11:48 -0700	[diff] [blame]	20	#include <stdint.h>
Ian Rogers	3e5cf30	2014-05-20 16:40:37 -0700	[diff] [blame]	21	#include <atomic>
Ian Rogers	3e5cf30	2014-05-20 16:40:37 -0700	[diff] [blame]	22	#include <limits>
Ian Rogers	b122a4b	2013-11-19 18:00:50 -0800	[diff] [blame]	23	#include <vector>
Elliott Hughes	7c6169d	2012-05-02 16:11:48 -0700	[diff] [blame]	24
Ian Rogers	a984454	2014-04-21 17:01:02 -0700	[diff] [blame]	25	#include "base/logging.h"
Elliott Hughes	7616005	2012-12-12 16:31:20 -0800	[diff] [blame]	26	#include "base/macros.h"
Elliott Hughes	5ea047b	2011-09-13 14:38:18 -0700	[diff] [blame]	27
				28	namespace art {
				29
Ian Rogers	b122a4b	2013-11-19 18:00:50 -0800	[diff] [blame]	30	class Mutex;
				31
Hans Boehm	3035961	2014-05-21 17:46:23 -0700	[diff] [blame]	32	// QuasiAtomic encapsulates two separate facilities that we are
				33	// trying to move away from: "quasiatomic" 64 bit operations
				34	// and custom memory fences. For the time being, they remain
				35	// exposed. Clients should be converted to use either class Atomic
				36	// below whenever possible, and should eventually use C++11 atomics.
				37	// The two facilities that do not have a good C++11 analog are
				38	// ThreadFenceForConstructor and Atomic::*JavaData.
				39	//
Elliott Hughes	7c6169d	2012-05-02 16:11:48 -0700	[diff] [blame]	40	// NOTE: Two "quasiatomic" operations on the exact same memory address
				41	// are guaranteed to operate atomically with respect to each other,
				42	// but no guarantees are made about quasiatomic operations mixed with
				43	// non-quasiatomic operations on the same address, nor about
				44	// quasiatomic operations that are performed on partially-overlapping
				45	// memory.
Elliott Hughes	7c6169d	2012-05-02 16:11:48 -0700	[diff] [blame]	46	class QuasiAtomic {
Ian Rogers	936b37f	2014-02-14 00:52:24 -0800	[diff] [blame]	47	#if defined(__mips__) && !defined(__LP64__)
Ian Rogers	b122a4b	2013-11-19 18:00:50 -0800	[diff] [blame]	48	static constexpr bool kNeedSwapMutexes = true;
Andreas Gampe	1a5c406	2015-01-15 12:10:47 -0800	[diff] [blame]	49	#elif defined(__mips__) && defined(__LP64__)
				50	// TODO - mips64 still need this for Cas64 ???
				51	static constexpr bool kNeedSwapMutexes = true;
Ian Rogers	b122a4b	2013-11-19 18:00:50 -0800	[diff] [blame]	52	#else
				53	static constexpr bool kNeedSwapMutexes = false;
				54	#endif
				55
Elliott Hughes	7c6169d	2012-05-02 16:11:48 -0700	[diff] [blame]	56	public:
				57	static void Startup();
Elliott Hughes	5ea047b	2011-09-13 14:38:18 -0700	[diff] [blame]	58
Elliott Hughes	7c6169d	2012-05-02 16:11:48 -0700	[diff] [blame]	59	static void Shutdown();
Elliott Hughes	5ea047b	2011-09-13 14:38:18 -0700	[diff] [blame]	60
Ian Rogers	9adbff5	2013-01-23 18:19:03 -0800	[diff] [blame]	61	// Reads the 64-bit value at "addr" without tearing.
Ian Rogers	b122a4b	2013-11-19 18:00:50 -0800	[diff] [blame]	62	static int64_t Read64(volatile const int64_t* addr) {
				63	if (!kNeedSwapMutexes) {
Ian Rogers	a984454	2014-04-21 17:01:02 -0700	[diff] [blame]	64	int64_t value;
				65	#if defined(__LP64__)
				66	value = *addr;
				67	#else
				68	#if defined(__arm__)
				69	#if defined(__ARM_FEATURE_LPAE)
				70	// With LPAE support (such as Cortex-A15) then ldrd is defined not to tear.
				71	__asm__ __volatile__("@ QuasiAtomic::Read64\n"
				72	"ldrd %0, %H0, %1"
				73	: "=r" (value)
				74	: "m" (*addr));
				75	#else
				76	// Exclusive loads are defined not to tear, clearing the exclusive state isn't necessary.
				77	__asm__ __volatile__("@ QuasiAtomic::Read64\n"
				78	"ldrexd %0, %H0, %1"
				79	: "=r" (value)
				80	: "Q" (*addr));
				81	#endif
				82	#elif defined(__i386__)
				83	__asm__ __volatile__(
				84	"movq %1, %0\n"
				85	: "=x" (value)
				86	: "m" (*addr));
				87	#else
				88	LOG(FATAL) << "Unsupported architecture";
				89	#endif
				90	#endif // defined(__LP64__)
				91	return value;
Ian Rogers	b122a4b	2013-11-19 18:00:50 -0800	[diff] [blame]	92	} else {
				93	return SwapMutexRead64(addr);
				94	}
				95	}
Elliott Hughes	7c6169d	2012-05-02 16:11:48 -0700	[diff] [blame]	96
Ian Rogers	9adbff5	2013-01-23 18:19:03 -0800	[diff] [blame]	97	// Writes to the 64-bit value at "addr" without tearing.
Ian Rogers	a984454	2014-04-21 17:01:02 -0700	[diff] [blame]	98	static void Write64(volatile int64_t* addr, int64_t value) {
Ian Rogers	b122a4b	2013-11-19 18:00:50 -0800	[diff] [blame]	99	if (!kNeedSwapMutexes) {
Ian Rogers	a984454	2014-04-21 17:01:02 -0700	[diff] [blame]	100	#if defined(__LP64__)
				101	*addr = value;
				102	#else
				103	#if defined(__arm__)
				104	#if defined(__ARM_FEATURE_LPAE)
				105	// If we know that ARM architecture has LPAE (such as Cortex-A15) strd is defined not to tear.
				106	__asm__ __volatile__("@ QuasiAtomic::Write64\n"
				107	"strd %1, %H1, %0"
				108	: "=m"(*addr)
				109	: "r" (value));
				110	#else
				111	// The write is done as a swap so that the cache-line is in the exclusive state for the store.
				112	int64_t prev;
				113	int status;
				114	do {
				115	__asm__ __volatile__("@ QuasiAtomic::Write64\n"
				116	"ldrexd %0, %H0, %2\n"
				117	"strexd %1, %3, %H3, %2"
				118	: "=&r" (prev), "=&r" (status), "+Q"(*addr)
				119	: "r" (value)
				120	: "cc");
				121	} while (UNLIKELY(status != 0));
				122	#endif
				123	#elif defined(__i386__)
				124	__asm__ __volatile__(
				125	"movq %1, %0"
				126	: "=m" (*addr)
				127	: "x" (value));
				128	#else
				129	LOG(FATAL) << "Unsupported architecture";
				130	#endif
				131	#endif // defined(__LP64__)
Ian Rogers	b122a4b	2013-11-19 18:00:50 -0800	[diff] [blame]	132	} else {
Ian Rogers	a984454	2014-04-21 17:01:02 -0700	[diff] [blame]	133	SwapMutexWrite64(addr, value);
Ian Rogers	b122a4b	2013-11-19 18:00:50 -0800	[diff] [blame]	134	}
				135	}
Ian Rogers	9adbff5	2013-01-23 18:19:03 -0800	[diff] [blame]	136
				137	// Atomically compare the value at "addr" to "old_value", if equal replace it with "new_value"
				138	// and return true. Otherwise, don't swap, and return false.
Hans Boehm	3035961	2014-05-21 17:46:23 -0700	[diff] [blame]	139	// This is fully ordered, i.e. it has C++11 memory_order_seq_cst
				140	// semantics (assuming all other accesses use a mutex if this one does).
				141	// This has "strong" semantics; if it fails then it is guaranteed that
				142	// at some point during the execution of Cas64, *addr was not equal to
				143	// old_value.
Ian Rogers	b122a4b	2013-11-19 18:00:50 -0800	[diff] [blame]	144	static bool Cas64(int64_t old_value, int64_t new_value, volatile int64_t* addr) {
				145	if (!kNeedSwapMutexes) {
				146	return __sync_bool_compare_and_swap(addr, old_value, new_value);
				147	} else {
				148	return SwapMutexCas64(old_value, new_value, addr);
				149	}
				150	}
Ian Rogers	9adbff5	2013-01-23 18:19:03 -0800	[diff] [blame]	151
				152	// Does the architecture provide reasonable atomic long operations or do we fall back on mutexes?
Ian Rogers	b122a4b	2013-11-19 18:00:50 -0800	[diff] [blame]	153	static bool LongAtomicsUseMutexes() {
Ian Rogers	63c5dd0	2014-05-19 22:55:00 -0700	[diff] [blame]	154	return kNeedSwapMutexes;
Ian Rogers	b122a4b	2013-11-19 18:00:50 -0800	[diff] [blame]	155	}
				156
Hans Boehm	a1ec065	2014-06-06 17:13:03 -0700	[diff] [blame]	157	static void ThreadFenceAcquire() {
Hans Boehm	3035961	2014-05-21 17:46:23 -0700	[diff] [blame]	158	std::atomic_thread_fence(std::memory_order_acquire);
				159	}
				160
Hans Boehm	a1ec065	2014-06-06 17:13:03 -0700	[diff] [blame]	161	static void ThreadFenceRelease() {
Hans Boehm	3035961	2014-05-21 17:46:23 -0700	[diff] [blame]	162	std::atomic_thread_fence(std::memory_order_release);
				163	}
				164
				165	static void ThreadFenceForConstructor() {
				166	#if defined(__aarch64__)
				167	__asm__ __volatile__("dmb ishst" : : : "memory");
				168	#else
				169	std::atomic_thread_fence(std::memory_order_release);
				170	#endif
				171	}
				172
				173	static void ThreadFenceSequentiallyConsistent() {
				174	std::atomic_thread_fence(std::memory_order_seq_cst);
				175	}
				176
Elliott Hughes	7c6169d	2012-05-02 16:11:48 -0700	[diff] [blame]	177	private:
Ian Rogers	b122a4b	2013-11-19 18:00:50 -0800	[diff] [blame]	178	static Mutex* GetSwapMutex(const volatile int64_t* addr);
				179	static int64_t SwapMutexRead64(volatile const int64_t* addr);
				180	static void SwapMutexWrite64(volatile int64_t* addr, int64_t val);
				181	static bool SwapMutexCas64(int64_t old_value, int64_t new_value, volatile int64_t* addr);
				182
				183	// We stripe across a bunch of different mutexes to reduce contention.
				184	static constexpr size_t kSwapMutexCount = 32;
				185	static std::vector<Mutex> gSwapMutexes;
				186
Elliott Hughes	7c6169d	2012-05-02 16:11:48 -0700	[diff] [blame]	187	DISALLOW_COPY_AND_ASSIGN(QuasiAtomic);
				188	};
Elliott Hughes	5ea047b	2011-09-13 14:38:18 -0700	[diff] [blame]	189
Hans Boehm	3035961	2014-05-21 17:46:23 -0700	[diff] [blame]	190	template<typename T>
Dan Albert	aab0f86	2014-08-11 16:38:02 -0700	[diff] [blame]	191	class PACKED(sizeof(T)) Atomic : public std::atomic<T> {
Hans Boehm	3035961	2014-05-21 17:46:23 -0700	[diff] [blame]	192	public:
Dan Albert	6a3f8d9	2014-08-12 11:48:34 -0700	[diff] [blame]	193	Atomic<T>() : std::atomic<T>(0) { }
Hans Boehm	3035961	2014-05-21 17:46:23 -0700	[diff] [blame]	194
				195	explicit Atomic<T>(T value) : std::atomic<T>(value) { }
				196
				197	// Load from memory without ordering or synchronization constraints.
				198	T LoadRelaxed() const {
				199	return this->load(std::memory_order_relaxed);
				200	}
				201
Calin Juravle	4d77b6a	2015-12-01 18:38:09 +0000	[diff] [blame]	202	// Load from memory with acquire ordering.
				203	T LoadAcquire() const {
				204	return this->load(std::memory_order_acquire);
				205	}
				206
Hans Boehm	3035961	2014-05-21 17:46:23 -0700	[diff] [blame]	207	// Word tearing allowed, but may race.
				208	// TODO: Optimize?
				209	// There has been some discussion of eventually disallowing word
				210	// tearing for Java data loads.
				211	T LoadJavaData() const {
				212	return this->load(std::memory_order_relaxed);
				213	}
				214
				215	// Load from memory with a total ordering.
				216	// Corresponds exactly to a Java volatile load.
				217	T LoadSequentiallyConsistent() const {
				218	return this->load(std::memory_order_seq_cst);
				219	}
				220
				221	// Store to memory without ordering or synchronization constraints.
				222	void StoreRelaxed(T desired) {
				223	this->store(desired, std::memory_order_relaxed);
				224	}
				225
				226	// Word tearing allowed, but may race.
				227	void StoreJavaData(T desired) {
				228	this->store(desired, std::memory_order_relaxed);
				229	}
				230
				231	// Store to memory with release ordering.
				232	void StoreRelease(T desired) {
				233	this->store(desired, std::memory_order_release);
				234	}
				235
				236	// Store to memory with a total ordering.
				237	void StoreSequentiallyConsistent(T desired) {
				238	this->store(desired, std::memory_order_seq_cst);
				239	}
				240
				241	// Atomically replace the value with desired value if it matches the expected value.
				242	// Participates in total ordering of atomic operations.
				243	bool CompareExchangeStrongSequentiallyConsistent(T expected_value, T desired_value) {
				244	return this->compare_exchange_strong(expected_value, desired_value, std::memory_order_seq_cst);
				245	}
				246
				247	// The same, except it may fail spuriously.
				248	bool CompareExchangeWeakSequentiallyConsistent(T expected_value, T desired_value) {
				249	return this->compare_exchange_weak(expected_value, desired_value, std::memory_order_seq_cst);
				250	}
				251
				252	// Atomically replace the value with desired value if it matches the expected value. Doesn't
				253	// imply ordering or synchronization constraints.
				254	bool CompareExchangeStrongRelaxed(T expected_value, T desired_value) {
				255	return this->compare_exchange_strong(expected_value, desired_value, std::memory_order_relaxed);
				256	}
				257
				258	// The same, except it may fail spuriously.
				259	bool CompareExchangeWeakRelaxed(T expected_value, T desired_value) {
				260	return this->compare_exchange_weak(expected_value, desired_value, std::memory_order_relaxed);
				261	}
				262
				263	// Atomically replace the value with desired value if it matches the expected value. Prior writes
				264	// made to other memory locations by the thread that did the release become visible in this
				265	// thread.
				266	bool CompareExchangeWeakAcquire(T expected_value, T desired_value) {
				267	return this->compare_exchange_weak(expected_value, desired_value, std::memory_order_acquire);
				268	}
				269
				270	// Atomically replace the value with desired value if it matches the expected value. prior writes
				271	// to other memory locations become visible to the threads that do a consume or an acquire on the
				272	// same location.
				273	bool CompareExchangeWeakRelease(T expected_value, T desired_value) {
				274	return this->compare_exchange_weak(expected_value, desired_value, std::memory_order_release);
				275	}
				276
				277	T FetchAndAddSequentiallyConsistent(const T value) {
				278	return this->fetch_add(value, std::memory_order_seq_cst); // Return old_value.
				279	}
				280
				281	T FetchAndSubSequentiallyConsistent(const T value) {
				282	return this->fetch_sub(value, std::memory_order_seq_cst); // Return old value.
				283	}
				284
Ian Rogers	8c1b5f7	2014-07-09 22:02:36 -0700	[diff] [blame]	285	T FetchAndOrSequentiallyConsistent(const T value) {
				286	return this->fetch_or(value, std::memory_order_seq_cst); // Return old_value.
				287	}
				288
				289	T FetchAndAndSequentiallyConsistent(const T value) {
				290	return this->fetch_and(value, std::memory_order_seq_cst); // Return old_value.
				291	}
				292
Hans Boehm	3035961	2014-05-21 17:46:23 -0700	[diff] [blame]	293	volatile T* Address() {
				294	return reinterpret_cast<T*>(this);
				295	}
				296
				297	static T MaxValue() {
				298	return std::numeric_limits<T>::max();
				299	}
Hans Boehm	3035961	2014-05-21 17:46:23 -0700	[diff] [blame]	300	};
				301
Hans Boehm	3035961	2014-05-21 17:46:23 -0700	[diff] [blame]	302	typedef Atomic<int32_t> AtomicInteger;
				303
Andreas Gampe	575e78c	2014-11-03 23:41:03 -0800	[diff] [blame]	304	static_assert(sizeof(AtomicInteger) == sizeof(int32_t), "Weird AtomicInteger size");
				305	static_assert(alignof(AtomicInteger) == alignof(int32_t),
				306	"AtomicInteger alignment differs from that of underlyingtype");
				307	static_assert(sizeof(Atomic<int64_t>) == sizeof(int64_t), "Weird Atomic<int64> size");
Dan Albert	aab0f86	2014-08-11 16:38:02 -0700	[diff] [blame]	308
				309	// Assert the alignment of 64-bit integers is 64-bit. This isn't true on certain 32-bit
				310	// architectures (e.g. x86-32) but we know that 64-bit integers here are arranged to be 8-byte
				311	// aligned.
Hans Boehm	2f4a2ed	2014-06-06 18:17:43 -0700	[diff] [blame]	312	#if defined(__LP64__)
Andreas Gampe	575e78c	2014-11-03 23:41:03 -0800	[diff] [blame]	313	static_assert(alignof(Atomic<int64_t>) == alignof(int64_t),
				314	"Atomic<int64> alignment differs from that of underlying type");
Hans Boehm	2f4a2ed	2014-06-06 18:17:43 -0700	[diff] [blame]	315	#endif
Ian Rogers	3e5cf30	2014-05-20 16:40:37 -0700	[diff] [blame]	316
Elliott Hughes	5ea047b	2011-09-13 14:38:18 -0700	[diff] [blame]	317	} // namespace art
				318
Brian Carlstrom	fc0e321	2013-07-17 14:40:12 -0700	[diff] [blame]	319	#endif // ART_RUNTIME_ATOMIC_H_