Blame - lib/percpu-refcount.c - kernel/msm-4.9

blob: 5a6d43baccc52782ca50436113d075ada9a08f84 [file] [log] [blame]

Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	1	#define pr_fmt(fmt) "%s: " fmt "\n", __func__
				2
				3	#include <linux/kernel.h>
Tejun Heo	490c79a	2014-09-24 13:31:49 -0400	[diff] [blame]	4	#include <linux/sched.h>
				5	#include <linux/wait.h>
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	6	#include <linux/percpu-refcount.h>
				7
				8	/*
				9	* Initially, a percpu refcount is just a set of percpu counters. Initially, we
				10	* don't try to detect the ref hitting 0 - which means that get/put can just
				11	* increment or decrement the local counter. Note that the counter on a
				12	* particular cpu can (and will) wrap - this is fine, when we go to shutdown the
				13	* percpu counters will all sum to the correct value
				14	*
				15	* (More precisely: because moduler arithmatic is commutative the sum of all the
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	16	* percpu_count vars will be equal to what it would have been if all the gets
				17	* and puts were done to a single integer, even if some of the percpu integers
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	18	* overflow or underflow).
				19	*
				20	* The real trick to implementing percpu refcounts is shutdown. We can't detect
				21	* the ref hitting 0 on every put - this would require global synchronization
				22	* and defeat the whole purpose of using percpu refs.
				23	*
				24	* What we do is require the user to keep track of the initial refcount; we know
				25	* the ref can't hit 0 before the user drops the initial ref, so as long as we
				26	* convert to non percpu mode before the initial ref is dropped everything
				27	* works.
				28	*
				29	* Converting to non percpu mode is done with some RCUish stuff in
Tejun Heo	e625305	2014-09-20 01:27:25 -0400	[diff] [blame]	30	* percpu_ref_kill. Additionally, we need a bias value so that the
				31	* atomic_long_t can't hit 0 before we've added up all the percpu refs.
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	32	*/
				33
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	34	#define PERCPU_COUNT_BIAS (1LU << (BITS_PER_LONG - 1))
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	35
Tejun Heo	490c79a	2014-09-24 13:31:49 -0400	[diff] [blame]	36	static DECLARE_WAIT_QUEUE_HEAD(percpu_ref_switch_waitq);
				37
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	38	static unsigned long __percpu percpu_count_ptr(struct percpu_ref ref)
Tejun Heo	eae7975	2014-06-28 08:10:13 -0400	[diff] [blame]	39	{
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	40	return (unsigned long __percpu *)
Tejun Heo	27344a9	2014-09-24 13:31:49 -0400	[diff] [blame]	41	(ref->percpu_count_ptr & ~__PERCPU_REF_ATOMIC_DEAD);
Tejun Heo	eae7975	2014-06-28 08:10:13 -0400	[diff] [blame]	42	}
				43
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	44	/**
				45	* percpu_ref_init - initialize a percpu refcount
Tejun Heo	ac89906	2013-06-12 20:43:06 -0700	[diff] [blame]	46	* @ref: percpu_ref to initialize
				47	* @release: function which will be called when refcount hits 0
Tejun Heo	a34375e	2014-09-08 09:51:30 +0900	[diff] [blame]	48	* @gfp: allocation mask to use
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	49	*
				50	* Initializes the refcount in single atomic counter mode with a refcount of 1;
Tejun Heo	e625305	2014-09-20 01:27:25 -0400	[diff] [blame]	51	* analagous to atomic_long_set(ref, 1).
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	52	*
				53	* Note that @release must not sleep - it may potentially be called from RCU
				54	* callback context by percpu_ref_kill().
				55	*/
Tejun Heo	a34375e	2014-09-08 09:51:30 +0900	[diff] [blame]	56	int percpu_ref_init(struct percpu_ref ref, percpu_ref_func_t release,
				57	gfp_t gfp)
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	58	{
Tejun Heo	27344a9	2014-09-24 13:31:49 -0400	[diff] [blame]	59	size_t align = max_t(size_t, 1 << __PERCPU_REF_FLAG_BITS,
				60	__alignof__(unsigned long));
				61
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	62	atomic_long_set(&ref->count, 1 + PERCPU_COUNT_BIAS);
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	63
Tejun Heo	27344a9	2014-09-24 13:31:49 -0400	[diff] [blame]	64	ref->percpu_count_ptr = (unsigned long)
				65	__alloc_percpu_gfp(sizeof(unsigned long), align, gfp);
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	66	if (!ref->percpu_count_ptr)
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	67	return -ENOMEM;
				68
				69	ref->release = release;
				70	return 0;
				71	}
Matias Bjorling	5e9dd37	2013-10-16 13:47:01 -0700	[diff] [blame]	72	EXPORT_SYMBOL_GPL(percpu_ref_init);
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	73
Tejun Heo	bc497bd	2013-06-12 20:52:35 -0700	[diff] [blame]	74	/**
Tejun Heo	9a1049d	2014-06-28 08:10:14 -0400	[diff] [blame]	75	* percpu_ref_exit - undo percpu_ref_init()
				76	* @ref: percpu_ref to exit
Tejun Heo	bc497bd	2013-06-12 20:52:35 -0700	[diff] [blame]	77	*
Tejun Heo	9a1049d	2014-06-28 08:10:14 -0400	[diff] [blame]	78	* This function exits @ref. The caller is responsible for ensuring that
				79	* @ref is no longer in active use. The usual places to invoke this
				80	* function from are the @ref->release() callback or in init failure path
				81	* where percpu_ref_init() succeeded but other parts of the initialization
				82	* of the embedding object failed.
Tejun Heo	bc497bd	2013-06-12 20:52:35 -0700	[diff] [blame]	83	*/
Tejun Heo	9a1049d	2014-06-28 08:10:14 -0400	[diff] [blame]	84	void percpu_ref_exit(struct percpu_ref *ref)
Tejun Heo	bc497bd	2013-06-12 20:52:35 -0700	[diff] [blame]	85	{
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	86	unsigned long __percpu *percpu_count = percpu_count_ptr(ref);
Tejun Heo	bc497bd	2013-06-12 20:52:35 -0700	[diff] [blame]	87
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	88	if (percpu_count) {
				89	free_percpu(percpu_count);
Tejun Heo	27344a9	2014-09-24 13:31:49 -0400	[diff] [blame]	90	ref->percpu_count_ptr = __PERCPU_REF_ATOMIC_DEAD;
Tejun Heo	bc497bd	2013-06-12 20:52:35 -0700	[diff] [blame]	91	}
				92	}
Tejun Heo	9a1049d	2014-06-28 08:10:14 -0400	[diff] [blame]	93	EXPORT_SYMBOL_GPL(percpu_ref_exit);
Tejun Heo	bc497bd	2013-06-12 20:52:35 -0700	[diff] [blame]	94
Tejun Heo	490c79a	2014-09-24 13:31:49 -0400	[diff] [blame]	95	static void percpu_ref_call_confirm_rcu(struct rcu_head *rcu)
				96	{
				97	struct percpu_ref *ref = container_of(rcu, struct percpu_ref, rcu);
				98
				99	ref->confirm_switch(ref);
				100	ref->confirm_switch = NULL;
				101	wake_up_all(&percpu_ref_switch_waitq);
				102
				103	/* drop ref from percpu_ref_switch_to_atomic() */
				104	percpu_ref_put(ref);
				105	}
				106
				107	static void percpu_ref_switch_to_atomic_rcu(struct rcu_head *rcu)
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	108	{
				109	struct percpu_ref *ref = container_of(rcu, struct percpu_ref, rcu);
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	110	unsigned long __percpu *percpu_count = percpu_count_ptr(ref);
Tejun Heo	e625305	2014-09-20 01:27:25 -0400	[diff] [blame]	111	unsigned long count = 0;
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	112	int cpu;
				113
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	114	for_each_possible_cpu(cpu)
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	115	count += *per_cpu_ptr(percpu_count, cpu);
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	116
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	117	pr_debug("global %ld percpu %ld",
Tejun Heo	e625305	2014-09-20 01:27:25 -0400	[diff] [blame]	118	atomic_long_read(&ref->count), (long)count);
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	119
				120	/*
				121	* It's crucial that we sum the percpu counters _before_ adding the sum
				122	* to &ref->count; since gets could be happening on one cpu while puts
				123	* happen on another, adding a single cpu's count could cause
				124	* @ref->count to hit 0 before we've got a consistent value - but the
				125	* sum of all the counts will be consistent and correct.
				126	*
				127	* Subtracting the bias value then has to happen _after_ adding count to
				128	* &ref->count; we need the bias value to prevent &ref->count from
				129	* reaching 0 before we add the percpu counts. But doing it at the same
				130	* time is equivalent and saves us atomic operations:
				131	*/
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	132	atomic_long_add((long)count - PERCPU_COUNT_BIAS, &ref->count);
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	133
Tejun Heo	e625305	2014-09-20 01:27:25 -0400	[diff] [blame]	134	WARN_ONCE(atomic_long_read(&ref->count) <= 0,
Tejun Heo	490c79a	2014-09-24 13:31:49 -0400	[diff] [blame]	135	"percpu ref (%pf) <= 0 (%ld) after switching to atomic",
Tejun Heo	e625305	2014-09-20 01:27:25 -0400	[diff] [blame]	136	ref->release, atomic_long_read(&ref->count));
Kent Overstreet	687b0ad	2014-01-06 13:13:26 -0800	[diff] [blame]	137
Tejun Heo	490c79a	2014-09-24 13:31:49 -0400	[diff] [blame]	138	/* @ref is viewed as dead on all CPUs, send out switch confirmation */
				139	percpu_ref_call_confirm_rcu(rcu);
				140	}
Tejun Heo	dbece3a	2013-06-13 19:23:53 -0700	[diff] [blame]	141
Tejun Heo	490c79a	2014-09-24 13:31:49 -0400	[diff] [blame]	142	static void percpu_ref_noop_confirm_switch(struct percpu_ref *ref)
				143	{
				144	}
				145
				146	static void __percpu_ref_switch_to_atomic(struct percpu_ref *ref,
				147	percpu_ref_func_t *confirm_switch)
				148	{
				149	if (!(ref->percpu_count_ptr & __PERCPU_REF_ATOMIC)) {
				150	/* switching from percpu to atomic */
				151	ref->percpu_count_ptr \|= __PERCPU_REF_ATOMIC;
				152
				153	/*
				154	* Non-NULL ->confirm_switch is used to indicate that
				155	* switching is in progress. Use noop one if unspecified.
				156	*/
				157	WARN_ON_ONCE(ref->confirm_switch);
				158	ref->confirm_switch =
				159	confirm_switch ?: percpu_ref_noop_confirm_switch;
				160
				161	percpu_ref_get(ref); /* put after confirmation */
				162	call_rcu_sched(&ref->rcu, percpu_ref_switch_to_atomic_rcu);
				163	} else if (confirm_switch) {
				164	/*
				165	* Somebody already set ATOMIC. Switching may still be in
				166	* progress. @confirm_switch must be invoked after the
				167	* switching is complete and a full sched RCU grace period
				168	* has passed. Wait synchronously for the previous
				169	* switching and schedule @confirm_switch invocation.
				170	*/
				171	wait_event(percpu_ref_switch_waitq, !ref->confirm_switch);
				172	ref->confirm_switch = confirm_switch;
				173
				174	percpu_ref_get(ref); /* put after confirmation */
				175	call_rcu_sched(&ref->rcu, percpu_ref_call_confirm_rcu);
				176	}
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	177	}
				178
				179	/**
Tejun Heo	490c79a	2014-09-24 13:31:49 -0400	[diff] [blame]	180	* percpu_ref_switch_to_atomic - switch a percpu_ref to atomic mode
				181	* @ref: percpu_ref to switch to atomic mode
				182	* @confirm_switch: optional confirmation callback
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	183	*
Tejun Heo	490c79a	2014-09-24 13:31:49 -0400	[diff] [blame]	184	* There's no reason to use this function for the usual reference counting.
				185	* Use percpu_ref_kill[_and_confirm]().
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	186	*
Tejun Heo	490c79a	2014-09-24 13:31:49 -0400	[diff] [blame]	187	* Schedule switching of @ref to atomic mode. All its percpu counts will
				188	* be collected to the main atomic counter. On completion, when all CPUs
				189	* are guaraneed to be in atomic mode, @confirm_switch, which may not
				190	* block, is invoked. This function may be invoked concurrently with all
				191	* the get/put operations and can safely be mixed with kill and reinit
				192	* operations.
				193	*
				194	* This function normally doesn't block and can be called from any context
				195	* but it may block if @confirm_kill is specified and @ref is already in
				196	* the process of switching to atomic mode. In such cases, @confirm_switch
				197	* will be invoked after the switching is complete.
				198	*
				199	* Due to the way percpu_ref is implemented, @confirm_switch will be called
				200	* after at least one full sched RCU grace period has passed but this is an
				201	* implementation detail and must not be depended upon.
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	202	*/
Tejun Heo	490c79a	2014-09-24 13:31:49 -0400	[diff] [blame]	203	void percpu_ref_switch_to_atomic(struct percpu_ref *ref,
				204	percpu_ref_func_t *confirm_switch)
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	205	{
Tejun Heo	490c79a	2014-09-24 13:31:49 -0400	[diff] [blame]	206	__percpu_ref_switch_to_atomic(ref, confirm_switch);
Kent Overstreet	215e262	2013-05-31 15:26:45 -0700	[diff] [blame]	207	}
Tejun Heo	a223737	2014-09-24 13:31:48 -0400	[diff] [blame]	208
Tejun Heo	f47ad45	2014-09-24 13:31:49 -0400	[diff] [blame^]	209	static void __percpu_ref_switch_to_percpu(struct percpu_ref *ref)
Tejun Heo	a223737	2014-09-24 13:31:48 -0400	[diff] [blame]	210	{
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	211	unsigned long __percpu *percpu_count = percpu_count_ptr(ref);
Tejun Heo	a223737	2014-09-24 13:31:48 -0400	[diff] [blame]	212	int cpu;
				213
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	214	BUG_ON(!percpu_count);
Tejun Heo	a223737	2014-09-24 13:31:48 -0400	[diff] [blame]	215
Tejun Heo	f47ad45	2014-09-24 13:31:49 -0400	[diff] [blame^]	216	if (!(ref->percpu_count_ptr & __PERCPU_REF_ATOMIC))
				217	return;
				218
				219	wait_event(percpu_ref_switch_waitq, !ref->confirm_switch);
				220
				221	atomic_long_add(PERCPU_COUNT_BIAS, &ref->count);
Tejun Heo	a223737	2014-09-24 13:31:48 -0400	[diff] [blame]	222
				223	/*
				224	* Restore per-cpu operation. smp_store_release() is paired with
Tejun Heo	9e804d1	2014-09-24 13:31:48 -0400	[diff] [blame]	225	* smp_read_barrier_depends() in __ref_is_percpu() and guarantees
				226	* that the zeroing is visible to all percpu accesses which can see
Tejun Heo	f47ad45	2014-09-24 13:31:49 -0400	[diff] [blame^]	227	* the following __PERCPU_REF_ATOMIC clearing.
Tejun Heo	a223737	2014-09-24 13:31:48 -0400	[diff] [blame]	228	*/
				229	for_each_possible_cpu(cpu)
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	230	*per_cpu_ptr(percpu_count, cpu) = 0;
Tejun Heo	a223737	2014-09-24 13:31:48 -0400	[diff] [blame]	231
Tejun Heo	eecc16b	2014-09-24 13:31:48 -0400	[diff] [blame]	232	smp_store_release(&ref->percpu_count_ptr,
Tejun Heo	f47ad45	2014-09-24 13:31:49 -0400	[diff] [blame^]	233	ref->percpu_count_ptr & ~__PERCPU_REF_ATOMIC);
Tejun Heo	a223737	2014-09-24 13:31:48 -0400	[diff] [blame]	234	}
Tejun Heo	f47ad45	2014-09-24 13:31:49 -0400	[diff] [blame^]	235
				236	/**
				237	* percpu_ref_switch_to_percpu - switch a percpu_ref to percpu mode
				238	* @ref: percpu_ref to switch to percpu mode
				239	*
				240	* There's no reason to use this function for the usual reference counting.
				241	* To re-use an expired ref, use percpu_ref_reinit().
				242	*
				243	* Switch @ref to percpu mode. This function may be invoked concurrently
				244	* with all the get/put operations and can safely be mixed with kill and
				245	* reinit operations.
				246	*
				247	* This function normally doesn't block and can be called from any context
				248	* but it may block if @ref is in the process of switching to atomic mode
				249	* by percpu_ref_switch_atomic().
				250	*/
				251	void percpu_ref_switch_to_percpu(struct percpu_ref *ref)
				252	{
				253	/* a dying or dead ref can't be switched to percpu mode w/o reinit */
				254	if (!(ref->percpu_count_ptr & __PERCPU_REF_DEAD))
				255	__percpu_ref_switch_to_percpu(ref);
				256	}
Tejun Heo	490c79a	2014-09-24 13:31:49 -0400	[diff] [blame]	257
				258	/**
				259	* percpu_ref_kill_and_confirm - drop the initial ref and schedule confirmation
				260	* @ref: percpu_ref to kill
				261	* @confirm_kill: optional confirmation callback
				262	*
				263	* Equivalent to percpu_ref_kill() but also schedules kill confirmation if
				264	* @confirm_kill is not NULL. @confirm_kill, which may not block, will be
				265	* called after @ref is seen as dead from all CPUs at which point all
				266	* further invocations of percpu_ref_tryget_live() will fail. See
				267	* percpu_ref_tryget_live() for details.
				268	*
				269	* This function normally doesn't block and can be called from any context
Tejun Heo	f47ad45	2014-09-24 13:31:49 -0400	[diff] [blame^]	270	* but it may block if @confirm_kill is specified and @ref is in the
				271	* process of switching to atomic mode by percpu_ref_switch_atomic().
Tejun Heo	490c79a	2014-09-24 13:31:49 -0400	[diff] [blame]	272	*
				273	* Due to the way percpu_ref is implemented, @confirm_switch will be called
				274	* after at least one full sched RCU grace period has passed but this is an
				275	* implementation detail and must not be depended upon.
				276	*/
				277	void percpu_ref_kill_and_confirm(struct percpu_ref *ref,
				278	percpu_ref_func_t *confirm_kill)
				279	{
				280	WARN_ONCE(ref->percpu_count_ptr & __PERCPU_REF_DEAD,
				281	"%s called more than once on %pf!", __func__, ref->release);
				282
				283	ref->percpu_count_ptr \|= __PERCPU_REF_DEAD;
				284	__percpu_ref_switch_to_atomic(ref, confirm_kill);
				285	percpu_ref_put(ref);
				286	}
				287	EXPORT_SYMBOL_GPL(percpu_ref_kill_and_confirm);
Tejun Heo	f47ad45	2014-09-24 13:31:49 -0400	[diff] [blame^]	288
				289	/**
				290	* percpu_ref_reinit - re-initialize a percpu refcount
				291	* @ref: perpcu_ref to re-initialize
				292	*
				293	* Re-initialize @ref so that it's in the same state as when it finished
				294	* percpu_ref_init(). @ref must have been initialized successfully and
				295	* reached 0 but not exited.
				296	*
				297	* Note that percpu_ref_tryget[_live]() are safe to perform on @ref while
				298	* this function is in progress.
				299	*/
				300	void percpu_ref_reinit(struct percpu_ref *ref)
				301	{
				302	WARN_ON_ONCE(!percpu_ref_is_zero(ref));
				303
				304	ref->percpu_count_ptr &= ~__PERCPU_REF_DEAD;
				305	percpu_ref_get(ref);
				306	__percpu_ref_switch_to_percpu(ref);
				307	}
				308	EXPORT_SYMBOL_GPL(percpu_ref_reinit);