Blame - kernel/bpf/cgroup.c - kernel/msm-4.9

blob: a44a7e4c23d20469381afde1062e8e6a415a939a [file] [log] [blame]

Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	1	/*
				2	* Functions to manage eBPF programs attached to cgroups
				3	*
				4	* Copyright (c) 2016 Daniel Mack
				5	*
				6	* This file is subject to the terms and conditions of version 2 of the GNU
				7	* General Public License. See the file COPYING in the main directory of the
				8	* Linux distribution for more details.
				9	*/
				10
				11	#include <linux/kernel.h>
				12	#include <linux/atomic.h>
				13	#include <linux/cgroup.h>
				14	#include <linux/slab.h>
				15	#include <linux/bpf.h>
				16	#include <linux/bpf-cgroup.h>
				17	#include <net/sock.h>
				18
				19	DEFINE_STATIC_KEY_FALSE(cgroup_bpf_enabled_key);
				20	EXPORT_SYMBOL(cgroup_bpf_enabled_key);
				21
				22	/**
				23	* cgroup_bpf_put() - put references of all bpf programs
				24	* @cgrp: the cgroup to modify
				25	*/
				26	void cgroup_bpf_put(struct cgroup *cgrp)
				27	{
				28	unsigned int type;
				29
				30	for (type = 0; type < ARRAY_SIZE(cgrp->bpf.prog); type++) {
				31	struct bpf_prog *prog = cgrp->bpf.prog[type];
				32
				33	if (prog) {
				34	bpf_prog_put(prog);
				35	static_branch_dec(&cgroup_bpf_enabled_key);
				36	}
				37	}
				38	}
				39
				40	/**
				41	* cgroup_bpf_inherit() - inherit effective programs from parent
				42	* @cgrp: the cgroup to modify
				43	* @parent: the parent to inherit from
				44	*/
				45	void cgroup_bpf_inherit(struct cgroup cgrp, struct cgroup parent)
				46	{
				47	unsigned int type;
				48
				49	for (type = 0; type < ARRAY_SIZE(cgrp->bpf.effective); type++) {
				50	struct bpf_prog *e;
				51
				52	e = rcu_dereference_protected(parent->bpf.effective[type],
				53	lockdep_is_held(&cgroup_mutex));
				54	rcu_assign_pointer(cgrp->bpf.effective[type], e);
Alexei Starovoitov	1ee2b4b	2017-02-10 20:28:24 -0800	[diff] [blame]	55	cgrp->bpf.disallow_override[type] = parent->bpf.disallow_override[type];
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	56	}
				57	}
				58
				59	/**
				60	* __cgroup_bpf_update() - Update the pinned program of a cgroup, and
				61	* propagate the change to descendants
				62	* @cgrp: The cgroup which descendants to traverse
				63	* @parent: The parent of @cgrp, or %NULL if @cgrp is the root
				64	* @prog: A new program to pin
				65	* @type: Type of pinning operation (ingress/egress)
				66	*
				67	* Each cgroup has a set of two pointers for bpf programs; one for eBPF
				68	* programs it owns, and which is effective for execution.
				69	*
Daniel Mack	a5d371c	2016-11-28 14:11:04 +0100	[diff] [blame]	70	* If @prog is not %NULL, this function attaches a new program to the cgroup
				71	* and releases the one that is currently attached, if any. @prog is then made
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	72	* the effective program of type @type in that cgroup.
				73	*
				74	* If @prog is %NULL, the currently attached program of type @type is released,
				75	* and the effective program of the parent cgroup (if any) is inherited to
				76	* @cgrp.
				77	*
				78	* Then, the descendants of @cgrp are walked and the effective program for
				79	* each of them is set to the effective program of @cgrp unless the
				80	* descendant has its own program attached, in which case the subbranch is
				81	* skipped. This ensures that delegated subcgroups with own programs are left
				82	* untouched.
				83	*
				84	* Must be called with cgroup_mutex held.
				85	*/
Alexei Starovoitov	1ee2b4b	2017-02-10 20:28:24 -0800	[diff] [blame]	86	int __cgroup_bpf_update(struct cgroup cgrp, struct cgroup parent,
				87	struct bpf_prog *prog, enum bpf_attach_type type,
				88	bool new_overridable)
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	89	{
Alexei Starovoitov	1ee2b4b	2017-02-10 20:28:24 -0800	[diff] [blame]	90	struct bpf_prog old_prog, effective = NULL;
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	91	struct cgroup_subsys_state *pos;
Alexei Starovoitov	1ee2b4b	2017-02-10 20:28:24 -0800	[diff] [blame]	92	bool overridable = true;
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	93
Alexei Starovoitov	1ee2b4b	2017-02-10 20:28:24 -0800	[diff] [blame]	94	if (parent) {
				95	overridable = !parent->bpf.disallow_override[type];
				96	effective = rcu_dereference_protected(parent->bpf.effective[type],
				97	lockdep_is_held(&cgroup_mutex));
				98	}
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	99
Alexei Starovoitov	1ee2b4b	2017-02-10 20:28:24 -0800	[diff] [blame]	100	if (prog && effective && !overridable)
				101	/* if parent has non-overridable prog attached, disallow
				102	* attaching new programs to descendent cgroup
				103	*/
				104	return -EPERM;
				105
				106	if (prog && effective && overridable != new_overridable)
				107	/* if parent has overridable prog attached, only
				108	* allow overridable programs in descendent cgroup
				109	*/
				110	return -EPERM;
				111
				112	old_prog = cgrp->bpf.prog[type];
				113
				114	if (prog) {
				115	overridable = new_overridable;
				116	effective = prog;
				117	if (old_prog &&
				118	cgrp->bpf.disallow_override[type] == new_overridable)
				119	/* disallow attaching non-overridable on top
				120	* of existing overridable in this cgroup
				121	* and vice versa
				122	*/
				123	return -EPERM;
				124	}
				125
				126	if (!prog && !old_prog)
				127	/* report error when trying to detach and nothing is attached */
				128	return -ENOENT;
				129
				130	cgrp->bpf.prog[type] = prog;
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	131
				132	css_for_each_descendant_pre(pos, &cgrp->self) {
				133	struct cgroup *desc = container_of(pos, struct cgroup, self);
				134
				135	/* skip the subtree if the descendant has its own program */
Alexei Starovoitov	1ee2b4b	2017-02-10 20:28:24 -0800	[diff] [blame]	136	if (desc->bpf.prog[type] && desc != cgrp) {
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	137	pos = css_rightmost_descendant(pos);
Alexei Starovoitov	1ee2b4b	2017-02-10 20:28:24 -0800	[diff] [blame]	138	} else {
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	139	rcu_assign_pointer(desc->bpf.effective[type],
				140	effective);
Alexei Starovoitov	1ee2b4b	2017-02-10 20:28:24 -0800	[diff] [blame]	141	desc->bpf.disallow_override[type] = !overridable;
				142	}
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	143	}
				144
				145	if (prog)
				146	static_branch_inc(&cgroup_bpf_enabled_key);
				147
				148	if (old_prog) {
				149	bpf_prog_put(old_prog);
				150	static_branch_dec(&cgroup_bpf_enabled_key);
				151	}
Alexei Starovoitov	1ee2b4b	2017-02-10 20:28:24 -0800	[diff] [blame]	152	return 0;
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	153	}
				154
				155	/**
				156	* __cgroup_bpf_run_filter() - Run a program for packet filtering
Willem de Bruijn	2c1289c	2017-04-11 14:08:08 -0400	[diff] [blame]	157	* @sk: The socket sending or receiving traffic
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	158	* @skb: The skb that is being sent or received
				159	* @type: The type of program to be exectuted
				160	*
				161	* If no socket is passed, or the socket is not of type INET or INET6,
				162	* this function does nothing and returns 0.
				163	*
				164	* The program type passed in via @type must be suitable for network
				165	* filtering. No further check is performed to assert that.
				166	*
				167	* This function will return %-EPERM if any if an attached program was found
				168	* and if it returned != 1 during execution. In all other cases, 0 is returned.
				169	*/
				170	int __cgroup_bpf_run_filter(struct sock *sk,
				171	struct sk_buff *skb,
				172	enum bpf_attach_type type)
				173	{
				174	struct bpf_prog *prog;
				175	struct cgroup *cgrp;
				176	int ret = 0;
				177
				178	if (!sk \|\| !sk_fullsock(sk))
				179	return 0;
				180
				181	if (sk->sk_family != AF_INET &&
				182	sk->sk_family != AF_INET6)
				183	return 0;
				184
				185	cgrp = sock_cgroup_ptr(&sk->sk_cgrp_data);
				186
				187	rcu_read_lock();
				188
				189	prog = rcu_dereference(cgrp->bpf.effective[type]);
				190	if (prog) {
				191	unsigned int offset = skb->data - skb_network_header(skb);
Willem de Bruijn	2c1289c	2017-04-11 14:08:08 -0400	[diff] [blame]	192	struct sock *save_sk = skb->sk;
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	193
Willem de Bruijn	2c1289c	2017-04-11 14:08:08 -0400	[diff] [blame]	194	skb->sk = sk;
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	195	__skb_push(skb, offset);
				196	ret = bpf_prog_run_save_cb(prog, skb) == 1 ? 0 : -EPERM;
				197	__skb_pull(skb, offset);
Willem de Bruijn	2c1289c	2017-04-11 14:08:08 -0400	[diff] [blame]	198	skb->sk = save_sk;
Daniel Mack	f791c42	2016-11-23 16:52:26 +0100	[diff] [blame]	199	}
				200
				201	rcu_read_unlock();
				202
				203	return ret;
				204	}
				205	EXPORT_SYMBOL(__cgroup_bpf_run_filter);