kernel/bpf/cgroup.c - kernel/msm-4.9 - Gitiles

 /*
  * Functions to manage eBPF programs attached to cgroups
  *
  * Copyright (c) 2016 Daniel Mack
  *
  * This file is subject to the terms and conditions of version 2 of the GNU
  * General Public License.  See the file COPYING in the main directory of the
  * Linux distribution for more details.
  */

 #include <linux/kernel.h>
 #include <linux/atomic.h>
 #include <linux/cgroup.h>
 #include <linux/slab.h>
 #include <linux/bpf.h>
 #include <linux/bpf-cgroup.h>
 #include <net/sock.h>

 DEFINE_STATIC_KEY_FALSE(cgroup_bpf_enabled_key);
 EXPORT_SYMBOL(cgroup_bpf_enabled_key);

 /**
  * cgroup_bpf_put() - put references of all bpf programs
  * @cgrp: the cgroup to modify
  */
 void cgroup_bpf_put(struct cgroup *cgrp)
 {
 	unsigned int type;

 	for (type = 0; type < ARRAY_SIZE(cgrp->bpf.prog); type++) {
 		struct bpf_prog *prog = cgrp->bpf.prog[type];

 		if (prog) {
 			bpf_prog_put(prog);
 			static_branch_dec(&cgroup_bpf_enabled_key);
 		}
 	}
 }

 /**
  * cgroup_bpf_inherit() - inherit effective programs from parent
  * @cgrp: the cgroup to modify
  * @parent: the parent to inherit from
  */
 void cgroup_bpf_inherit(struct cgroup *cgrp, struct cgroup *parent)
 {
 	unsigned int type;

 	for (type = 0; type < ARRAY_SIZE(cgrp->bpf.effective); type++) {
 		struct bpf_prog *e;

 		e = rcu_dereference_protected(parent->bpf.effective[type],
 					      lockdep_is_held(&cgroup_mutex));
 		rcu_assign_pointer(cgrp->bpf.effective[type], e);
 		cgrp->bpf.disallow_override[type] = parent->bpf.disallow_override[type];
 	}
 }

 /**
  * __cgroup_bpf_update() - Update the pinned program of a cgroup, and
  *                         propagate the change to descendants
  * @cgrp: The cgroup which descendants to traverse
  * @parent: The parent of @cgrp, or %NULL if @cgrp is the root
  * @prog: A new program to pin
  * @type: Type of pinning operation (ingress/egress)
  *
  * Each cgroup has a set of two pointers for bpf programs; one for eBPF
  * programs it owns, and which is effective for execution.
  *
  * If @prog is not %NULL, this function attaches a new program to the cgroup
  * and releases the one that is currently attached, if any. @prog is then made
  * the effective program of type @type in that cgroup.
  *
  * If @prog is %NULL, the currently attached program of type @type is released,
  * and the effective program of the parent cgroup (if any) is inherited to
  * @cgrp.
  *
  * Then, the descendants of @cgrp are walked and the effective program for
  * each of them is set to the effective program of @cgrp unless the
  * descendant has its own program attached, in which case the subbranch is
  * skipped. This ensures that delegated subcgroups with own programs are left
  * untouched.
  *
  * Must be called with cgroup_mutex held.
  */
 int __cgroup_bpf_update(struct cgroup *cgrp, struct cgroup *parent,
 			struct bpf_prog *prog, enum bpf_attach_type type,
 			bool new_overridable)
 {
 	struct bpf_prog *old_prog, *effective = NULL;
 	struct cgroup_subsys_state *pos;
 	bool overridable = true;

 	if (parent) {
 		overridable = !parent->bpf.disallow_override[type];
 		effective = rcu_dereference_protected(parent->bpf.effective[type],
 						      lockdep_is_held(&cgroup_mutex));
 	}

 	if (prog && effective && !overridable)
 		/* if parent has non-overridable prog attached, disallow
 		 * attaching new programs to descendent cgroup
 		 */
 		return -EPERM;

 	if (prog && effective && overridable != new_overridable)
 		/* if parent has overridable prog attached, only
 		 * allow overridable programs in descendent cgroup
 		 */
 		return -EPERM;

 	old_prog = cgrp->bpf.prog[type];

 	if (prog) {
 		overridable = new_overridable;
 		effective = prog;
 		if (old_prog &&
 		    cgrp->bpf.disallow_override[type] == new_overridable)
 			/* disallow attaching non-overridable on top
 			 * of existing overridable in this cgroup
 			 * and vice versa
 			 */
 			return -EPERM;
 	}

 	if (!prog && !old_prog)
 		/* report error when trying to detach and nothing is attached */
 		return -ENOENT;

 	cgrp->bpf.prog[type] = prog;

 	css_for_each_descendant_pre(pos, &cgrp->self) {
 		struct cgroup *desc = container_of(pos, struct cgroup, self);

 		/* skip the subtree if the descendant has its own program */
 		if (desc->bpf.prog[type] && desc != cgrp) {
 			pos = css_rightmost_descendant(pos);
 		} else {
 			rcu_assign_pointer(desc->bpf.effective[type],
 					   effective);
 			desc->bpf.disallow_override[type] = !overridable;
 		}
 	}

 	if (prog)
 		static_branch_inc(&cgroup_bpf_enabled_key);

 	if (old_prog) {
 		bpf_prog_put(old_prog);
 		static_branch_dec(&cgroup_bpf_enabled_key);
 	}
 	return 0;
 }

 /**
  * __cgroup_bpf_run_filter() - Run a program for packet filtering
  * @sk: The socket sending or receiving traffic
  * @skb: The skb that is being sent or received
  * @type: The type of program to be exectuted
  *
  * If no socket is passed, or the socket is not of type INET or INET6,
  * this function does nothing and returns 0.
  *
  * The program type passed in via @type must be suitable for network
  * filtering. No further check is performed to assert that.
  *
  * This function will return %-EPERM if any if an attached program was found
  * and if it returned != 1 during execution. In all other cases, 0 is returned.
  */
 int __cgroup_bpf_run_filter(struct sock *sk,
 			    struct sk_buff *skb,
 			    enum bpf_attach_type type)
 {
 	struct bpf_prog *prog;
 	struct cgroup *cgrp;
 	int ret = 0;

 	if (!sk || !sk_fullsock(sk))
 		return 0;

 	if (sk->sk_family != AF_INET &&
 	    sk->sk_family != AF_INET6)
 		return 0;

 	cgrp = sock_cgroup_ptr(&sk->sk_cgrp_data);

 	rcu_read_lock();

 	prog = rcu_dereference(cgrp->bpf.effective[type]);
 	if (prog) {
 		unsigned int offset = skb->data - skb_network_header(skb);
 		struct sock *save_sk = skb->sk;

 		skb->sk = sk;
 		__skb_push(skb, offset);
 		ret = bpf_prog_run_save_cb(prog, skb) == 1 ? 0 : -EPERM;
 		__skb_pull(skb, offset);
 		skb->sk = save_sk;
 	}

 	rcu_read_unlock();

 	return ret;
 }
 EXPORT_SYMBOL(__cgroup_bpf_run_filter);
	/*
	* Functions to manage eBPF programs attached to cgroups
	*
	* Copyright (c) 2016 Daniel Mack
	*
	* This file is subject to the terms and conditions of version 2 of the GNU
	* General Public License. See the file COPYING in the main directory of the
	* Linux distribution for more details.
	*/

	#include <linux/kernel.h>
	#include <linux/atomic.h>
	#include <linux/cgroup.h>
	#include <linux/slab.h>
	#include <linux/bpf.h>
	#include <linux/bpf-cgroup.h>
	#include <net/sock.h>

	DEFINE_STATIC_KEY_FALSE(cgroup_bpf_enabled_key);
	EXPORT_SYMBOL(cgroup_bpf_enabled_key);

	/**
	* cgroup_bpf_put() - put references of all bpf programs
	* @cgrp: the cgroup to modify
	*/
	void cgroup_bpf_put(struct cgroup *cgrp)
	{
	unsigned int type;

	for (type = 0; type < ARRAY_SIZE(cgrp->bpf.prog); type++) {
	struct bpf_prog *prog = cgrp->bpf.prog[type];

	if (prog) {
	bpf_prog_put(prog);
	static_branch_dec(&cgroup_bpf_enabled_key);
	}
	}
	}

	/**
	* cgroup_bpf_inherit() - inherit effective programs from parent
	* @cgrp: the cgroup to modify
	* @parent: the parent to inherit from
	*/
	void cgroup_bpf_inherit(struct cgroup cgrp, struct cgroup parent)
	{
	unsigned int type;

	for (type = 0; type < ARRAY_SIZE(cgrp->bpf.effective); type++) {
	struct bpf_prog *e;

	e = rcu_dereference_protected(parent->bpf.effective[type],
	lockdep_is_held(&cgroup_mutex));
	rcu_assign_pointer(cgrp->bpf.effective[type], e);
	cgrp->bpf.disallow_override[type] = parent->bpf.disallow_override[type];
	}
	}

	/**
	* __cgroup_bpf_update() - Update the pinned program of a cgroup, and
	* propagate the change to descendants
	* @cgrp: The cgroup which descendants to traverse
	* @parent: The parent of @cgrp, or %NULL if @cgrp is the root
	* @prog: A new program to pin
	* @type: Type of pinning operation (ingress/egress)
	*
	* Each cgroup has a set of two pointers for bpf programs; one for eBPF
	* programs it owns, and which is effective for execution.
	*
	* If @prog is not %NULL, this function attaches a new program to the cgroup
	* and releases the one that is currently attached, if any. @prog is then made
	* the effective program of type @type in that cgroup.
	*
	* If @prog is %NULL, the currently attached program of type @type is released,
	* and the effective program of the parent cgroup (if any) is inherited to
	* @cgrp.
	*
	* Then, the descendants of @cgrp are walked and the effective program for
	* each of them is set to the effective program of @cgrp unless the
	* descendant has its own program attached, in which case the subbranch is
	* skipped. This ensures that delegated subcgroups with own programs are left
	* untouched.
	*
	* Must be called with cgroup_mutex held.
	*/
	int __cgroup_bpf_update(struct cgroup cgrp, struct cgroup parent,
	struct bpf_prog *prog, enum bpf_attach_type type,
	bool new_overridable)
	{
	struct bpf_prog old_prog, effective = NULL;
	struct cgroup_subsys_state *pos;
	bool overridable = true;

	if (parent) {
	overridable = !parent->bpf.disallow_override[type];
	effective = rcu_dereference_protected(parent->bpf.effective[type],
	lockdep_is_held(&cgroup_mutex));
	}

	if (prog && effective && !overridable)
	/* if parent has non-overridable prog attached, disallow
	* attaching new programs to descendent cgroup
	*/
	return -EPERM;

	if (prog && effective && overridable != new_overridable)
	/* if parent has overridable prog attached, only
	* allow overridable programs in descendent cgroup
	*/
	return -EPERM;

	old_prog = cgrp->bpf.prog[type];

	if (prog) {
	overridable = new_overridable;
	effective = prog;
	if (old_prog &&
	cgrp->bpf.disallow_override[type] == new_overridable)
	/* disallow attaching non-overridable on top
	* of existing overridable in this cgroup
	* and vice versa
	*/
	return -EPERM;
	}

	if (!prog && !old_prog)
	/* report error when trying to detach and nothing is attached */
	return -ENOENT;

	cgrp->bpf.prog[type] = prog;

	css_for_each_descendant_pre(pos, &cgrp->self) {
	struct cgroup *desc = container_of(pos, struct cgroup, self);

	/* skip the subtree if the descendant has its own program */
	if (desc->bpf.prog[type] && desc != cgrp) {
	pos = css_rightmost_descendant(pos);
	} else {
	rcu_assign_pointer(desc->bpf.effective[type],
	effective);
	desc->bpf.disallow_override[type] = !overridable;
	}
	}

	if (prog)
	static_branch_inc(&cgroup_bpf_enabled_key);

	if (old_prog) {
	bpf_prog_put(old_prog);
	static_branch_dec(&cgroup_bpf_enabled_key);
	}
	return 0;
	}

	/**
	* __cgroup_bpf_run_filter() - Run a program for packet filtering
	* @sk: The socket sending or receiving traffic
	* @skb: The skb that is being sent or received
	* @type: The type of program to be exectuted
	*
	* If no socket is passed, or the socket is not of type INET or INET6,
	* this function does nothing and returns 0.
	*
	* The program type passed in via @type must be suitable for network
	* filtering. No further check is performed to assert that.
	*
	* This function will return %-EPERM if any if an attached program was found
	* and if it returned != 1 during execution. In all other cases, 0 is returned.
	*/
	int __cgroup_bpf_run_filter(struct sock *sk,
	struct sk_buff *skb,
	enum bpf_attach_type type)
	{
	struct bpf_prog *prog;
	struct cgroup *cgrp;
	int ret = 0;

	if (!sk \|\| !sk_fullsock(sk))
	return 0;

	if (sk->sk_family != AF_INET &&
	sk->sk_family != AF_INET6)
	return 0;

	cgrp = sock_cgroup_ptr(&sk->sk_cgrp_data);

	rcu_read_lock();

	prog = rcu_dereference(cgrp->bpf.effective[type]);
	if (prog) {
	unsigned int offset = skb->data - skb_network_header(skb);
	struct sock *save_sk = skb->sk;

	skb->sk = sk;
	__skb_push(skb, offset);
	ret = bpf_prog_run_save_cb(prog, skb) == 1 ? 0 : -EPERM;
	__skb_pull(skb, offset);
	skb->sk = save_sk;
	}

	rcu_read_unlock();

	return ret;
	}
	EXPORT_SYMBOL(__cgroup_bpf_run_filter);