blob: 8f3948dd38b85f70e654e317280db09e66c23f5c [file] [log] [blame]
/*
 * net/sched/act_mirred.c	packet mirroring and redirect actions
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 *
 * Authors:	Jamal Hadi Salim (2002-4)
 *
 * TODO: Add ingress support (and socket redirect support)
 *
 */
14
Linus Torvalds1da177e2005-04-16 15:20:36 -070015#include <linux/types.h>
16#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/string.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/errno.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070019#include <linux/skbuff.h>
20#include <linux/rtnetlink.h>
21#include <linux/module.h>
22#include <linux/init.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090023#include <linux/gfp.h>
Eric W. Biederman881d9662007-09-17 11:56:21 -070024#include <net/net_namespace.h>
Arnaldo Carvalho de Melodc5fc572007-03-25 23:06:12 -070025#include <net/netlink.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070026#include <net/pkt_sched.h>
27#include <linux/tc_act/tc_mirred.h>
28#include <net/tc_act/tc_mirred.h>
29
Linus Torvalds1da177e2005-04-16 15:20:36 -070030#include <linux/if_arp.h>
31
/* Mask handed to tc_action_net_init() when a namespace is set up. */
#define MIRRED_TAB_MASK 7
/*
 * Every mirred action created by tcf_mirred_init() is linked here through
 * its tcfm_list member, so that mirred_device_event() can find the actions
 * pointing at a device that is being unregistered.
 */
static LIST_HEAD(mirred_list);
/* Guards mirred_list; every user in this file takes it with spin_lock_bh(). */
static DEFINE_SPINLOCK(mirred_list_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -070035
WANG Conga5b5c952014-02-11 17:07:32 -080036static void tcf_mirred_release(struct tc_action *a, int bind)
Linus Torvalds1da177e2005-04-16 15:20:36 -070037{
WANG Cong86062032014-02-11 17:07:31 -080038 struct tcf_mirred *m = to_mirred(a);
Eric Dumazet2ee22a92015-07-06 05:18:09 -070039 struct net_device *dev = rcu_dereference_protected(m->tcfm_dev, 1);
40
WANG Cong6bd00b82015-10-01 11:37:42 -070041 /* We could be called either in a RCU callback or with RTNL lock held. */
42 spin_lock_bh(&mirred_list_lock);
WANG Conga5b5c952014-02-11 17:07:32 -080043 list_del(&m->tcfm_list);
WANG Cong6bd00b82015-10-01 11:37:42 -070044 spin_unlock_bh(&mirred_list_lock);
Eric Dumazet2ee22a92015-07-06 05:18:09 -070045 if (dev)
46 dev_put(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -070047}
48
/*
 * Attribute policy given to nla_parse_nested() in tcf_mirred_init():
 * TCA_MIRRED_PARMS is declared with the length of a struct tc_mirred.
 */
static const struct nla_policy mirred_policy[TCA_MIRRED_MAX + 1] = {
	[TCA_MIRRED_PARMS] = { .len = sizeof(struct tc_mirred) },
};
52
/*
 * Id passed to net_generic() to reach this action's struct tc_action_net;
 * its address is published through mirred_net_ops.id.
 */
static int mirred_net_id;
54
Benjamin LaHaisec1b52732013-01-14 05:15:39 +000055static int tcf_mirred_init(struct net *net, struct nlattr *nla,
56 struct nlattr *est, struct tc_action *a, int ovr,
57 int bind)
Linus Torvalds1da177e2005-04-16 15:20:36 -070058{
WANG Congddf97cc2016-02-22 15:57:53 -080059 struct tc_action_net *tn = net_generic(net, mirred_net_id);
Patrick McHardy7ba699c2008-01-22 22:11:50 -080060 struct nlattr *tb[TCA_MIRRED_MAX + 1];
Linus Torvalds1da177e2005-04-16 15:20:36 -070061 struct tc_mirred *parm;
David S. Millere9ce1cd2006-08-21 23:54:55 -070062 struct tcf_mirred *m;
Changli Gaob76965e2009-11-17 04:15:16 -080063 struct net_device *dev;
Jamal Hadi Salim87dfbdc2016-05-10 16:49:28 -040064 int ret, ok_push = 0, exists = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070065
Patrick McHardycee63722008-01-23 20:33:32 -080066 if (nla == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -070067 return -EINVAL;
Changli Gaob76965e2009-11-17 04:15:16 -080068 ret = nla_parse_nested(tb, TCA_MIRRED_MAX, nla, mirred_policy);
69 if (ret < 0)
70 return ret;
Patrick McHardy53b2bf32008-01-23 20:36:30 -080071 if (tb[TCA_MIRRED_PARMS] == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -070072 return -EINVAL;
Patrick McHardy7ba699c2008-01-22 22:11:50 -080073 parm = nla_data(tb[TCA_MIRRED_PARMS]);
Jamal Hadi Salim87dfbdc2016-05-10 16:49:28 -040074
75 exists = tcf_hash_check(tn, parm->index, a, bind);
76 if (exists && bind)
77 return 0;
78
Changli Gaob76965e2009-11-17 04:15:16 -080079 switch (parm->eaction) {
80 case TCA_EGRESS_MIRROR:
81 case TCA_EGRESS_REDIR:
82 break;
83 default:
Jamal Hadi Salim87dfbdc2016-05-10 16:49:28 -040084 if (exists)
85 tcf_hash_release(a, bind);
Changli Gaob76965e2009-11-17 04:15:16 -080086 return -EINVAL;
87 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070088 if (parm->ifindex) {
Benjamin LaHaisec1b52732013-01-14 05:15:39 +000089 dev = __dev_get_by_index(net, parm->ifindex);
Jamal Hadi Salim87dfbdc2016-05-10 16:49:28 -040090 if (dev == NULL) {
91 if (exists)
92 tcf_hash_release(a, bind);
Linus Torvalds1da177e2005-04-16 15:20:36 -070093 return -ENODEV;
Jamal Hadi Salim87dfbdc2016-05-10 16:49:28 -040094 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070095 switch (dev->type) {
Changli Gaob76965e2009-11-17 04:15:16 -080096 case ARPHRD_TUNNEL:
97 case ARPHRD_TUNNEL6:
98 case ARPHRD_SIT:
99 case ARPHRD_IPGRE:
100 case ARPHRD_VOID:
101 case ARPHRD_NONE:
102 ok_push = 0;
103 break;
104 default:
105 ok_push = 1;
106 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700107 }
Changli Gaob76965e2009-11-17 04:15:16 -0800108 } else {
109 dev = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700110 }
111
Jamal Hadi Salim87dfbdc2016-05-10 16:49:28 -0400112 if (!exists) {
Changli Gaob76965e2009-11-17 04:15:16 -0800113 if (dev == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114 return -EINVAL;
WANG Congddf97cc2016-02-22 15:57:53 -0800115 ret = tcf_hash_create(tn, parm->index, est, a,
116 sizeof(*m), bind, true);
WANG Cong86062032014-02-11 17:07:31 -0800117 if (ret)
118 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119 ret = ACT_P_CREATED;
120 } else {
WANG Cong215c90a2015-10-01 11:37:43 -0700121 tcf_hash_release(a, bind);
122 if (!ovr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700123 return -EEXIST;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700124 }
WANG Cong86062032014-02-11 17:07:31 -0800125 m = to_mirred(a);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700126
Eric Dumazet2ee22a92015-07-06 05:18:09 -0700127 ASSERT_RTNL();
David S. Millere9ce1cd2006-08-21 23:54:55 -0700128 m->tcf_action = parm->action;
129 m->tcfm_eaction = parm->eaction;
Changli Gaob76965e2009-11-17 04:15:16 -0800130 if (dev != NULL) {
David S. Millere9ce1cd2006-08-21 23:54:55 -0700131 m->tcfm_ifindex = parm->ifindex;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700132 if (ret != ACT_P_CREATED)
Eric Dumazet2ee22a92015-07-06 05:18:09 -0700133 dev_put(rcu_dereference_protected(m->tcfm_dev, 1));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700134 dev_hold(dev);
Eric Dumazet2ee22a92015-07-06 05:18:09 -0700135 rcu_assign_pointer(m->tcfm_dev, dev);
David S. Millere9ce1cd2006-08-21 23:54:55 -0700136 m->tcfm_ok_push = ok_push;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700137 }
Eric Dumazet2ee22a92015-07-06 05:18:09 -0700138
stephen hemminger3b879562010-07-22 18:45:04 +0000139 if (ret == ACT_P_CREATED) {
WANG Cong6bd00b82015-10-01 11:37:42 -0700140 spin_lock_bh(&mirred_list_lock);
stephen hemminger3b879562010-07-22 18:45:04 +0000141 list_add(&m->tcfm_list, &mirred_list);
WANG Cong6bd00b82015-10-01 11:37:42 -0700142 spin_unlock_bh(&mirred_list_lock);
WANG Congddf97cc2016-02-22 15:57:53 -0800143 tcf_hash_insert(tn, a);
stephen hemminger3b879562010-07-22 18:45:04 +0000144 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700145
Linus Torvalds1da177e2005-04-16 15:20:36 -0700146 return ret;
147}
148
Eric Dumazetdc7f9f62011-07-05 23:25:42 +0000149static int tcf_mirred(struct sk_buff *skb, const struct tc_action *a,
David S. Millere9ce1cd2006-08-21 23:54:55 -0700150 struct tcf_result *res)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700151{
David S. Millere9ce1cd2006-08-21 23:54:55 -0700152 struct tcf_mirred *m = a->priv;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153 struct net_device *dev;
Changli Gaofeed1f12009-11-17 04:14:00 -0800154 struct sk_buff *skb2;
Eric Dumazet2ee22a92015-07-06 05:18:09 -0700155 int retval, err;
Changli Gaofeed1f12009-11-17 04:14:00 -0800156 u32 at;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700157
Eric Dumazet2ee22a92015-07-06 05:18:09 -0700158 tcf_lastuse_update(&m->tcf_tm);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700159
Eric Dumazet2ee22a92015-07-06 05:18:09 -0700160 bstats_cpu_update(this_cpu_ptr(m->common.cpu_bstats), skb);
161
162 rcu_read_lock();
163 retval = READ_ONCE(m->tcf_action);
164 dev = rcu_dereference(m->tcfm_dev);
165 if (unlikely(!dev)) {
166 pr_notice_once("tc mirred: target device is gone\n");
stephen hemminger3b879562010-07-22 18:45:04 +0000167 goto out;
168 }
169
Eric Dumazet2ee22a92015-07-06 05:18:09 -0700170 if (unlikely(!(dev->flags & IFF_UP))) {
Joe Perchese87cc472012-05-13 21:56:26 +0000171 net_notice_ratelimited("tc mirred to Houston: device %s is down\n",
172 dev->name);
Changli Gaofeed1f12009-11-17 04:14:00 -0800173 goto out;
174 }
175
Changli Gao210d6de2010-06-24 16:25:12 +0000176 at = G_TC_AT(skb->tc_verd);
Florian Westphale578d9c2015-05-11 19:50:41 +0200177 skb2 = skb_clone(skb, GFP_ATOMIC);
Eric Dumazet2ee22a92015-07-06 05:18:09 -0700178 if (!skb2)
Changli Gaofeed1f12009-11-17 04:14:00 -0800179 goto out;
180
Changli Gaofeed1f12009-11-17 04:14:00 -0800181 if (!(at & AT_EGRESS)) {
David S. Millere9ce1cd2006-08-21 23:54:55 -0700182 if (m->tcfm_ok_push)
Herbert Xuf40ae912015-04-17 13:32:09 +0800183 skb_push(skb2, skb->mac_len);
Changli Gaofeed1f12009-11-17 04:14:00 -0800184 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700185
186 /* mirror is always swallowed */
David S. Millere9ce1cd2006-08-21 23:54:55 -0700187 if (m->tcfm_eaction != TCA_EGRESS_MIRROR)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700188 skb2->tc_verd = SET_TC_FROM(skb2->tc_verd, at);
189
Eric Dumazet8964be42009-11-20 15:35:04 -0800190 skb2->skb_iif = skb->dev->ifindex;
Changli Gao210d6de2010-06-24 16:25:12 +0000191 skb2->dev = dev;
Jamal Hadi Salim8919bc12011-08-15 05:25:40 +0000192 err = dev_queue_xmit(skb2);
Changli Gaofeed1f12009-11-17 04:14:00 -0800193
Changli Gaofeed1f12009-11-17 04:14:00 -0800194 if (err) {
Eric Dumazet2ee22a92015-07-06 05:18:09 -0700195out:
196 qstats_overlimit_inc(this_cpu_ptr(m->common.cpu_qstats));
Jason Wang16c0b162012-08-15 20:44:27 +0000197 if (m->tcfm_eaction != TCA_EGRESS_MIRROR)
198 retval = TC_ACT_SHOT;
Eric Dumazet2ee22a92015-07-06 05:18:09 -0700199 }
200 rcu_read_unlock();
Changli Gaofeed1f12009-11-17 04:14:00 -0800201
202 return retval;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203}
204
David S. Millere9ce1cd2006-08-21 23:54:55 -0700205static int tcf_mirred_dump(struct sk_buff *skb, struct tc_action *a, int bind, int ref)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700206{
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -0700207 unsigned char *b = skb_tail_pointer(skb);
David S. Millere9ce1cd2006-08-21 23:54:55 -0700208 struct tcf_mirred *m = a->priv;
Eric Dumazet1c40be12010-08-16 20:04:22 +0000209 struct tc_mirred opt = {
210 .index = m->tcf_index,
211 .action = m->tcf_action,
212 .refcnt = m->tcf_refcnt - ref,
213 .bindcnt = m->tcf_bindcnt - bind,
214 .eaction = m->tcfm_eaction,
215 .ifindex = m->tcfm_ifindex,
216 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217 struct tcf_t t;
218
David S. Miller1b34ec42012-03-29 05:11:39 -0400219 if (nla_put(skb, TCA_MIRRED_PARMS, sizeof(opt), &opt))
220 goto nla_put_failure;
David S. Millere9ce1cd2006-08-21 23:54:55 -0700221 t.install = jiffies_to_clock_t(jiffies - m->tcf_tm.install);
222 t.lastuse = jiffies_to_clock_t(jiffies - m->tcf_tm.lastuse);
223 t.expires = jiffies_to_clock_t(m->tcf_tm.expires);
David S. Miller1b34ec42012-03-29 05:11:39 -0400224 if (nla_put(skb, TCA_MIRRED_TM, sizeof(t), &t))
225 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700226 return skb->len;
227
Patrick McHardy7ba699c2008-01-22 22:11:50 -0800228nla_put_failure:
Arnaldo Carvalho de Melodc5fc572007-03-25 23:06:12 -0700229 nlmsg_trim(skb, b);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700230 return -1;
231}
232
WANG Congddf97cc2016-02-22 15:57:53 -0800233static int tcf_mirred_walker(struct net *net, struct sk_buff *skb,
234 struct netlink_callback *cb, int type,
235 struct tc_action *a)
236{
237 struct tc_action_net *tn = net_generic(net, mirred_net_id);
238
239 return tcf_generic_walker(tn, skb, cb, type, a);
240}
241
242static int tcf_mirred_search(struct net *net, struct tc_action *a, u32 index)
243{
244 struct tc_action_net *tn = net_generic(net, mirred_net_id);
245
246 return tcf_hash_search(tn, a, index);
247}
248
stephen hemminger3b879562010-07-22 18:45:04 +0000249static int mirred_device_event(struct notifier_block *unused,
250 unsigned long event, void *ptr)
251{
Jiri Pirko351638e2013-05-28 01:30:21 +0000252 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
stephen hemminger3b879562010-07-22 18:45:04 +0000253 struct tcf_mirred *m;
254
Eric Dumazet2ee22a92015-07-06 05:18:09 -0700255 ASSERT_RTNL();
WANG Cong6bd00b82015-10-01 11:37:42 -0700256 if (event == NETDEV_UNREGISTER) {
257 spin_lock_bh(&mirred_list_lock);
stephen hemminger3b879562010-07-22 18:45:04 +0000258 list_for_each_entry(m, &mirred_list, tcfm_list) {
Eric Dumazet2ee22a92015-07-06 05:18:09 -0700259 if (rcu_access_pointer(m->tcfm_dev) == dev) {
stephen hemminger3b879562010-07-22 18:45:04 +0000260 dev_put(dev);
Eric Dumazet2ee22a92015-07-06 05:18:09 -0700261 /* Note : no rcu grace period necessary, as
262 * net_device are already rcu protected.
263 */
264 RCU_INIT_POINTER(m->tcfm_dev, NULL);
stephen hemminger3b879562010-07-22 18:45:04 +0000265 }
266 }
WANG Cong6bd00b82015-10-01 11:37:42 -0700267 spin_unlock_bh(&mirred_list_lock);
268 }
stephen hemminger3b879562010-07-22 18:45:04 +0000269
270 return NOTIFY_DONE;
271}
272
/*
 * Notifier block registered in mirred_init_module() and unregistered in
 * mirred_cleanup_module(); routes netdevice events to mirred_device_event().
 */
static struct notifier_block mirred_device_notifier = {
	.notifier_call = mirred_device_event,
};
276
/*
 * Operations table for the "mirred" action. It is handed to
 * tcf_register_action() at module load and to tc_action_net_init() for
 * each namespace.
 */
static struct tc_action_ops act_mirred_ops = {
	.kind		=	"mirred",
	.type		=	TCA_ACT_MIRRED,
	.owner		=	THIS_MODULE,
	.act		=	tcf_mirred,		/* per-packet work */
	.dump		=	tcf_mirred_dump,	/* fill a netlink dump */
	.cleanup	=	tcf_mirred_release,	/* unlink and drop the device ref */
	.init		=	tcf_mirred_init,	/* create or update from netlink */
	.walk		=	tcf_mirred_walker,
	.lookup		=	tcf_mirred_search,
};
288
289static __net_init int mirred_init_net(struct net *net)
290{
291 struct tc_action_net *tn = net_generic(net, mirred_net_id);
292
293 return tc_action_net_init(tn, &act_mirred_ops, MIRRED_TAB_MASK);
294}
295
296static void __net_exit mirred_exit_net(struct net *net)
297{
298 struct tc_action_net *tn = net_generic(net, mirred_net_id);
299
300 tc_action_net_exit(tn);
301}
302
/*
 * Per-namespace operations, handed to tcf_register_action() together with
 * act_mirred_ops. .id points at mirred_net_id, the value the rest of this
 * file passes to net_generic().
 */
static struct pernet_operations mirred_net_ops = {
	.init = mirred_init_net,
	.exit = mirred_exit_net,
	.id   = &mirred_net_id,
	/* NOTE(review): presumably the size of the per-net area - confirm. */
	.size = sizeof(struct tc_action_net),
};
309
/* Module metadata. */
MODULE_AUTHOR("Jamal Hadi Salim(2002)");
MODULE_DESCRIPTION("Device Mirror/redirect actions");
MODULE_LICENSE("GPL");
313
David S. Millere9ce1cd2006-08-21 23:54:55 -0700314static int __init mirred_init_module(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315{
stephen hemminger3b879562010-07-22 18:45:04 +0000316 int err = register_netdevice_notifier(&mirred_device_notifier);
317 if (err)
318 return err;
319
stephen hemminger6ff9c362010-05-12 06:37:05 +0000320 pr_info("Mirror/redirect action on\n");
WANG Congddf97cc2016-02-22 15:57:53 -0800321 return tcf_register_action(&act_mirred_ops, &mirred_net_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700322}
323
/*
 * Module exit point: undo mirred_init_module() in reverse order - the
 * action is unregistered first, then the netdevice notifier.
 */
static void __exit mirred_cleanup_module(void)
{
	tcf_unregister_action(&act_mirred_ops, &mirred_net_ops);
	unregister_netdevice_notifier(&mirred_device_notifier);
}
329
/* Hook the load/unload entry points up to the module machinery. */
module_init(mirred_init_module);
module_exit(mirred_cleanup_module);