blob: fdfdb56aaae263e4042e1e343f9d36fd8cc105cc [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * net/sched/sch_red.c Random Early Detection queue.
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version
7 * 2 of the License, or (at your option) any later version.
8 *
9 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
10 *
11 * Changes:
Thomas Grafdba051f2005-11-05 21:14:08 +010012 * J Hadi Salim 980914: computation fixes
Linus Torvalds1da177e2005-04-16 15:20:36 -070013 * Alexey Makarenko <makar@phoenix.kharkov.ua> 990814: qave on idle link was calculated incorrectly.
Thomas Grafdba051f2005-11-05 21:14:08 +010014 * J Hadi Salim 980816: ECN support
Linus Torvalds1da177e2005-04-16 15:20:36 -070015 */
16
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/types.h>
19#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <linux/skbuff.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <net/pkt_sched.h>
22#include <net/inet_ecn.h>
Thomas Graf6b31b282005-11-05 21:14:05 +010023#include <net/red.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070024
25
Thomas Graf6b31b282005-11-05 21:14:05 +010026/* Parameters, settable by user:
Linus Torvalds1da177e2005-04-16 15:20:36 -070027 -----------------------------
28
29 limit - bytes (must be > qth_max + burst)
30
31 Hard limit on queue length, should be chosen >qth_max
32 to allow packet bursts. This parameter does not
33 affect the algorithms behaviour and can be chosen
34 arbitrarily high (well, less than ram size)
35 Really, this limit will never be reached
36 if RED works correctly.
Linus Torvalds1da177e2005-04-16 15:20:36 -070037 */
38
Eric Dumazetcc7ec452011-01-19 19:26:56 +000039struct red_sched_data {
Thomas Graf6b31b282005-11-05 21:14:05 +010040 u32 limit; /* HARD maximal queue length */
41 unsigned char flags;
Eric Dumazet8af2a212011-12-08 06:06:03 +000042 struct timer_list adapt_timer;
Kees Cookcdeabbb2017-10-16 17:29:17 -070043 struct Qdisc *sch;
Thomas Graf6b31b282005-11-05 21:14:05 +010044 struct red_parms parms;
Eric Dumazeteeca6682012-01-05 02:25:16 +000045 struct red_vars vars;
Thomas Graf6b31b282005-11-05 21:14:05 +010046 struct red_stats stats;
Patrick McHardyf38c39d2006-03-20 19:20:44 -080047 struct Qdisc *qdisc;
Linus Torvalds1da177e2005-04-16 15:20:36 -070048};
49
Thomas Graf6b31b282005-11-05 21:14:05 +010050static inline int red_use_ecn(struct red_sched_data *q)
Linus Torvalds1da177e2005-04-16 15:20:36 -070051{
Thomas Graf6b31b282005-11-05 21:14:05 +010052 return q->flags & TC_RED_ECN;
Linus Torvalds1da177e2005-04-16 15:20:36 -070053}
54
Thomas Grafbdc450a2005-11-05 21:14:28 +010055static inline int red_use_harddrop(struct red_sched_data *q)
56{
57 return q->flags & TC_RED_HARDDROP;
58}
59
Eric Dumazet520ac302016-06-21 23:16:49 -070060static int red_enqueue(struct sk_buff *skb, struct Qdisc *sch,
61 struct sk_buff **to_free)
Linus Torvalds1da177e2005-04-16 15:20:36 -070062{
63 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -080064 struct Qdisc *child = q->qdisc;
65 int ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -070066
Eric Dumazeteeca6682012-01-05 02:25:16 +000067 q->vars.qavg = red_calc_qavg(&q->parms,
68 &q->vars,
69 child->qstats.backlog);
Linus Torvalds1da177e2005-04-16 15:20:36 -070070
Eric Dumazeteeca6682012-01-05 02:25:16 +000071 if (red_is_idling(&q->vars))
72 red_end_of_idle_period(&q->vars);
Linus Torvalds1da177e2005-04-16 15:20:36 -070073
Eric Dumazeteeca6682012-01-05 02:25:16 +000074 switch (red_action(&q->parms, &q->vars, q->vars.qavg)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +000075 case RED_DONT_MARK:
76 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070077
Eric Dumazetcc7ec452011-01-19 19:26:56 +000078 case RED_PROB_MARK:
John Fastabend25331d62014-09-28 11:53:29 -070079 qdisc_qstats_overlimit(sch);
Eric Dumazetcc7ec452011-01-19 19:26:56 +000080 if (!red_use_ecn(q) || !INET_ECN_set_ce(skb)) {
81 q->stats.prob_drop++;
82 goto congestion_drop;
83 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070084
Eric Dumazetcc7ec452011-01-19 19:26:56 +000085 q->stats.prob_mark++;
86 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070087
Eric Dumazetcc7ec452011-01-19 19:26:56 +000088 case RED_HARD_MARK:
John Fastabend25331d62014-09-28 11:53:29 -070089 qdisc_qstats_overlimit(sch);
Eric Dumazetcc7ec452011-01-19 19:26:56 +000090 if (red_use_harddrop(q) || !red_use_ecn(q) ||
91 !INET_ECN_set_ce(skb)) {
92 q->stats.forced_drop++;
93 goto congestion_drop;
94 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070095
Eric Dumazetcc7ec452011-01-19 19:26:56 +000096 q->stats.forced_mark++;
97 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070098 }
99
Eric Dumazet520ac302016-06-21 23:16:49 -0700100 ret = qdisc_enqueue(skb, child, to_free);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800101 if (likely(ret == NET_XMIT_SUCCESS)) {
WANG Congd7f4f332016-06-01 16:15:18 -0700102 qdisc_qstats_backlog_inc(sch, skb);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800103 sch->q.qlen++;
Jarek Poplawski378a2f02008-08-04 22:31:03 -0700104 } else if (net_xmit_drop_count(ret)) {
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800105 q->stats.pdrop++;
John Fastabend25331d62014-09-28 11:53:29 -0700106 qdisc_qstats_drop(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800107 }
108 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109
Thomas Graf6b31b282005-11-05 21:14:05 +0100110congestion_drop:
Eric Dumazet520ac302016-06-21 23:16:49 -0700111 qdisc_drop(skb, sch, to_free);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112 return NET_XMIT_CN;
113}
114
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000115static struct sk_buff *red_dequeue(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700116{
117 struct sk_buff *skb;
118 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800119 struct Qdisc *child = q->qdisc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800121 skb = child->dequeue(child);
Eric Dumazet9190b3b2011-01-20 23:31:33 -0800122 if (skb) {
123 qdisc_bstats_update(sch, skb);
WANG Congd7f4f332016-06-01 16:15:18 -0700124 qdisc_qstats_backlog_dec(sch, skb);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800125 sch->q.qlen--;
Eric Dumazet9190b3b2011-01-20 23:31:33 -0800126 } else {
Eric Dumazeteeca6682012-01-05 02:25:16 +0000127 if (!red_is_idling(&q->vars))
128 red_start_of_idle_period(&q->vars);
Eric Dumazet9190b3b2011-01-20 23:31:33 -0800129 }
Thomas Graf9e178ff2005-11-05 21:14:06 +0100130 return skb;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131}
132
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000133static struct sk_buff *red_peek(struct Qdisc *sch)
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700134{
135 struct red_sched_data *q = qdisc_priv(sch);
136 struct Qdisc *child = q->qdisc;
137
138 return child->ops->peek(child);
139}
140
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000141static void red_reset(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700142{
143 struct red_sched_data *q = qdisc_priv(sch);
144
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800145 qdisc_reset(q->qdisc);
WANG Congd7f4f332016-06-01 16:15:18 -0700146 sch->qstats.backlog = 0;
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800147 sch->q.qlen = 0;
Eric Dumazeteeca6682012-01-05 02:25:16 +0000148 red_restart(&q->vars);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700149}
150
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800151static void red_destroy(struct Qdisc *sch)
152{
153 struct red_sched_data *q = qdisc_priv(sch);
Eric Dumazet8af2a212011-12-08 06:06:03 +0000154
155 del_timer_sync(&q->adapt_timer);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800156 qdisc_destroy(q->qdisc);
157}
158
Patrick McHardy27a34212008-01-23 20:35:39 -0800159static const struct nla_policy red_policy[TCA_RED_MAX + 1] = {
160 [TCA_RED_PARMS] = { .len = sizeof(struct tc_red_qopt) },
161 [TCA_RED_STAB] = { .len = RED_STAB_SIZE },
Eric Dumazeta73ed262011-12-09 02:46:45 +0000162 [TCA_RED_MAX_P] = { .type = NLA_U32 },
Patrick McHardy27a34212008-01-23 20:35:39 -0800163};
164
Patrick McHardy1e904742008-01-22 22:11:17 -0800165static int red_change(struct Qdisc *sch, struct nlattr *opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700166{
167 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardy1e904742008-01-22 22:11:17 -0800168 struct nlattr *tb[TCA_RED_MAX + 1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700169 struct tc_red_qopt *ctl;
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800170 struct Qdisc *child = NULL;
Patrick McHardycee63722008-01-23 20:33:32 -0800171 int err;
Eric Dumazeta73ed262011-12-09 02:46:45 +0000172 u32 max_P;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700173
Patrick McHardycee63722008-01-23 20:33:32 -0800174 if (opt == NULL)
Thomas Grafdba051f2005-11-05 21:14:08 +0100175 return -EINVAL;
176
Johannes Bergfceb6432017-04-12 14:34:07 +0200177 err = nla_parse_nested(tb, TCA_RED_MAX, opt, red_policy, NULL);
Patrick McHardycee63722008-01-23 20:33:32 -0800178 if (err < 0)
179 return err;
180
Patrick McHardy1e904742008-01-22 22:11:17 -0800181 if (tb[TCA_RED_PARMS] == NULL ||
Patrick McHardy27a34212008-01-23 20:35:39 -0800182 tb[TCA_RED_STAB] == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700183 return -EINVAL;
184
Eric Dumazeta73ed262011-12-09 02:46:45 +0000185 max_P = tb[TCA_RED_MAX_P] ? nla_get_u32(tb[TCA_RED_MAX_P]) : 0;
186
Patrick McHardy1e904742008-01-22 22:11:17 -0800187 ctl = nla_data(tb[TCA_RED_PARMS]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700188
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800189 if (ctl->limit > 0) {
Patrick McHardyfb0305c2008-07-05 23:40:21 -0700190 child = fifo_create_dflt(sch, &bfifo_qdisc_ops, ctl->limit);
191 if (IS_ERR(child))
192 return PTR_ERR(child);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800193 }
194
Jiri Kosina49b49972017-03-08 16:03:32 +0100195 if (child != &noop_qdisc)
196 qdisc_hash_add(child, true);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700197 sch_tree_lock(sch);
198 q->flags = ctl->flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700199 q->limit = ctl->limit;
Patrick McHardy5e50da02006-11-29 17:36:20 -0800200 if (child) {
WANG Cong2ccccf52016-02-25 14:55:01 -0800201 qdisc_tree_reduce_backlog(q->qdisc, q->qdisc->q.qlen,
202 q->qdisc->qstats.backlog);
Patrick McHardyb94c8af2008-11-20 04:11:36 -0800203 qdisc_destroy(q->qdisc);
204 q->qdisc = child;
Patrick McHardy5e50da02006-11-29 17:36:20 -0800205 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700206
Eric Dumazeteeca6682012-01-05 02:25:16 +0000207 red_set_parms(&q->parms,
208 ctl->qth_min, ctl->qth_max, ctl->Wlog,
Eric Dumazeta73ed262011-12-09 02:46:45 +0000209 ctl->Plog, ctl->Scell_log,
210 nla_data(tb[TCA_RED_STAB]),
211 max_P);
Eric Dumazeteeca6682012-01-05 02:25:16 +0000212 red_set_vars(&q->vars);
Thomas Graf6b31b282005-11-05 21:14:05 +0100213
Eric Dumazet8af2a212011-12-08 06:06:03 +0000214 del_timer(&q->adapt_timer);
215 if (ctl->flags & TC_RED_ADAPTATIVE)
216 mod_timer(&q->adapt_timer, jiffies + HZ/2);
217
Eric Dumazet1ee5fa12011-12-01 11:06:34 +0000218 if (!q->qdisc->q.qlen)
Eric Dumazeteeca6682012-01-05 02:25:16 +0000219 red_start_of_idle_period(&q->vars);
Thomas Grafdba051f2005-11-05 21:14:08 +0100220
Linus Torvalds1da177e2005-04-16 15:20:36 -0700221 sch_tree_unlock(sch);
222 return 0;
223}
224
Kees Cookcdeabbb2017-10-16 17:29:17 -0700225static inline void red_adaptative_timer(struct timer_list *t)
Eric Dumazet8af2a212011-12-08 06:06:03 +0000226{
Kees Cookcdeabbb2017-10-16 17:29:17 -0700227 struct red_sched_data *q = from_timer(q, t, adapt_timer);
228 struct Qdisc *sch = q->sch;
Eric Dumazet8af2a212011-12-08 06:06:03 +0000229 spinlock_t *root_lock = qdisc_lock(qdisc_root_sleeping(sch));
230
231 spin_lock(root_lock);
Eric Dumazeteeca6682012-01-05 02:25:16 +0000232 red_adaptative_algo(&q->parms, &q->vars);
Eric Dumazet8af2a212011-12-08 06:06:03 +0000233 mod_timer(&q->adapt_timer, jiffies + HZ/2);
234 spin_unlock(root_lock);
235}
236
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000237static int red_init(struct Qdisc *sch, struct nlattr *opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700238{
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800239 struct red_sched_data *q = qdisc_priv(sch);
240
241 q->qdisc = &noop_qdisc;
Kees Cookcdeabbb2017-10-16 17:29:17 -0700242 q->sch = sch;
243 timer_setup(&q->adapt_timer, red_adaptative_timer, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700244 return red_change(sch, opt);
245}
246
247static int red_dump(struct Qdisc *sch, struct sk_buff *skb)
248{
249 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardy1e904742008-01-22 22:11:17 -0800250 struct nlattr *opts = NULL;
Thomas Graf6b31b282005-11-05 21:14:05 +0100251 struct tc_red_qopt opt = {
252 .limit = q->limit,
253 .flags = q->flags,
254 .qth_min = q->parms.qth_min >> q->parms.Wlog,
255 .qth_max = q->parms.qth_max >> q->parms.Wlog,
256 .Wlog = q->parms.Wlog,
257 .Plog = q->parms.Plog,
258 .Scell_log = q->parms.Scell_log,
259 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700260
Eric Dumazet0dfb33a2011-01-03 08:11:38 +0000261 sch->qstats.backlog = q->qdisc->qstats.backlog;
Patrick McHardy1e904742008-01-22 22:11:17 -0800262 opts = nla_nest_start(skb, TCA_OPTIONS);
263 if (opts == NULL)
264 goto nla_put_failure;
David S. Miller1b34ec42012-03-29 05:11:39 -0400265 if (nla_put(skb, TCA_RED_PARMS, sizeof(opt), &opt) ||
266 nla_put_u32(skb, TCA_RED_MAX_P, q->parms.max_P))
267 goto nla_put_failure;
Patrick McHardy1e904742008-01-22 22:11:17 -0800268 return nla_nest_end(skb, opts);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269
Patrick McHardy1e904742008-01-22 22:11:17 -0800270nla_put_failure:
Thomas Grafbc3ed282008-06-03 16:36:54 -0700271 nla_nest_cancel(skb, opts);
272 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700273}
274
275static int red_dump_stats(struct Qdisc *sch, struct gnet_dump *d)
276{
277 struct red_sched_data *q = qdisc_priv(sch);
Thomas Graf6b31b282005-11-05 21:14:05 +0100278 struct tc_red_xstats st = {
279 .early = q->stats.prob_drop + q->stats.forced_drop,
280 .pdrop = q->stats.pdrop,
281 .other = q->stats.other,
282 .marked = q->stats.prob_mark + q->stats.forced_mark,
283 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700284
Thomas Graf6b31b282005-11-05 21:14:05 +0100285 return gnet_stats_copy_app(d, &st, sizeof(st));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286}
287
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800288static int red_dump_class(struct Qdisc *sch, unsigned long cl,
289 struct sk_buff *skb, struct tcmsg *tcm)
290{
291 struct red_sched_data *q = qdisc_priv(sch);
292
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800293 tcm->tcm_handle |= TC_H_MIN(1);
294 tcm->tcm_info = q->qdisc->handle;
295 return 0;
296}
297
298static int red_graft(struct Qdisc *sch, unsigned long arg, struct Qdisc *new,
299 struct Qdisc **old)
300{
301 struct red_sched_data *q = qdisc_priv(sch);
302
303 if (new == NULL)
304 new = &noop_qdisc;
305
WANG Cong86a79962016-02-25 14:55:00 -0800306 *old = qdisc_replace(sch, new, &q->qdisc);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800307 return 0;
308}
309
310static struct Qdisc *red_leaf(struct Qdisc *sch, unsigned long arg)
311{
312 struct red_sched_data *q = qdisc_priv(sch);
313 return q->qdisc;
314}
315
WANG Cong143976c2017-08-24 16:51:29 -0700316static unsigned long red_find(struct Qdisc *sch, u32 classid)
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800317{
318 return 1;
319}
320
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800321static void red_walk(struct Qdisc *sch, struct qdisc_walker *walker)
322{
323 if (!walker->stop) {
324 if (walker->count >= walker->skip)
325 if (walker->fn(sch, 1, walker) < 0) {
326 walker->stop = 1;
327 return;
328 }
329 walker->count++;
330 }
331}
332
Eric Dumazet20fea082007-11-14 01:44:41 -0800333static const struct Qdisc_class_ops red_class_ops = {
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800334 .graft = red_graft,
335 .leaf = red_leaf,
WANG Cong143976c2017-08-24 16:51:29 -0700336 .find = red_find,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800337 .walk = red_walk,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800338 .dump = red_dump_class,
339};
340
Eric Dumazet20fea082007-11-14 01:44:41 -0800341static struct Qdisc_ops red_qdisc_ops __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700342 .id = "red",
343 .priv_size = sizeof(struct red_sched_data),
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800344 .cl_ops = &red_class_ops,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700345 .enqueue = red_enqueue,
346 .dequeue = red_dequeue,
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700347 .peek = red_peek,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700348 .init = red_init,
349 .reset = red_reset,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800350 .destroy = red_destroy,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351 .change = red_change,
352 .dump = red_dump,
353 .dump_stats = red_dump_stats,
354 .owner = THIS_MODULE,
355};
356
357static int __init red_module_init(void)
358{
359 return register_qdisc(&red_qdisc_ops);
360}
Thomas Grafdba051f2005-11-05 21:14:08 +0100361
362static void __exit red_module_exit(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363{
364 unregister_qdisc(&red_qdisc_ops);
365}
Thomas Grafdba051f2005-11-05 21:14:08 +0100366
Linus Torvalds1da177e2005-04-16 15:20:36 -0700367module_init(red_module_init)
368module_exit(red_module_exit)
Thomas Grafdba051f2005-11-05 21:14:08 +0100369
Linus Torvalds1da177e2005-04-16 15:20:36 -0700370MODULE_LICENSE("GPL");