blob: 235942f3464e7fa90886c685e339e6cf88114cbc [file] [log] [blame]
/*
 * net/sched/sch_red.c	Random Early Detection queue.
 *
 *		This program is free software; you can redistribute it and/or
 *		modify it under the terms of the GNU General Public License
 *		as published by the Free Software Foundation; either version
 *		2 of the License, or (at your option) any later version.
 *
 * Authors:	Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 *
 * Changes:
 * J Hadi Salim 980914:	computation fixes
 * Alexey Makarenko <makar@phoenix.kharkov.ua> 990814: qave on idle link was calculated incorrectly.
 * J Hadi Salim 980816:	ECN support
 */
16
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/types.h>
19#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <linux/skbuff.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <net/pkt_sched.h>
22#include <net/inet_ecn.h>
Thomas Graf6b31b282005-11-05 21:14:05 +010023#include <net/red.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070024
25
/*	Parameters, settable by user:
	-----------------------------

	limit		- bytes (must be > qth_max + burst)

	Hard limit on queue length, should be chosen > qth_max
	to allow packet bursts. This parameter does not
	affect the algorithm's behaviour and can be chosen
	arbitrarily high (well, less than RAM size).
	Really, this limit will never be reached
	if RED works correctly.
 */
38
Eric Dumazetcc7ec452011-01-19 19:26:56 +000039struct red_sched_data {
Thomas Graf6b31b282005-11-05 21:14:05 +010040 u32 limit; /* HARD maximal queue length */
41 unsigned char flags;
Eric Dumazet8af2a212011-12-08 06:06:03 +000042 struct timer_list adapt_timer;
Thomas Graf6b31b282005-11-05 21:14:05 +010043 struct red_parms parms;
Eric Dumazeteeca6682012-01-05 02:25:16 +000044 struct red_vars vars;
Thomas Graf6b31b282005-11-05 21:14:05 +010045 struct red_stats stats;
Patrick McHardyf38c39d2006-03-20 19:20:44 -080046 struct Qdisc *qdisc;
Linus Torvalds1da177e2005-04-16 15:20:36 -070047};
48
Thomas Graf6b31b282005-11-05 21:14:05 +010049static inline int red_use_ecn(struct red_sched_data *q)
Linus Torvalds1da177e2005-04-16 15:20:36 -070050{
Thomas Graf6b31b282005-11-05 21:14:05 +010051 return q->flags & TC_RED_ECN;
Linus Torvalds1da177e2005-04-16 15:20:36 -070052}
53
Thomas Grafbdc450a2005-11-05 21:14:28 +010054static inline int red_use_harddrop(struct red_sched_data *q)
55{
56 return q->flags & TC_RED_HARDDROP;
57}
58
Eric Dumazetcc7ec452011-01-19 19:26:56 +000059static int red_enqueue(struct sk_buff *skb, struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -070060{
61 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -080062 struct Qdisc *child = q->qdisc;
63 int ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -070064
Eric Dumazeteeca6682012-01-05 02:25:16 +000065 q->vars.qavg = red_calc_qavg(&q->parms,
66 &q->vars,
67 child->qstats.backlog);
Linus Torvalds1da177e2005-04-16 15:20:36 -070068
Eric Dumazeteeca6682012-01-05 02:25:16 +000069 if (red_is_idling(&q->vars))
70 red_end_of_idle_period(&q->vars);
Linus Torvalds1da177e2005-04-16 15:20:36 -070071
Eric Dumazeteeca6682012-01-05 02:25:16 +000072 switch (red_action(&q->parms, &q->vars, q->vars.qavg)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +000073 case RED_DONT_MARK:
74 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070075
Eric Dumazetcc7ec452011-01-19 19:26:56 +000076 case RED_PROB_MARK:
John Fastabend25331d62014-09-28 11:53:29 -070077 qdisc_qstats_overlimit(sch);
Eric Dumazetcc7ec452011-01-19 19:26:56 +000078 if (!red_use_ecn(q) || !INET_ECN_set_ce(skb)) {
79 q->stats.prob_drop++;
80 goto congestion_drop;
81 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070082
Eric Dumazetcc7ec452011-01-19 19:26:56 +000083 q->stats.prob_mark++;
84 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070085
Eric Dumazetcc7ec452011-01-19 19:26:56 +000086 case RED_HARD_MARK:
John Fastabend25331d62014-09-28 11:53:29 -070087 qdisc_qstats_overlimit(sch);
Eric Dumazetcc7ec452011-01-19 19:26:56 +000088 if (red_use_harddrop(q) || !red_use_ecn(q) ||
89 !INET_ECN_set_ce(skb)) {
90 q->stats.forced_drop++;
91 goto congestion_drop;
92 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070093
Eric Dumazetcc7ec452011-01-19 19:26:56 +000094 q->stats.forced_mark++;
95 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070096 }
97
Jussi Kivilinna5f861732008-07-20 00:08:04 -070098 ret = qdisc_enqueue(skb, child);
Patrick McHardyf38c39d2006-03-20 19:20:44 -080099 if (likely(ret == NET_XMIT_SUCCESS)) {
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800100 sch->q.qlen++;
Jarek Poplawski378a2f02008-08-04 22:31:03 -0700101 } else if (net_xmit_drop_count(ret)) {
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800102 q->stats.pdrop++;
John Fastabend25331d62014-09-28 11:53:29 -0700103 qdisc_qstats_drop(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800104 }
105 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700106
Thomas Graf6b31b282005-11-05 21:14:05 +0100107congestion_drop:
Thomas Graf9e178ff2005-11-05 21:14:06 +0100108 qdisc_drop(skb, sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109 return NET_XMIT_CN;
110}
111
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000112static struct sk_buff *red_dequeue(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700113{
114 struct sk_buff *skb;
115 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800116 struct Qdisc *child = q->qdisc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700117
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800118 skb = child->dequeue(child);
Eric Dumazet9190b3b2011-01-20 23:31:33 -0800119 if (skb) {
120 qdisc_bstats_update(sch, skb);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800121 sch->q.qlen--;
Eric Dumazet9190b3b2011-01-20 23:31:33 -0800122 } else {
Eric Dumazeteeca6682012-01-05 02:25:16 +0000123 if (!red_is_idling(&q->vars))
124 red_start_of_idle_period(&q->vars);
Eric Dumazet9190b3b2011-01-20 23:31:33 -0800125 }
Thomas Graf9e178ff2005-11-05 21:14:06 +0100126 return skb;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700127}
128
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000129static struct sk_buff *red_peek(struct Qdisc *sch)
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700130{
131 struct red_sched_data *q = qdisc_priv(sch);
132 struct Qdisc *child = q->qdisc;
133
134 return child->ops->peek(child);
135}
136
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000137static void red_reset(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700138{
139 struct red_sched_data *q = qdisc_priv(sch);
140
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800141 qdisc_reset(q->qdisc);
142 sch->q.qlen = 0;
Eric Dumazeteeca6682012-01-05 02:25:16 +0000143 red_restart(&q->vars);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700144}
145
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800146static void red_destroy(struct Qdisc *sch)
147{
148 struct red_sched_data *q = qdisc_priv(sch);
Eric Dumazet8af2a212011-12-08 06:06:03 +0000149
150 del_timer_sync(&q->adapt_timer);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800151 qdisc_destroy(q->qdisc);
152}
153
Patrick McHardy27a34212008-01-23 20:35:39 -0800154static const struct nla_policy red_policy[TCA_RED_MAX + 1] = {
155 [TCA_RED_PARMS] = { .len = sizeof(struct tc_red_qopt) },
156 [TCA_RED_STAB] = { .len = RED_STAB_SIZE },
Eric Dumazeta73ed262011-12-09 02:46:45 +0000157 [TCA_RED_MAX_P] = { .type = NLA_U32 },
Patrick McHardy27a34212008-01-23 20:35:39 -0800158};
159
Patrick McHardy1e904742008-01-22 22:11:17 -0800160static int red_change(struct Qdisc *sch, struct nlattr *opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700161{
162 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardy1e904742008-01-22 22:11:17 -0800163 struct nlattr *tb[TCA_RED_MAX + 1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700164 struct tc_red_qopt *ctl;
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800165 struct Qdisc *child = NULL;
Patrick McHardycee63722008-01-23 20:33:32 -0800166 int err;
Eric Dumazeta73ed262011-12-09 02:46:45 +0000167 u32 max_P;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168
Patrick McHardycee63722008-01-23 20:33:32 -0800169 if (opt == NULL)
Thomas Grafdba051f2005-11-05 21:14:08 +0100170 return -EINVAL;
171
Patrick McHardy27a34212008-01-23 20:35:39 -0800172 err = nla_parse_nested(tb, TCA_RED_MAX, opt, red_policy);
Patrick McHardycee63722008-01-23 20:33:32 -0800173 if (err < 0)
174 return err;
175
Patrick McHardy1e904742008-01-22 22:11:17 -0800176 if (tb[TCA_RED_PARMS] == NULL ||
Patrick McHardy27a34212008-01-23 20:35:39 -0800177 tb[TCA_RED_STAB] == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700178 return -EINVAL;
179
Eric Dumazeta73ed262011-12-09 02:46:45 +0000180 max_P = tb[TCA_RED_MAX_P] ? nla_get_u32(tb[TCA_RED_MAX_P]) : 0;
181
Patrick McHardy1e904742008-01-22 22:11:17 -0800182 ctl = nla_data(tb[TCA_RED_PARMS]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700183
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800184 if (ctl->limit > 0) {
Patrick McHardyfb0305c2008-07-05 23:40:21 -0700185 child = fifo_create_dflt(sch, &bfifo_qdisc_ops, ctl->limit);
186 if (IS_ERR(child))
187 return PTR_ERR(child);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800188 }
189
Linus Torvalds1da177e2005-04-16 15:20:36 -0700190 sch_tree_lock(sch);
191 q->flags = ctl->flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700192 q->limit = ctl->limit;
Patrick McHardy5e50da02006-11-29 17:36:20 -0800193 if (child) {
WANG Cong2ccccf52016-02-25 14:55:01 -0800194 qdisc_tree_reduce_backlog(q->qdisc, q->qdisc->q.qlen,
195 q->qdisc->qstats.backlog);
Patrick McHardyb94c8af2008-11-20 04:11:36 -0800196 qdisc_destroy(q->qdisc);
197 q->qdisc = child;
Patrick McHardy5e50da02006-11-29 17:36:20 -0800198 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700199
Eric Dumazeteeca6682012-01-05 02:25:16 +0000200 red_set_parms(&q->parms,
201 ctl->qth_min, ctl->qth_max, ctl->Wlog,
Eric Dumazeta73ed262011-12-09 02:46:45 +0000202 ctl->Plog, ctl->Scell_log,
203 nla_data(tb[TCA_RED_STAB]),
204 max_P);
Eric Dumazeteeca6682012-01-05 02:25:16 +0000205 red_set_vars(&q->vars);
Thomas Graf6b31b282005-11-05 21:14:05 +0100206
Eric Dumazet8af2a212011-12-08 06:06:03 +0000207 del_timer(&q->adapt_timer);
208 if (ctl->flags & TC_RED_ADAPTATIVE)
209 mod_timer(&q->adapt_timer, jiffies + HZ/2);
210
Eric Dumazet1ee5fa12011-12-01 11:06:34 +0000211 if (!q->qdisc->q.qlen)
Eric Dumazeteeca6682012-01-05 02:25:16 +0000212 red_start_of_idle_period(&q->vars);
Thomas Grafdba051f2005-11-05 21:14:08 +0100213
Linus Torvalds1da177e2005-04-16 15:20:36 -0700214 sch_tree_unlock(sch);
215 return 0;
216}
217
Eric Dumazet8af2a212011-12-08 06:06:03 +0000218static inline void red_adaptative_timer(unsigned long arg)
219{
220 struct Qdisc *sch = (struct Qdisc *)arg;
221 struct red_sched_data *q = qdisc_priv(sch);
222 spinlock_t *root_lock = qdisc_lock(qdisc_root_sleeping(sch));
223
224 spin_lock(root_lock);
Eric Dumazeteeca6682012-01-05 02:25:16 +0000225 red_adaptative_algo(&q->parms, &q->vars);
Eric Dumazet8af2a212011-12-08 06:06:03 +0000226 mod_timer(&q->adapt_timer, jiffies + HZ/2);
227 spin_unlock(root_lock);
228}
229
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000230static int red_init(struct Qdisc *sch, struct nlattr *opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700231{
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800232 struct red_sched_data *q = qdisc_priv(sch);
233
234 q->qdisc = &noop_qdisc;
Eric Dumazet8af2a212011-12-08 06:06:03 +0000235 setup_timer(&q->adapt_timer, red_adaptative_timer, (unsigned long)sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700236 return red_change(sch, opt);
237}
238
239static int red_dump(struct Qdisc *sch, struct sk_buff *skb)
240{
241 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardy1e904742008-01-22 22:11:17 -0800242 struct nlattr *opts = NULL;
Thomas Graf6b31b282005-11-05 21:14:05 +0100243 struct tc_red_qopt opt = {
244 .limit = q->limit,
245 .flags = q->flags,
246 .qth_min = q->parms.qth_min >> q->parms.Wlog,
247 .qth_max = q->parms.qth_max >> q->parms.Wlog,
248 .Wlog = q->parms.Wlog,
249 .Plog = q->parms.Plog,
250 .Scell_log = q->parms.Scell_log,
251 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700252
Eric Dumazet0dfb33a2011-01-03 08:11:38 +0000253 sch->qstats.backlog = q->qdisc->qstats.backlog;
Patrick McHardy1e904742008-01-22 22:11:17 -0800254 opts = nla_nest_start(skb, TCA_OPTIONS);
255 if (opts == NULL)
256 goto nla_put_failure;
David S. Miller1b34ec42012-03-29 05:11:39 -0400257 if (nla_put(skb, TCA_RED_PARMS, sizeof(opt), &opt) ||
258 nla_put_u32(skb, TCA_RED_MAX_P, q->parms.max_P))
259 goto nla_put_failure;
Patrick McHardy1e904742008-01-22 22:11:17 -0800260 return nla_nest_end(skb, opts);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261
Patrick McHardy1e904742008-01-22 22:11:17 -0800262nla_put_failure:
Thomas Grafbc3ed282008-06-03 16:36:54 -0700263 nla_nest_cancel(skb, opts);
264 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700265}
266
267static int red_dump_stats(struct Qdisc *sch, struct gnet_dump *d)
268{
269 struct red_sched_data *q = qdisc_priv(sch);
Thomas Graf6b31b282005-11-05 21:14:05 +0100270 struct tc_red_xstats st = {
271 .early = q->stats.prob_drop + q->stats.forced_drop,
272 .pdrop = q->stats.pdrop,
273 .other = q->stats.other,
274 .marked = q->stats.prob_mark + q->stats.forced_mark,
275 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276
Thomas Graf6b31b282005-11-05 21:14:05 +0100277 return gnet_stats_copy_app(d, &st, sizeof(st));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700278}
279
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800280static int red_dump_class(struct Qdisc *sch, unsigned long cl,
281 struct sk_buff *skb, struct tcmsg *tcm)
282{
283 struct red_sched_data *q = qdisc_priv(sch);
284
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800285 tcm->tcm_handle |= TC_H_MIN(1);
286 tcm->tcm_info = q->qdisc->handle;
287 return 0;
288}
289
290static int red_graft(struct Qdisc *sch, unsigned long arg, struct Qdisc *new,
291 struct Qdisc **old)
292{
293 struct red_sched_data *q = qdisc_priv(sch);
294
295 if (new == NULL)
296 new = &noop_qdisc;
297
WANG Cong86a79962016-02-25 14:55:00 -0800298 *old = qdisc_replace(sch, new, &q->qdisc);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800299 return 0;
300}
301
302static struct Qdisc *red_leaf(struct Qdisc *sch, unsigned long arg)
303{
304 struct red_sched_data *q = qdisc_priv(sch);
305 return q->qdisc;
306}
307
308static unsigned long red_get(struct Qdisc *sch, u32 classid)
309{
310 return 1;
311}
312
/* Counterpart of red_get(); intentionally does nothing. */
static void red_put(struct Qdisc *sch, unsigned long arg)
{
	/* nothing to do */
}
316
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800317static void red_walk(struct Qdisc *sch, struct qdisc_walker *walker)
318{
319 if (!walker->stop) {
320 if (walker->count >= walker->skip)
321 if (walker->fn(sch, 1, walker) < 0) {
322 walker->stop = 1;
323 return;
324 }
325 walker->count++;
326 }
327}
328
Eric Dumazet20fea082007-11-14 01:44:41 -0800329static const struct Qdisc_class_ops red_class_ops = {
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800330 .graft = red_graft,
331 .leaf = red_leaf,
332 .get = red_get,
333 .put = red_put,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800334 .walk = red_walk,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800335 .dump = red_dump_class,
336};
337
Eric Dumazet20fea082007-11-14 01:44:41 -0800338static struct Qdisc_ops red_qdisc_ops __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339 .id = "red",
340 .priv_size = sizeof(struct red_sched_data),
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800341 .cl_ops = &red_class_ops,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700342 .enqueue = red_enqueue,
343 .dequeue = red_dequeue,
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700344 .peek = red_peek,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700345 .init = red_init,
346 .reset = red_reset,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800347 .destroy = red_destroy,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700348 .change = red_change,
349 .dump = red_dump,
350 .dump_stats = red_dump_stats,
351 .owner = THIS_MODULE,
352};
353
354static int __init red_module_init(void)
355{
356 return register_qdisc(&red_qdisc_ops);
357}
Thomas Grafdba051f2005-11-05 21:14:08 +0100358
359static void __exit red_module_exit(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700360{
361 unregister_qdisc(&red_qdisc_ops);
362}
Thomas Grafdba051f2005-11-05 21:14:08 +0100363
Linus Torvalds1da177e2005-04-16 15:20:36 -0700364module_init(red_module_init)
365module_exit(red_module_exit)
Thomas Grafdba051f2005-11-05 21:14:08 +0100366
Linus Torvalds1da177e2005-04-16 15:20:36 -0700367MODULE_LICENSE("GPL");