blob: a0d57530335e229112a3316de1a0a195e01f03d7 [file] [log] [blame]
/*
 * net/sched/sch_red.c	Random Early Detection queue.
 *
 *		This program is free software; you can redistribute it and/or
 *		modify it under the terms of the GNU General Public License
 *		as published by the Free Software Foundation; either version
 *		2 of the License, or (at your option) any later version.
 *
 * Authors:	Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 *
 * Changes:
 * J Hadi Salim 980914:	computation fixes
 * Alexey Makarenko <makar@phoenix.kharkov.ua> 990814: qave on idle link was calculated incorrectly.
 * J Hadi Salim 980816:  ECN support
 */
16
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/types.h>
19#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <linux/skbuff.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <net/pkt_sched.h>
22#include <net/inet_ecn.h>
Thomas Graf6b31b282005-11-05 21:14:05 +010023#include <net/red.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070024
25
/*	Parameters, settable by user:
	-----------------------------

	limit		- bytes (must be > qth_max + burst)

	Hard limit on queue length, should be chosen >qth_max
	to allow packet bursts. This parameter does not
	affect the algorithm's behaviour and can be chosen
	arbitrarily high (well, less than RAM size).
	Really, this limit will never be reached
	if RED works correctly.
 */
38
Eric Dumazetcc7ec452011-01-19 19:26:56 +000039struct red_sched_data {
Thomas Graf6b31b282005-11-05 21:14:05 +010040 u32 limit; /* HARD maximal queue length */
41 unsigned char flags;
Eric Dumazet8af2a212011-12-08 06:06:03 +000042 struct timer_list adapt_timer;
Thomas Graf6b31b282005-11-05 21:14:05 +010043 struct red_parms parms;
Eric Dumazeteeca6682012-01-05 02:25:16 +000044 struct red_vars vars;
Thomas Graf6b31b282005-11-05 21:14:05 +010045 struct red_stats stats;
Patrick McHardyf38c39d2006-03-20 19:20:44 -080046 struct Qdisc *qdisc;
Linus Torvalds1da177e2005-04-16 15:20:36 -070047};
48
Thomas Graf6b31b282005-11-05 21:14:05 +010049static inline int red_use_ecn(struct red_sched_data *q)
Linus Torvalds1da177e2005-04-16 15:20:36 -070050{
Thomas Graf6b31b282005-11-05 21:14:05 +010051 return q->flags & TC_RED_ECN;
Linus Torvalds1da177e2005-04-16 15:20:36 -070052}
53
Thomas Grafbdc450a2005-11-05 21:14:28 +010054static inline int red_use_harddrop(struct red_sched_data *q)
55{
56 return q->flags & TC_RED_HARDDROP;
57}
58
Eric Dumazetcc7ec452011-01-19 19:26:56 +000059static int red_enqueue(struct sk_buff *skb, struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -070060{
61 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -080062 struct Qdisc *child = q->qdisc;
63 int ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -070064
Eric Dumazeteeca6682012-01-05 02:25:16 +000065 q->vars.qavg = red_calc_qavg(&q->parms,
66 &q->vars,
67 child->qstats.backlog);
Linus Torvalds1da177e2005-04-16 15:20:36 -070068
Eric Dumazeteeca6682012-01-05 02:25:16 +000069 if (red_is_idling(&q->vars))
70 red_end_of_idle_period(&q->vars);
Linus Torvalds1da177e2005-04-16 15:20:36 -070071
Eric Dumazeteeca6682012-01-05 02:25:16 +000072 switch (red_action(&q->parms, &q->vars, q->vars.qavg)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +000073 case RED_DONT_MARK:
74 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070075
Eric Dumazetcc7ec452011-01-19 19:26:56 +000076 case RED_PROB_MARK:
John Fastabend25331d62014-09-28 11:53:29 -070077 qdisc_qstats_overlimit(sch);
Eric Dumazetcc7ec452011-01-19 19:26:56 +000078 if (!red_use_ecn(q) || !INET_ECN_set_ce(skb)) {
79 q->stats.prob_drop++;
80 goto congestion_drop;
81 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070082
Eric Dumazetcc7ec452011-01-19 19:26:56 +000083 q->stats.prob_mark++;
84 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070085
Eric Dumazetcc7ec452011-01-19 19:26:56 +000086 case RED_HARD_MARK:
John Fastabend25331d62014-09-28 11:53:29 -070087 qdisc_qstats_overlimit(sch);
Eric Dumazetcc7ec452011-01-19 19:26:56 +000088 if (red_use_harddrop(q) || !red_use_ecn(q) ||
89 !INET_ECN_set_ce(skb)) {
90 q->stats.forced_drop++;
91 goto congestion_drop;
92 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070093
Eric Dumazetcc7ec452011-01-19 19:26:56 +000094 q->stats.forced_mark++;
95 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070096 }
97
Jussi Kivilinna5f861732008-07-20 00:08:04 -070098 ret = qdisc_enqueue(skb, child);
Patrick McHardyf38c39d2006-03-20 19:20:44 -080099 if (likely(ret == NET_XMIT_SUCCESS)) {
WANG Congd7f4f332016-06-01 16:15:18 -0700100 qdisc_qstats_backlog_inc(sch, skb);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800101 sch->q.qlen++;
Jarek Poplawski378a2f02008-08-04 22:31:03 -0700102 } else if (net_xmit_drop_count(ret)) {
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800103 q->stats.pdrop++;
John Fastabend25331d62014-09-28 11:53:29 -0700104 qdisc_qstats_drop(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800105 }
106 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700107
Thomas Graf6b31b282005-11-05 21:14:05 +0100108congestion_drop:
Thomas Graf9e178ff2005-11-05 21:14:06 +0100109 qdisc_drop(skb, sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700110 return NET_XMIT_CN;
111}
112
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000113static struct sk_buff *red_dequeue(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114{
115 struct sk_buff *skb;
116 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800117 struct Qdisc *child = q->qdisc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700118
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800119 skb = child->dequeue(child);
Eric Dumazet9190b3b2011-01-20 23:31:33 -0800120 if (skb) {
121 qdisc_bstats_update(sch, skb);
WANG Congd7f4f332016-06-01 16:15:18 -0700122 qdisc_qstats_backlog_dec(sch, skb);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800123 sch->q.qlen--;
Eric Dumazet9190b3b2011-01-20 23:31:33 -0800124 } else {
Eric Dumazeteeca6682012-01-05 02:25:16 +0000125 if (!red_is_idling(&q->vars))
126 red_start_of_idle_period(&q->vars);
Eric Dumazet9190b3b2011-01-20 23:31:33 -0800127 }
Thomas Graf9e178ff2005-11-05 21:14:06 +0100128 return skb;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700129}
130
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000131static struct sk_buff *red_peek(struct Qdisc *sch)
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700132{
133 struct red_sched_data *q = qdisc_priv(sch);
134 struct Qdisc *child = q->qdisc;
135
136 return child->ops->peek(child);
137}
138
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000139static void red_reset(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700140{
141 struct red_sched_data *q = qdisc_priv(sch);
142
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800143 qdisc_reset(q->qdisc);
WANG Congd7f4f332016-06-01 16:15:18 -0700144 sch->qstats.backlog = 0;
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800145 sch->q.qlen = 0;
Eric Dumazeteeca6682012-01-05 02:25:16 +0000146 red_restart(&q->vars);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700147}
148
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800149static void red_destroy(struct Qdisc *sch)
150{
151 struct red_sched_data *q = qdisc_priv(sch);
Eric Dumazet8af2a212011-12-08 06:06:03 +0000152
153 del_timer_sync(&q->adapt_timer);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800154 qdisc_destroy(q->qdisc);
155}
156
Patrick McHardy27a34212008-01-23 20:35:39 -0800157static const struct nla_policy red_policy[TCA_RED_MAX + 1] = {
158 [TCA_RED_PARMS] = { .len = sizeof(struct tc_red_qopt) },
159 [TCA_RED_STAB] = { .len = RED_STAB_SIZE },
Eric Dumazeta73ed262011-12-09 02:46:45 +0000160 [TCA_RED_MAX_P] = { .type = NLA_U32 },
Patrick McHardy27a34212008-01-23 20:35:39 -0800161};
162
Patrick McHardy1e904742008-01-22 22:11:17 -0800163static int red_change(struct Qdisc *sch, struct nlattr *opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700164{
165 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardy1e904742008-01-22 22:11:17 -0800166 struct nlattr *tb[TCA_RED_MAX + 1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167 struct tc_red_qopt *ctl;
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800168 struct Qdisc *child = NULL;
Patrick McHardycee63722008-01-23 20:33:32 -0800169 int err;
Eric Dumazeta73ed262011-12-09 02:46:45 +0000170 u32 max_P;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700171
Patrick McHardycee63722008-01-23 20:33:32 -0800172 if (opt == NULL)
Thomas Grafdba051f2005-11-05 21:14:08 +0100173 return -EINVAL;
174
Patrick McHardy27a34212008-01-23 20:35:39 -0800175 err = nla_parse_nested(tb, TCA_RED_MAX, opt, red_policy);
Patrick McHardycee63722008-01-23 20:33:32 -0800176 if (err < 0)
177 return err;
178
Patrick McHardy1e904742008-01-22 22:11:17 -0800179 if (tb[TCA_RED_PARMS] == NULL ||
Patrick McHardy27a34212008-01-23 20:35:39 -0800180 tb[TCA_RED_STAB] == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700181 return -EINVAL;
182
Eric Dumazeta73ed262011-12-09 02:46:45 +0000183 max_P = tb[TCA_RED_MAX_P] ? nla_get_u32(tb[TCA_RED_MAX_P]) : 0;
184
Patrick McHardy1e904742008-01-22 22:11:17 -0800185 ctl = nla_data(tb[TCA_RED_PARMS]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700186
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800187 if (ctl->limit > 0) {
Patrick McHardyfb0305c2008-07-05 23:40:21 -0700188 child = fifo_create_dflt(sch, &bfifo_qdisc_ops, ctl->limit);
189 if (IS_ERR(child))
190 return PTR_ERR(child);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800191 }
192
Linus Torvalds1da177e2005-04-16 15:20:36 -0700193 sch_tree_lock(sch);
194 q->flags = ctl->flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700195 q->limit = ctl->limit;
Patrick McHardy5e50da02006-11-29 17:36:20 -0800196 if (child) {
WANG Cong2ccccf52016-02-25 14:55:01 -0800197 qdisc_tree_reduce_backlog(q->qdisc, q->qdisc->q.qlen,
198 q->qdisc->qstats.backlog);
Patrick McHardyb94c8af2008-11-20 04:11:36 -0800199 qdisc_destroy(q->qdisc);
200 q->qdisc = child;
Patrick McHardy5e50da02006-11-29 17:36:20 -0800201 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700202
Eric Dumazeteeca6682012-01-05 02:25:16 +0000203 red_set_parms(&q->parms,
204 ctl->qth_min, ctl->qth_max, ctl->Wlog,
Eric Dumazeta73ed262011-12-09 02:46:45 +0000205 ctl->Plog, ctl->Scell_log,
206 nla_data(tb[TCA_RED_STAB]),
207 max_P);
Eric Dumazeteeca6682012-01-05 02:25:16 +0000208 red_set_vars(&q->vars);
Thomas Graf6b31b282005-11-05 21:14:05 +0100209
Eric Dumazet8af2a212011-12-08 06:06:03 +0000210 del_timer(&q->adapt_timer);
211 if (ctl->flags & TC_RED_ADAPTATIVE)
212 mod_timer(&q->adapt_timer, jiffies + HZ/2);
213
Eric Dumazet1ee5fa12011-12-01 11:06:34 +0000214 if (!q->qdisc->q.qlen)
Eric Dumazeteeca6682012-01-05 02:25:16 +0000215 red_start_of_idle_period(&q->vars);
Thomas Grafdba051f2005-11-05 21:14:08 +0100216
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217 sch_tree_unlock(sch);
218 return 0;
219}
220
Eric Dumazet8af2a212011-12-08 06:06:03 +0000221static inline void red_adaptative_timer(unsigned long arg)
222{
223 struct Qdisc *sch = (struct Qdisc *)arg;
224 struct red_sched_data *q = qdisc_priv(sch);
225 spinlock_t *root_lock = qdisc_lock(qdisc_root_sleeping(sch));
226
227 spin_lock(root_lock);
Eric Dumazeteeca6682012-01-05 02:25:16 +0000228 red_adaptative_algo(&q->parms, &q->vars);
Eric Dumazet8af2a212011-12-08 06:06:03 +0000229 mod_timer(&q->adapt_timer, jiffies + HZ/2);
230 spin_unlock(root_lock);
231}
232
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000233static int red_init(struct Qdisc *sch, struct nlattr *opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700234{
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800235 struct red_sched_data *q = qdisc_priv(sch);
236
237 q->qdisc = &noop_qdisc;
Eric Dumazet8af2a212011-12-08 06:06:03 +0000238 setup_timer(&q->adapt_timer, red_adaptative_timer, (unsigned long)sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700239 return red_change(sch, opt);
240}
241
242static int red_dump(struct Qdisc *sch, struct sk_buff *skb)
243{
244 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardy1e904742008-01-22 22:11:17 -0800245 struct nlattr *opts = NULL;
Thomas Graf6b31b282005-11-05 21:14:05 +0100246 struct tc_red_qopt opt = {
247 .limit = q->limit,
248 .flags = q->flags,
249 .qth_min = q->parms.qth_min >> q->parms.Wlog,
250 .qth_max = q->parms.qth_max >> q->parms.Wlog,
251 .Wlog = q->parms.Wlog,
252 .Plog = q->parms.Plog,
253 .Scell_log = q->parms.Scell_log,
254 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255
Eric Dumazet0dfb33a2011-01-03 08:11:38 +0000256 sch->qstats.backlog = q->qdisc->qstats.backlog;
Patrick McHardy1e904742008-01-22 22:11:17 -0800257 opts = nla_nest_start(skb, TCA_OPTIONS);
258 if (opts == NULL)
259 goto nla_put_failure;
David S. Miller1b34ec42012-03-29 05:11:39 -0400260 if (nla_put(skb, TCA_RED_PARMS, sizeof(opt), &opt) ||
261 nla_put_u32(skb, TCA_RED_MAX_P, q->parms.max_P))
262 goto nla_put_failure;
Patrick McHardy1e904742008-01-22 22:11:17 -0800263 return nla_nest_end(skb, opts);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700264
Patrick McHardy1e904742008-01-22 22:11:17 -0800265nla_put_failure:
Thomas Grafbc3ed282008-06-03 16:36:54 -0700266 nla_nest_cancel(skb, opts);
267 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268}
269
270static int red_dump_stats(struct Qdisc *sch, struct gnet_dump *d)
271{
272 struct red_sched_data *q = qdisc_priv(sch);
Thomas Graf6b31b282005-11-05 21:14:05 +0100273 struct tc_red_xstats st = {
274 .early = q->stats.prob_drop + q->stats.forced_drop,
275 .pdrop = q->stats.pdrop,
276 .other = q->stats.other,
277 .marked = q->stats.prob_mark + q->stats.forced_mark,
278 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700279
Thomas Graf6b31b282005-11-05 21:14:05 +0100280 return gnet_stats_copy_app(d, &st, sizeof(st));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700281}
282
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800283static int red_dump_class(struct Qdisc *sch, unsigned long cl,
284 struct sk_buff *skb, struct tcmsg *tcm)
285{
286 struct red_sched_data *q = qdisc_priv(sch);
287
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800288 tcm->tcm_handle |= TC_H_MIN(1);
289 tcm->tcm_info = q->qdisc->handle;
290 return 0;
291}
292
293static int red_graft(struct Qdisc *sch, unsigned long arg, struct Qdisc *new,
294 struct Qdisc **old)
295{
296 struct red_sched_data *q = qdisc_priv(sch);
297
298 if (new == NULL)
299 new = &noop_qdisc;
300
WANG Cong86a79962016-02-25 14:55:00 -0800301 *old = qdisc_replace(sch, new, &q->qdisc);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800302 return 0;
303}
304
305static struct Qdisc *red_leaf(struct Qdisc *sch, unsigned long arg)
306{
307 struct red_sched_data *q = qdisc_priv(sch);
308 return q->qdisc;
309}
310
311static unsigned long red_get(struct Qdisc *sch, u32 classid)
312{
313 return 1;
314}
315
/* Counterpart of red_get(); intentionally does nothing. */
static void red_put(struct Qdisc *sch, unsigned long arg)
{
}
319
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800320static void red_walk(struct Qdisc *sch, struct qdisc_walker *walker)
321{
322 if (!walker->stop) {
323 if (walker->count >= walker->skip)
324 if (walker->fn(sch, 1, walker) < 0) {
325 walker->stop = 1;
326 return;
327 }
328 walker->count++;
329 }
330}
331
Eric Dumazet20fea082007-11-14 01:44:41 -0800332static const struct Qdisc_class_ops red_class_ops = {
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800333 .graft = red_graft,
334 .leaf = red_leaf,
335 .get = red_get,
336 .put = red_put,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800337 .walk = red_walk,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800338 .dump = red_dump_class,
339};
340
Eric Dumazet20fea082007-11-14 01:44:41 -0800341static struct Qdisc_ops red_qdisc_ops __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700342 .id = "red",
343 .priv_size = sizeof(struct red_sched_data),
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800344 .cl_ops = &red_class_ops,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700345 .enqueue = red_enqueue,
346 .dequeue = red_dequeue,
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700347 .peek = red_peek,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700348 .init = red_init,
349 .reset = red_reset,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800350 .destroy = red_destroy,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351 .change = red_change,
352 .dump = red_dump,
353 .dump_stats = red_dump_stats,
354 .owner = THIS_MODULE,
355};
356
357static int __init red_module_init(void)
358{
359 return register_qdisc(&red_qdisc_ops);
360}
Thomas Grafdba051f2005-11-05 21:14:08 +0100361
362static void __exit red_module_exit(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363{
364 unregister_qdisc(&red_qdisc_ops);
365}
Thomas Grafdba051f2005-11-05 21:14:08 +0100366
Linus Torvalds1da177e2005-04-16 15:20:36 -0700367module_init(red_module_init)
368module_exit(red_module_exit)
Thomas Grafdba051f2005-11-05 21:14:08 +0100369
Linus Torvalds1da177e2005-04-16 15:20:36 -0700370MODULE_LICENSE("GPL");