blob: 8f5a85bf9d109b72dd3689a03080c25954a6dd5e [file] [log] [blame]
/*
 * net/sched/sch_red.c	Random Early Detection queue.
 *
 *		This program is free software; you can redistribute it and/or
 *		modify it under the terms of the GNU General Public License
 *		as published by the Free Software Foundation; either version
 *		2 of the License, or (at your option) any later version.
 *
 * Authors:	Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 *
 * Changes:
 * J Hadi Salim 980914:	computation fixes
 * Alexey Makarenko <makar@phoenix.kharkov.ua> 990814: qave on idle link was calculated incorrectly.
 * J Hadi Salim 980816:  ECN support
 */
16
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/types.h>
19#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <linux/skbuff.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <net/pkt_sched.h>
22#include <net/inet_ecn.h>
Thomas Graf6b31b282005-11-05 21:14:05 +010023#include <net/red.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070024
25
/*	Parameters, settable by user:
	-----------------------------

	limit		- bytes (must be > qth_max + burst)

	Hard limit on queue length, should be chosen >qth_max
	to allow packet bursts. This parameter does not
	affect the algorithm's behaviour and can be chosen
	arbitrarily high (well, less than ram size)
	Really, this limit will never be reached
	if RED works correctly.
 */
38
Eric Dumazetcc7ec452011-01-19 19:26:56 +000039struct red_sched_data {
Thomas Graf6b31b282005-11-05 21:14:05 +010040 u32 limit; /* HARD maximal queue length */
41 unsigned char flags;
Eric Dumazet8af2a212011-12-08 06:06:03 +000042 struct timer_list adapt_timer;
Thomas Graf6b31b282005-11-05 21:14:05 +010043 struct red_parms parms;
44 struct red_stats stats;
Patrick McHardyf38c39d2006-03-20 19:20:44 -080045 struct Qdisc *qdisc;
Linus Torvalds1da177e2005-04-16 15:20:36 -070046};
47
Thomas Graf6b31b282005-11-05 21:14:05 +010048static inline int red_use_ecn(struct red_sched_data *q)
Linus Torvalds1da177e2005-04-16 15:20:36 -070049{
Thomas Graf6b31b282005-11-05 21:14:05 +010050 return q->flags & TC_RED_ECN;
Linus Torvalds1da177e2005-04-16 15:20:36 -070051}
52
Thomas Grafbdc450a2005-11-05 21:14:28 +010053static inline int red_use_harddrop(struct red_sched_data *q)
54{
55 return q->flags & TC_RED_HARDDROP;
56}
57
Eric Dumazetcc7ec452011-01-19 19:26:56 +000058static int red_enqueue(struct sk_buff *skb, struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -070059{
60 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -080061 struct Qdisc *child = q->qdisc;
62 int ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -070063
Patrick McHardyf38c39d2006-03-20 19:20:44 -080064 q->parms.qavg = red_calc_qavg(&q->parms, child->qstats.backlog);
Linus Torvalds1da177e2005-04-16 15:20:36 -070065
Thomas Graf6b31b282005-11-05 21:14:05 +010066 if (red_is_idling(&q->parms))
67 red_end_of_idle_period(&q->parms);
Linus Torvalds1da177e2005-04-16 15:20:36 -070068
Thomas Graf6b31b282005-11-05 21:14:05 +010069 switch (red_action(&q->parms, q->parms.qavg)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +000070 case RED_DONT_MARK:
71 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070072
Eric Dumazetcc7ec452011-01-19 19:26:56 +000073 case RED_PROB_MARK:
74 sch->qstats.overlimits++;
75 if (!red_use_ecn(q) || !INET_ECN_set_ce(skb)) {
76 q->stats.prob_drop++;
77 goto congestion_drop;
78 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070079
Eric Dumazetcc7ec452011-01-19 19:26:56 +000080 q->stats.prob_mark++;
81 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070082
Eric Dumazetcc7ec452011-01-19 19:26:56 +000083 case RED_HARD_MARK:
84 sch->qstats.overlimits++;
85 if (red_use_harddrop(q) || !red_use_ecn(q) ||
86 !INET_ECN_set_ce(skb)) {
87 q->stats.forced_drop++;
88 goto congestion_drop;
89 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070090
Eric Dumazetcc7ec452011-01-19 19:26:56 +000091 q->stats.forced_mark++;
92 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070093 }
94
Jussi Kivilinna5f861732008-07-20 00:08:04 -070095 ret = qdisc_enqueue(skb, child);
Patrick McHardyf38c39d2006-03-20 19:20:44 -080096 if (likely(ret == NET_XMIT_SUCCESS)) {
Patrick McHardyf38c39d2006-03-20 19:20:44 -080097 sch->q.qlen++;
Jarek Poplawski378a2f02008-08-04 22:31:03 -070098 } else if (net_xmit_drop_count(ret)) {
Patrick McHardyf38c39d2006-03-20 19:20:44 -080099 q->stats.pdrop++;
100 sch->qstats.drops++;
101 }
102 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700103
Thomas Graf6b31b282005-11-05 21:14:05 +0100104congestion_drop:
Thomas Graf9e178ff2005-11-05 21:14:06 +0100105 qdisc_drop(skb, sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700106 return NET_XMIT_CN;
107}
108
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000109static struct sk_buff *red_dequeue(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700110{
111 struct sk_buff *skb;
112 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800113 struct Qdisc *child = q->qdisc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800115 skb = child->dequeue(child);
Eric Dumazet9190b3b2011-01-20 23:31:33 -0800116 if (skb) {
117 qdisc_bstats_update(sch, skb);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800118 sch->q.qlen--;
Eric Dumazet9190b3b2011-01-20 23:31:33 -0800119 } else {
120 if (!red_is_idling(&q->parms))
121 red_start_of_idle_period(&q->parms);
122 }
Thomas Graf9e178ff2005-11-05 21:14:06 +0100123 return skb;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700124}
125
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000126static struct sk_buff *red_peek(struct Qdisc *sch)
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700127{
128 struct red_sched_data *q = qdisc_priv(sch);
129 struct Qdisc *child = q->qdisc;
130
131 return child->ops->peek(child);
132}
133
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000134static unsigned int red_drop(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700135{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700136 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800137 struct Qdisc *child = q->qdisc;
138 unsigned int len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700139
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800140 if (child->ops->drop && (len = child->ops->drop(child)) > 0) {
Thomas Graf6b31b282005-11-05 21:14:05 +0100141 q->stats.other++;
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800142 sch->qstats.drops++;
143 sch->q.qlen--;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700144 return len;
145 }
Thomas Graf6b31b282005-11-05 21:14:05 +0100146
Thomas Graf6a1b63d2005-11-05 21:14:07 +0100147 if (!red_is_idling(&q->parms))
148 red_start_of_idle_period(&q->parms);
149
Linus Torvalds1da177e2005-04-16 15:20:36 -0700150 return 0;
151}
152
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000153static void red_reset(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700154{
155 struct red_sched_data *q = qdisc_priv(sch);
156
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800157 qdisc_reset(q->qdisc);
158 sch->q.qlen = 0;
Thomas Graf6b31b282005-11-05 21:14:05 +0100159 red_restart(&q->parms);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700160}
161
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800162static void red_destroy(struct Qdisc *sch)
163{
164 struct red_sched_data *q = qdisc_priv(sch);
Eric Dumazet8af2a212011-12-08 06:06:03 +0000165
166 del_timer_sync(&q->adapt_timer);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800167 qdisc_destroy(q->qdisc);
168}
169
Patrick McHardy27a34212008-01-23 20:35:39 -0800170static const struct nla_policy red_policy[TCA_RED_MAX + 1] = {
171 [TCA_RED_PARMS] = { .len = sizeof(struct tc_red_qopt) },
172 [TCA_RED_STAB] = { .len = RED_STAB_SIZE },
173};
174
Patrick McHardy1e904742008-01-22 22:11:17 -0800175static int red_change(struct Qdisc *sch, struct nlattr *opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700176{
177 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardy1e904742008-01-22 22:11:17 -0800178 struct nlattr *tb[TCA_RED_MAX + 1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179 struct tc_red_qopt *ctl;
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800180 struct Qdisc *child = NULL;
Patrick McHardycee63722008-01-23 20:33:32 -0800181 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700182
Patrick McHardycee63722008-01-23 20:33:32 -0800183 if (opt == NULL)
Thomas Grafdba051f2005-11-05 21:14:08 +0100184 return -EINVAL;
185
Patrick McHardy27a34212008-01-23 20:35:39 -0800186 err = nla_parse_nested(tb, TCA_RED_MAX, opt, red_policy);
Patrick McHardycee63722008-01-23 20:33:32 -0800187 if (err < 0)
188 return err;
189
Patrick McHardy1e904742008-01-22 22:11:17 -0800190 if (tb[TCA_RED_PARMS] == NULL ||
Patrick McHardy27a34212008-01-23 20:35:39 -0800191 tb[TCA_RED_STAB] == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700192 return -EINVAL;
193
Patrick McHardy1e904742008-01-22 22:11:17 -0800194 ctl = nla_data(tb[TCA_RED_PARMS]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700195
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800196 if (ctl->limit > 0) {
Patrick McHardyfb0305c2008-07-05 23:40:21 -0700197 child = fifo_create_dflt(sch, &bfifo_qdisc_ops, ctl->limit);
198 if (IS_ERR(child))
199 return PTR_ERR(child);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800200 }
201
Linus Torvalds1da177e2005-04-16 15:20:36 -0700202 sch_tree_lock(sch);
203 q->flags = ctl->flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700204 q->limit = ctl->limit;
Patrick McHardy5e50da02006-11-29 17:36:20 -0800205 if (child) {
206 qdisc_tree_decrease_qlen(q->qdisc, q->qdisc->q.qlen);
Patrick McHardyb94c8af2008-11-20 04:11:36 -0800207 qdisc_destroy(q->qdisc);
208 q->qdisc = child;
Patrick McHardy5e50da02006-11-29 17:36:20 -0800209 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210
Thomas Graf6b31b282005-11-05 21:14:05 +0100211 red_set_parms(&q->parms, ctl->qth_min, ctl->qth_max, ctl->Wlog,
212 ctl->Plog, ctl->Scell_log,
Patrick McHardy1e904742008-01-22 22:11:17 -0800213 nla_data(tb[TCA_RED_STAB]));
Thomas Graf6b31b282005-11-05 21:14:05 +0100214
Eric Dumazet8af2a212011-12-08 06:06:03 +0000215 del_timer(&q->adapt_timer);
216 if (ctl->flags & TC_RED_ADAPTATIVE)
217 mod_timer(&q->adapt_timer, jiffies + HZ/2);
218
Eric Dumazet1ee5fa12011-12-01 11:06:34 +0000219 if (!q->qdisc->q.qlen)
220 red_start_of_idle_period(&q->parms);
Thomas Grafdba051f2005-11-05 21:14:08 +0100221
Linus Torvalds1da177e2005-04-16 15:20:36 -0700222 sch_tree_unlock(sch);
223 return 0;
224}
225
Eric Dumazet8af2a212011-12-08 06:06:03 +0000226static inline void red_adaptative_timer(unsigned long arg)
227{
228 struct Qdisc *sch = (struct Qdisc *)arg;
229 struct red_sched_data *q = qdisc_priv(sch);
230 spinlock_t *root_lock = qdisc_lock(qdisc_root_sleeping(sch));
231
232 spin_lock(root_lock);
233 red_adaptative_algo(&q->parms);
234 mod_timer(&q->adapt_timer, jiffies + HZ/2);
235 spin_unlock(root_lock);
236}
237
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000238static int red_init(struct Qdisc *sch, struct nlattr *opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700239{
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800240 struct red_sched_data *q = qdisc_priv(sch);
241
242 q->qdisc = &noop_qdisc;
Eric Dumazet8af2a212011-12-08 06:06:03 +0000243 setup_timer(&q->adapt_timer, red_adaptative_timer, (unsigned long)sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700244 return red_change(sch, opt);
245}
246
247static int red_dump(struct Qdisc *sch, struct sk_buff *skb)
248{
249 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardy1e904742008-01-22 22:11:17 -0800250 struct nlattr *opts = NULL;
Thomas Graf6b31b282005-11-05 21:14:05 +0100251 struct tc_red_qopt opt = {
252 .limit = q->limit,
253 .flags = q->flags,
254 .qth_min = q->parms.qth_min >> q->parms.Wlog,
255 .qth_max = q->parms.qth_max >> q->parms.Wlog,
256 .Wlog = q->parms.Wlog,
257 .Plog = q->parms.Plog,
258 .Scell_log = q->parms.Scell_log,
259 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700260
Eric Dumazet0dfb33a2011-01-03 08:11:38 +0000261 sch->qstats.backlog = q->qdisc->qstats.backlog;
Patrick McHardy1e904742008-01-22 22:11:17 -0800262 opts = nla_nest_start(skb, TCA_OPTIONS);
263 if (opts == NULL)
264 goto nla_put_failure;
265 NLA_PUT(skb, TCA_RED_PARMS, sizeof(opt), &opt);
Eric Dumazet8af2a212011-12-08 06:06:03 +0000266 NLA_PUT_U32(skb, TCA_RED_MAX_P, q->parms.max_P);
Patrick McHardy1e904742008-01-22 22:11:17 -0800267 return nla_nest_end(skb, opts);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268
Patrick McHardy1e904742008-01-22 22:11:17 -0800269nla_put_failure:
Thomas Grafbc3ed282008-06-03 16:36:54 -0700270 nla_nest_cancel(skb, opts);
271 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272}
273
274static int red_dump_stats(struct Qdisc *sch, struct gnet_dump *d)
275{
276 struct red_sched_data *q = qdisc_priv(sch);
Thomas Graf6b31b282005-11-05 21:14:05 +0100277 struct tc_red_xstats st = {
278 .early = q->stats.prob_drop + q->stats.forced_drop,
279 .pdrop = q->stats.pdrop,
280 .other = q->stats.other,
281 .marked = q->stats.prob_mark + q->stats.forced_mark,
282 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700283
Thomas Graf6b31b282005-11-05 21:14:05 +0100284 return gnet_stats_copy_app(d, &st, sizeof(st));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700285}
286
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800287static int red_dump_class(struct Qdisc *sch, unsigned long cl,
288 struct sk_buff *skb, struct tcmsg *tcm)
289{
290 struct red_sched_data *q = qdisc_priv(sch);
291
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800292 tcm->tcm_handle |= TC_H_MIN(1);
293 tcm->tcm_info = q->qdisc->handle;
294 return 0;
295}
296
297static int red_graft(struct Qdisc *sch, unsigned long arg, struct Qdisc *new,
298 struct Qdisc **old)
299{
300 struct red_sched_data *q = qdisc_priv(sch);
301
302 if (new == NULL)
303 new = &noop_qdisc;
304
305 sch_tree_lock(sch);
Patrick McHardyb94c8af2008-11-20 04:11:36 -0800306 *old = q->qdisc;
307 q->qdisc = new;
Patrick McHardy5e50da02006-11-29 17:36:20 -0800308 qdisc_tree_decrease_qlen(*old, (*old)->q.qlen);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800309 qdisc_reset(*old);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800310 sch_tree_unlock(sch);
311 return 0;
312}
313
314static struct Qdisc *red_leaf(struct Qdisc *sch, unsigned long arg)
315{
316 struct red_sched_data *q = qdisc_priv(sch);
317 return q->qdisc;
318}
319
320static unsigned long red_get(struct Qdisc *sch, u32 classid)
321{
322 return 1;
323}
324
/* Class release: intentionally a no-op. */
static void red_put(struct Qdisc *sch, unsigned long arg)
{
	/* nothing to do */
}
328
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800329static void red_walk(struct Qdisc *sch, struct qdisc_walker *walker)
330{
331 if (!walker->stop) {
332 if (walker->count >= walker->skip)
333 if (walker->fn(sch, 1, walker) < 0) {
334 walker->stop = 1;
335 return;
336 }
337 walker->count++;
338 }
339}
340
Eric Dumazet20fea082007-11-14 01:44:41 -0800341static const struct Qdisc_class_ops red_class_ops = {
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800342 .graft = red_graft,
343 .leaf = red_leaf,
344 .get = red_get,
345 .put = red_put,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800346 .walk = red_walk,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800347 .dump = red_dump_class,
348};
349
Eric Dumazet20fea082007-11-14 01:44:41 -0800350static struct Qdisc_ops red_qdisc_ops __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351 .id = "red",
352 .priv_size = sizeof(struct red_sched_data),
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800353 .cl_ops = &red_class_ops,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700354 .enqueue = red_enqueue,
355 .dequeue = red_dequeue,
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700356 .peek = red_peek,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700357 .drop = red_drop,
358 .init = red_init,
359 .reset = red_reset,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800360 .destroy = red_destroy,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361 .change = red_change,
362 .dump = red_dump,
363 .dump_stats = red_dump_stats,
364 .owner = THIS_MODULE,
365};
366
367static int __init red_module_init(void)
368{
369 return register_qdisc(&red_qdisc_ops);
370}
Thomas Grafdba051f2005-11-05 21:14:08 +0100371
372static void __exit red_module_exit(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700373{
374 unregister_qdisc(&red_qdisc_ops);
375}
Thomas Grafdba051f2005-11-05 21:14:08 +0100376
Linus Torvalds1da177e2005-04-16 15:20:36 -0700377module_init(red_module_init)
378module_exit(red_module_exit)
Thomas Grafdba051f2005-11-05 21:14:08 +0100379
Linus Torvalds1da177e2005-04-16 15:20:36 -0700380MODULE_LICENSE("GPL");