blob: ce2256a17d7e1e8aa509a24f914ea69d404dce7c [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * net/sched/sch_red.c Random Early Detection queue.
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version
7 * 2 of the License, or (at your option) any later version.
8 *
9 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
10 *
11 * Changes:
Thomas Grafdba051f2005-11-05 21:14:08 +010012 * J Hadi Salim 980914: computation fixes
Linus Torvalds1da177e2005-04-16 15:20:36 -070013 * Alexey Makarenko <makar@phoenix.kharkov.ua> 990814: qave on idle link was calculated incorrectly.
Thomas Grafdba051f2005-11-05 21:14:08 +010014 * J Hadi Salim 980816: ECN support
Linus Torvalds1da177e2005-04-16 15:20:36 -070015 */
16
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/types.h>
19#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <linux/skbuff.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <net/pkt_sched.h>
22#include <net/inet_ecn.h>
Thomas Graf6b31b282005-11-05 21:14:05 +010023#include <net/red.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070024
25
Thomas Graf6b31b282005-11-05 21:14:05 +010026/* Parameters, settable by user:
Linus Torvalds1da177e2005-04-16 15:20:36 -070027 -----------------------------
28
29 limit - bytes (must be > qth_max + burst)
30
31 Hard limit on queue length, should be chosen >qth_max
32 to allow packet bursts. This parameter does not
33 affect the algorithms behaviour and can be chosen
34 arbitrarily high (well, less than ram size)
35 Really, this limit will never be reached
36 if RED works correctly.
Linus Torvalds1da177e2005-04-16 15:20:36 -070037 */
38
Eric Dumazetcc7ec452011-01-19 19:26:56 +000039struct red_sched_data {
Thomas Graf6b31b282005-11-05 21:14:05 +010040 u32 limit; /* HARD maximal queue length */
41 unsigned char flags;
Eric Dumazet8af2a212011-12-08 06:06:03 +000042 struct timer_list adapt_timer;
Thomas Graf6b31b282005-11-05 21:14:05 +010043 struct red_parms parms;
44 struct red_stats stats;
Patrick McHardyf38c39d2006-03-20 19:20:44 -080045 struct Qdisc *qdisc;
Linus Torvalds1da177e2005-04-16 15:20:36 -070046};
47
Thomas Graf6b31b282005-11-05 21:14:05 +010048static inline int red_use_ecn(struct red_sched_data *q)
Linus Torvalds1da177e2005-04-16 15:20:36 -070049{
Thomas Graf6b31b282005-11-05 21:14:05 +010050 return q->flags & TC_RED_ECN;
Linus Torvalds1da177e2005-04-16 15:20:36 -070051}
52
Thomas Grafbdc450a2005-11-05 21:14:28 +010053static inline int red_use_harddrop(struct red_sched_data *q)
54{
55 return q->flags & TC_RED_HARDDROP;
56}
57
Eric Dumazetcc7ec452011-01-19 19:26:56 +000058static int red_enqueue(struct sk_buff *skb, struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -070059{
60 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -080061 struct Qdisc *child = q->qdisc;
62 int ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -070063
Patrick McHardyf38c39d2006-03-20 19:20:44 -080064 q->parms.qavg = red_calc_qavg(&q->parms, child->qstats.backlog);
Linus Torvalds1da177e2005-04-16 15:20:36 -070065
Thomas Graf6b31b282005-11-05 21:14:05 +010066 if (red_is_idling(&q->parms))
67 red_end_of_idle_period(&q->parms);
Linus Torvalds1da177e2005-04-16 15:20:36 -070068
Thomas Graf6b31b282005-11-05 21:14:05 +010069 switch (red_action(&q->parms, q->parms.qavg)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +000070 case RED_DONT_MARK:
71 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070072
Eric Dumazetcc7ec452011-01-19 19:26:56 +000073 case RED_PROB_MARK:
74 sch->qstats.overlimits++;
75 if (!red_use_ecn(q) || !INET_ECN_set_ce(skb)) {
76 q->stats.prob_drop++;
77 goto congestion_drop;
78 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070079
Eric Dumazetcc7ec452011-01-19 19:26:56 +000080 q->stats.prob_mark++;
81 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070082
Eric Dumazetcc7ec452011-01-19 19:26:56 +000083 case RED_HARD_MARK:
84 sch->qstats.overlimits++;
85 if (red_use_harddrop(q) || !red_use_ecn(q) ||
86 !INET_ECN_set_ce(skb)) {
87 q->stats.forced_drop++;
88 goto congestion_drop;
89 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070090
Eric Dumazetcc7ec452011-01-19 19:26:56 +000091 q->stats.forced_mark++;
92 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -070093 }
94
Jussi Kivilinna5f861732008-07-20 00:08:04 -070095 ret = qdisc_enqueue(skb, child);
Patrick McHardyf38c39d2006-03-20 19:20:44 -080096 if (likely(ret == NET_XMIT_SUCCESS)) {
Patrick McHardyf38c39d2006-03-20 19:20:44 -080097 sch->q.qlen++;
Jarek Poplawski378a2f02008-08-04 22:31:03 -070098 } else if (net_xmit_drop_count(ret)) {
Patrick McHardyf38c39d2006-03-20 19:20:44 -080099 q->stats.pdrop++;
100 sch->qstats.drops++;
101 }
102 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700103
Thomas Graf6b31b282005-11-05 21:14:05 +0100104congestion_drop:
Thomas Graf9e178ff2005-11-05 21:14:06 +0100105 qdisc_drop(skb, sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700106 return NET_XMIT_CN;
107}
108
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000109static struct sk_buff *red_dequeue(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700110{
111 struct sk_buff *skb;
112 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800113 struct Qdisc *child = q->qdisc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800115 skb = child->dequeue(child);
Eric Dumazet9190b3b2011-01-20 23:31:33 -0800116 if (skb) {
117 qdisc_bstats_update(sch, skb);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800118 sch->q.qlen--;
Eric Dumazet9190b3b2011-01-20 23:31:33 -0800119 } else {
120 if (!red_is_idling(&q->parms))
121 red_start_of_idle_period(&q->parms);
122 }
Thomas Graf9e178ff2005-11-05 21:14:06 +0100123 return skb;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700124}
125
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000126static struct sk_buff *red_peek(struct Qdisc *sch)
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700127{
128 struct red_sched_data *q = qdisc_priv(sch);
129 struct Qdisc *child = q->qdisc;
130
131 return child->ops->peek(child);
132}
133
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000134static unsigned int red_drop(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700135{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700136 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800137 struct Qdisc *child = q->qdisc;
138 unsigned int len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700139
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800140 if (child->ops->drop && (len = child->ops->drop(child)) > 0) {
Thomas Graf6b31b282005-11-05 21:14:05 +0100141 q->stats.other++;
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800142 sch->qstats.drops++;
143 sch->q.qlen--;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700144 return len;
145 }
Thomas Graf6b31b282005-11-05 21:14:05 +0100146
Thomas Graf6a1b63d2005-11-05 21:14:07 +0100147 if (!red_is_idling(&q->parms))
148 red_start_of_idle_period(&q->parms);
149
Linus Torvalds1da177e2005-04-16 15:20:36 -0700150 return 0;
151}
152
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000153static void red_reset(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700154{
155 struct red_sched_data *q = qdisc_priv(sch);
156
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800157 qdisc_reset(q->qdisc);
158 sch->q.qlen = 0;
Thomas Graf6b31b282005-11-05 21:14:05 +0100159 red_restart(&q->parms);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700160}
161
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800162static void red_destroy(struct Qdisc *sch)
163{
164 struct red_sched_data *q = qdisc_priv(sch);
Eric Dumazet8af2a212011-12-08 06:06:03 +0000165
166 del_timer_sync(&q->adapt_timer);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800167 qdisc_destroy(q->qdisc);
168}
169
Patrick McHardy27a34212008-01-23 20:35:39 -0800170static const struct nla_policy red_policy[TCA_RED_MAX + 1] = {
171 [TCA_RED_PARMS] = { .len = sizeof(struct tc_red_qopt) },
172 [TCA_RED_STAB] = { .len = RED_STAB_SIZE },
Eric Dumazeta73ed262011-12-09 02:46:45 +0000173 [TCA_RED_MAX_P] = { .type = NLA_U32 },
Patrick McHardy27a34212008-01-23 20:35:39 -0800174};
175
Patrick McHardy1e904742008-01-22 22:11:17 -0800176static int red_change(struct Qdisc *sch, struct nlattr *opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700177{
178 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardy1e904742008-01-22 22:11:17 -0800179 struct nlattr *tb[TCA_RED_MAX + 1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180 struct tc_red_qopt *ctl;
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800181 struct Qdisc *child = NULL;
Patrick McHardycee63722008-01-23 20:33:32 -0800182 int err;
Eric Dumazeta73ed262011-12-09 02:46:45 +0000183 u32 max_P;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700184
Patrick McHardycee63722008-01-23 20:33:32 -0800185 if (opt == NULL)
Thomas Grafdba051f2005-11-05 21:14:08 +0100186 return -EINVAL;
187
Patrick McHardy27a34212008-01-23 20:35:39 -0800188 err = nla_parse_nested(tb, TCA_RED_MAX, opt, red_policy);
Patrick McHardycee63722008-01-23 20:33:32 -0800189 if (err < 0)
190 return err;
191
Patrick McHardy1e904742008-01-22 22:11:17 -0800192 if (tb[TCA_RED_PARMS] == NULL ||
Patrick McHardy27a34212008-01-23 20:35:39 -0800193 tb[TCA_RED_STAB] == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700194 return -EINVAL;
195
Eric Dumazeta73ed262011-12-09 02:46:45 +0000196 max_P = tb[TCA_RED_MAX_P] ? nla_get_u32(tb[TCA_RED_MAX_P]) : 0;
197
Patrick McHardy1e904742008-01-22 22:11:17 -0800198 ctl = nla_data(tb[TCA_RED_PARMS]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700199
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800200 if (ctl->limit > 0) {
Patrick McHardyfb0305c2008-07-05 23:40:21 -0700201 child = fifo_create_dflt(sch, &bfifo_qdisc_ops, ctl->limit);
202 if (IS_ERR(child))
203 return PTR_ERR(child);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800204 }
205
Linus Torvalds1da177e2005-04-16 15:20:36 -0700206 sch_tree_lock(sch);
207 q->flags = ctl->flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700208 q->limit = ctl->limit;
Patrick McHardy5e50da02006-11-29 17:36:20 -0800209 if (child) {
210 qdisc_tree_decrease_qlen(q->qdisc, q->qdisc->q.qlen);
Patrick McHardyb94c8af2008-11-20 04:11:36 -0800211 qdisc_destroy(q->qdisc);
212 q->qdisc = child;
Patrick McHardy5e50da02006-11-29 17:36:20 -0800213 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700214
Thomas Graf6b31b282005-11-05 21:14:05 +0100215 red_set_parms(&q->parms, ctl->qth_min, ctl->qth_max, ctl->Wlog,
Eric Dumazeta73ed262011-12-09 02:46:45 +0000216 ctl->Plog, ctl->Scell_log,
217 nla_data(tb[TCA_RED_STAB]),
218 max_P);
Thomas Graf6b31b282005-11-05 21:14:05 +0100219
Eric Dumazet8af2a212011-12-08 06:06:03 +0000220 del_timer(&q->adapt_timer);
221 if (ctl->flags & TC_RED_ADAPTATIVE)
222 mod_timer(&q->adapt_timer, jiffies + HZ/2);
223
Eric Dumazet1ee5fa12011-12-01 11:06:34 +0000224 if (!q->qdisc->q.qlen)
225 red_start_of_idle_period(&q->parms);
Thomas Grafdba051f2005-11-05 21:14:08 +0100226
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227 sch_tree_unlock(sch);
228 return 0;
229}
230
Eric Dumazet8af2a212011-12-08 06:06:03 +0000231static inline void red_adaptative_timer(unsigned long arg)
232{
233 struct Qdisc *sch = (struct Qdisc *)arg;
234 struct red_sched_data *q = qdisc_priv(sch);
235 spinlock_t *root_lock = qdisc_lock(qdisc_root_sleeping(sch));
236
237 spin_lock(root_lock);
238 red_adaptative_algo(&q->parms);
239 mod_timer(&q->adapt_timer, jiffies + HZ/2);
240 spin_unlock(root_lock);
241}
242
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000243static int red_init(struct Qdisc *sch, struct nlattr *opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700244{
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800245 struct red_sched_data *q = qdisc_priv(sch);
246
247 q->qdisc = &noop_qdisc;
Eric Dumazet8af2a212011-12-08 06:06:03 +0000248 setup_timer(&q->adapt_timer, red_adaptative_timer, (unsigned long)sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700249 return red_change(sch, opt);
250}
251
252static int red_dump(struct Qdisc *sch, struct sk_buff *skb)
253{
254 struct red_sched_data *q = qdisc_priv(sch);
Patrick McHardy1e904742008-01-22 22:11:17 -0800255 struct nlattr *opts = NULL;
Thomas Graf6b31b282005-11-05 21:14:05 +0100256 struct tc_red_qopt opt = {
257 .limit = q->limit,
258 .flags = q->flags,
259 .qth_min = q->parms.qth_min >> q->parms.Wlog,
260 .qth_max = q->parms.qth_max >> q->parms.Wlog,
261 .Wlog = q->parms.Wlog,
262 .Plog = q->parms.Plog,
263 .Scell_log = q->parms.Scell_log,
264 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700265
Eric Dumazet0dfb33a2011-01-03 08:11:38 +0000266 sch->qstats.backlog = q->qdisc->qstats.backlog;
Patrick McHardy1e904742008-01-22 22:11:17 -0800267 opts = nla_nest_start(skb, TCA_OPTIONS);
268 if (opts == NULL)
269 goto nla_put_failure;
270 NLA_PUT(skb, TCA_RED_PARMS, sizeof(opt), &opt);
Eric Dumazet8af2a212011-12-08 06:06:03 +0000271 NLA_PUT_U32(skb, TCA_RED_MAX_P, q->parms.max_P);
Patrick McHardy1e904742008-01-22 22:11:17 -0800272 return nla_nest_end(skb, opts);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700273
Patrick McHardy1e904742008-01-22 22:11:17 -0800274nla_put_failure:
Thomas Grafbc3ed282008-06-03 16:36:54 -0700275 nla_nest_cancel(skb, opts);
276 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700277}
278
279static int red_dump_stats(struct Qdisc *sch, struct gnet_dump *d)
280{
281 struct red_sched_data *q = qdisc_priv(sch);
Thomas Graf6b31b282005-11-05 21:14:05 +0100282 struct tc_red_xstats st = {
283 .early = q->stats.prob_drop + q->stats.forced_drop,
284 .pdrop = q->stats.pdrop,
285 .other = q->stats.other,
286 .marked = q->stats.prob_mark + q->stats.forced_mark,
287 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288
Thomas Graf6b31b282005-11-05 21:14:05 +0100289 return gnet_stats_copy_app(d, &st, sizeof(st));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700290}
291
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800292static int red_dump_class(struct Qdisc *sch, unsigned long cl,
293 struct sk_buff *skb, struct tcmsg *tcm)
294{
295 struct red_sched_data *q = qdisc_priv(sch);
296
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800297 tcm->tcm_handle |= TC_H_MIN(1);
298 tcm->tcm_info = q->qdisc->handle;
299 return 0;
300}
301
302static int red_graft(struct Qdisc *sch, unsigned long arg, struct Qdisc *new,
303 struct Qdisc **old)
304{
305 struct red_sched_data *q = qdisc_priv(sch);
306
307 if (new == NULL)
308 new = &noop_qdisc;
309
310 sch_tree_lock(sch);
Patrick McHardyb94c8af2008-11-20 04:11:36 -0800311 *old = q->qdisc;
312 q->qdisc = new;
Patrick McHardy5e50da02006-11-29 17:36:20 -0800313 qdisc_tree_decrease_qlen(*old, (*old)->q.qlen);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800314 qdisc_reset(*old);
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800315 sch_tree_unlock(sch);
316 return 0;
317}
318
319static struct Qdisc *red_leaf(struct Qdisc *sch, unsigned long arg)
320{
321 struct red_sched_data *q = qdisc_priv(sch);
322 return q->qdisc;
323}
324
325static unsigned long red_get(struct Qdisc *sch, u32 classid)
326{
327 return 1;
328}
329
330static void red_put(struct Qdisc *sch, unsigned long arg)
331{
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800332}
333
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800334static void red_walk(struct Qdisc *sch, struct qdisc_walker *walker)
335{
336 if (!walker->stop) {
337 if (walker->count >= walker->skip)
338 if (walker->fn(sch, 1, walker) < 0) {
339 walker->stop = 1;
340 return;
341 }
342 walker->count++;
343 }
344}
345
Eric Dumazet20fea082007-11-14 01:44:41 -0800346static const struct Qdisc_class_ops red_class_ops = {
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800347 .graft = red_graft,
348 .leaf = red_leaf,
349 .get = red_get,
350 .put = red_put,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800351 .walk = red_walk,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800352 .dump = red_dump_class,
353};
354
Eric Dumazet20fea082007-11-14 01:44:41 -0800355static struct Qdisc_ops red_qdisc_ops __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700356 .id = "red",
357 .priv_size = sizeof(struct red_sched_data),
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800358 .cl_ops = &red_class_ops,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700359 .enqueue = red_enqueue,
360 .dequeue = red_dequeue,
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700361 .peek = red_peek,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700362 .drop = red_drop,
363 .init = red_init,
364 .reset = red_reset,
Patrick McHardyf38c39d2006-03-20 19:20:44 -0800365 .destroy = red_destroy,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700366 .change = red_change,
367 .dump = red_dump,
368 .dump_stats = red_dump_stats,
369 .owner = THIS_MODULE,
370};
371
372static int __init red_module_init(void)
373{
374 return register_qdisc(&red_qdisc_ops);
375}
Thomas Grafdba051f2005-11-05 21:14:08 +0100376
377static void __exit red_module_exit(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700378{
379 unregister_qdisc(&red_qdisc_ops);
380}
Thomas Grafdba051f2005-11-05 21:14:08 +0100381
Linus Torvalds1da177e2005-04-16 15:20:36 -0700382module_init(red_module_init)
383module_exit(red_module_exit)
Thomas Grafdba051f2005-11-05 21:14:08 +0100384
Linus Torvalds1da177e2005-04-16 15:20:36 -0700385MODULE_LICENSE("GPL");