blob: 80105109f756315d7a31d6734887941c9f16ea9c [file] [log] [blame]
/*
 * net/sched/sch_gred.c	Generic Random Early Detection queue.
 *
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 *
 * Authors:    J Hadi Salim (hadi@cyberus.ca) 1998-2002
 *
 *             991129: -  Bug fix with grio mode
 *		       - a better sing. AvgQ mode with Grio(WRED)
 *		       - A finer grained VQ dequeue based on suggestion
 *		         from Ren Liu
 *		       - More error checks
 *
 *  For all the glorious comments look at include/net/red.h
 */
20
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090021#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070022#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070023#include <linux/types.h>
24#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070025#include <linux/skbuff.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070026#include <net/pkt_sched.h>
Thomas Graf22b33422005-11-05 21:14:16 +010027#include <net/red.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070028
/* Priority used for a virtual queue when the request does not supply one. */
#define GRED_DEF_PRIO (MAX_DPs / 2)
/*
 * Mask applied to skb->tc_index to obtain the virtual queue (DP) number.
 * NOTE(review): only a contiguous bit mask if MAX_DPs is a power of two.
 */
#define GRED_VQ_MASK (MAX_DPs - 1)
Thomas Graff62d6b92005-11-05 21:14:15 +010031
Linus Torvalds1da177e2005-04-16 15:20:36 -070032struct gred_sched_data;
33struct gred_sched;
34
Eric Dumazetcc7ec452011-01-19 19:26:56 +000035struct gred_sched_data {
Linus Torvalds1da177e2005-04-16 15:20:36 -070036 u32 limit; /* HARD maximal queue length */
Eric Dumazeta73ed262011-12-09 02:46:45 +000037 u32 DP; /* the drop parameters */
Linus Torvalds1da177e2005-04-16 15:20:36 -070038 u32 bytesin; /* bytes seen on virtualQ so far*/
39 u32 packetsin; /* packets seen on virtualQ so far*/
40 u32 backlog; /* bytes on the virtualQ */
Thomas Graf1e4dfaf92005-11-05 21:14:25 +010041 u8 prio; /* the prio of this vq */
Linus Torvalds1da177e2005-04-16 15:20:36 -070042
Thomas Graf22b33422005-11-05 21:14:16 +010043 struct red_parms parms;
Eric Dumazeteeca6682012-01-05 02:25:16 +000044 struct red_vars vars;
Thomas Graf22b33422005-11-05 21:14:16 +010045 struct red_stats stats;
Linus Torvalds1da177e2005-04-16 15:20:36 -070046};
47
/* Bit numbers used in gred_sched.flags. */
enum {
	GRED_WRED_MODE = 1,
	GRED_RIO_MODE,
};
52
Eric Dumazetcc7ec452011-01-19 19:26:56 +000053struct gred_sched {
Linus Torvalds1da177e2005-04-16 15:20:36 -070054 struct gred_sched_data *tab[MAX_DPs];
Thomas Grafdea3f622005-11-05 21:14:09 +010055 unsigned long flags;
Thomas Grafb38c7ee2005-11-05 21:14:27 +010056 u32 red_flags;
Thomas Graf1e4dfaf92005-11-05 21:14:25 +010057 u32 DPs;
58 u32 def;
Eric Dumazeteeca6682012-01-05 02:25:16 +000059 struct red_vars wred_set;
Linus Torvalds1da177e2005-04-16 15:20:36 -070060};
61
Thomas Grafdea3f622005-11-05 21:14:09 +010062static inline int gred_wred_mode(struct gred_sched *table)
63{
64 return test_bit(GRED_WRED_MODE, &table->flags);
65}
66
67static inline void gred_enable_wred_mode(struct gred_sched *table)
68{
69 __set_bit(GRED_WRED_MODE, &table->flags);
70}
71
72static inline void gred_disable_wred_mode(struct gred_sched *table)
73{
74 __clear_bit(GRED_WRED_MODE, &table->flags);
75}
76
Thomas Grafd6fd4e92005-11-05 21:14:10 +010077static inline int gred_rio_mode(struct gred_sched *table)
78{
79 return test_bit(GRED_RIO_MODE, &table->flags);
80}
81
82static inline void gred_enable_rio_mode(struct gred_sched *table)
83{
84 __set_bit(GRED_RIO_MODE, &table->flags);
85}
86
87static inline void gred_disable_rio_mode(struct gred_sched *table)
88{
89 __clear_bit(GRED_RIO_MODE, &table->flags);
90}
91
Thomas Grafdea3f622005-11-05 21:14:09 +010092static inline int gred_wred_mode_check(struct Qdisc *sch)
93{
94 struct gred_sched *table = qdisc_priv(sch);
95 int i;
96
97 /* Really ugly O(n^2) but shouldn't be necessary too frequent. */
98 for (i = 0; i < table->DPs; i++) {
99 struct gred_sched_data *q = table->tab[i];
100 int n;
101
102 if (q == NULL)
103 continue;
104
David Wardc22e4642012-09-13 05:22:33 +0000105 for (n = i + 1; n < table->DPs; n++)
106 if (table->tab[n] && table->tab[n]->prio == q->prio)
Thomas Grafdea3f622005-11-05 21:14:09 +0100107 return 1;
108 }
109
110 return 0;
111}
112
Thomas Graf22b33422005-11-05 21:14:16 +0100113static inline unsigned int gred_backlog(struct gred_sched *table,
114 struct gred_sched_data *q,
115 struct Qdisc *sch)
116{
117 if (gred_wred_mode(table))
118 return sch->qstats.backlog;
119 else
120 return q->backlog;
121}
122
Thomas Graf716a1b42005-11-05 21:14:20 +0100123static inline u16 tc_index_to_dp(struct sk_buff *skb)
124{
125 return skb->tc_index & GRED_VQ_MASK;
126}
127
Eric Dumazeteeca6682012-01-05 02:25:16 +0000128static inline void gred_load_wred_set(const struct gred_sched *table,
Thomas Graf70517032005-11-05 21:14:23 +0100129 struct gred_sched_data *q)
130{
Eric Dumazeteeca6682012-01-05 02:25:16 +0000131 q->vars.qavg = table->wred_set.qavg;
132 q->vars.qidlestart = table->wred_set.qidlestart;
Thomas Graf70517032005-11-05 21:14:23 +0100133}
134
135static inline void gred_store_wred_set(struct gred_sched *table,
136 struct gred_sched_data *q)
137{
Eric Dumazeteeca6682012-01-05 02:25:16 +0000138 table->wred_set.qavg = q->vars.qavg;
David Wardba1bf472012-09-13 05:22:35 +0000139 table->wred_set.qidlestart = q->vars.qidlestart;
Thomas Graf70517032005-11-05 21:14:23 +0100140}
141
Thomas Grafb38c7ee2005-11-05 21:14:27 +0100142static inline int gred_use_ecn(struct gred_sched *t)
143{
144 return t->red_flags & TC_RED_ECN;
145}
146
Thomas Grafbdc450a2005-11-05 21:14:28 +0100147static inline int gred_use_harddrop(struct gred_sched *t)
148{
149 return t->red_flags & TC_RED_HARDDROP;
150}
151
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000152static int gred_enqueue(struct sk_buff *skb, struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153{
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000154 struct gred_sched_data *q = NULL;
155 struct gred_sched *t = qdisc_priv(sch);
Thomas Graf22b33422005-11-05 21:14:16 +0100156 unsigned long qavg = 0;
Thomas Graf4a591832005-11-05 21:14:22 +0100157 u16 dp = tc_index_to_dp(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700158
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000159 if (dp >= t->DPs || (q = t->tab[dp]) == NULL) {
Thomas Graf18e3fb842005-11-05 21:14:21 +0100160 dp = t->def;
161
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000162 q = t->tab[dp];
163 if (!q) {
Thomas Graf18e3fb842005-11-05 21:14:21 +0100164 /* Pass through packets not assigned to a DP
165 * if no default DP has been configured. This
166 * allows for DP flows to be left untouched.
167 */
David Warda3eb95f2015-05-09 22:01:46 -0400168 if (likely(sch->qstats.backlog + qdisc_pkt_len(skb) <=
169 sch->limit))
Thomas Graf18e3fb842005-11-05 21:14:21 +0100170 return qdisc_enqueue_tail(skb, sch);
171 else
172 goto drop;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700173 }
Thomas Graf18e3fb842005-11-05 21:14:21 +0100174
Eric Dumazeteeca6682012-01-05 02:25:16 +0000175 /* fix tc_index? --could be controversial but needed for
Linus Torvalds1da177e2005-04-16 15:20:36 -0700176 requeueing */
Thomas Graf18e3fb842005-11-05 21:14:21 +0100177 skb->tc_index = (skb->tc_index & ~GRED_VQ_MASK) | dp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700178 }
179
David Warde29fe832012-09-13 05:22:32 +0000180 /* sum up all the qaves of prios < ours to get the new qave */
Thomas Grafd6fd4e92005-11-05 21:14:10 +0100181 if (!gred_wred_mode(t) && gred_rio_mode(t)) {
Thomas Graf1e4dfaf92005-11-05 21:14:25 +0100182 int i;
183
184 for (i = 0; i < t->DPs; i++) {
185 if (t->tab[i] && t->tab[i]->prio < q->prio &&
Eric Dumazeteeca6682012-01-05 02:25:16 +0000186 !red_is_idling(&t->tab[i]->vars))
187 qavg += t->tab[i]->vars.qavg;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700188 }
Thomas Graf1e4dfaf92005-11-05 21:14:25 +0100189
Linus Torvalds1da177e2005-04-16 15:20:36 -0700190 }
191
192 q->packetsin++;
Jussi Kivilinna0abf77e2008-07-20 00:08:27 -0700193 q->bytesin += qdisc_pkt_len(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700194
Thomas Graf1e4dfaf92005-11-05 21:14:25 +0100195 if (gred_wred_mode(t))
Thomas Graf70517032005-11-05 21:14:23 +0100196 gred_load_wred_set(t, q);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700197
Eric Dumazeteeca6682012-01-05 02:25:16 +0000198 q->vars.qavg = red_calc_qavg(&q->parms,
199 &q->vars,
200 gred_backlog(t, q, sch));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700201
Eric Dumazeteeca6682012-01-05 02:25:16 +0000202 if (red_is_idling(&q->vars))
203 red_end_of_idle_period(&q->vars);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700204
Thomas Grafdea3f622005-11-05 21:14:09 +0100205 if (gred_wred_mode(t))
Thomas Graf70517032005-11-05 21:14:23 +0100206 gred_store_wred_set(t, q);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700207
Eric Dumazeteeca6682012-01-05 02:25:16 +0000208 switch (red_action(&q->parms, &q->vars, q->vars.qavg + qavg)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000209 case RED_DONT_MARK:
210 break;
Thomas Graf22b33422005-11-05 21:14:16 +0100211
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000212 case RED_PROB_MARK:
John Fastabend25331d62014-09-28 11:53:29 -0700213 qdisc_qstats_overlimit(sch);
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000214 if (!gred_use_ecn(t) || !INET_ECN_set_ce(skb)) {
215 q->stats.prob_drop++;
216 goto congestion_drop;
217 }
Thomas Grafb38c7ee2005-11-05 21:14:27 +0100218
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000219 q->stats.prob_mark++;
220 break;
Thomas Graf22b33422005-11-05 21:14:16 +0100221
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000222 case RED_HARD_MARK:
John Fastabend25331d62014-09-28 11:53:29 -0700223 qdisc_qstats_overlimit(sch);
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000224 if (gred_use_harddrop(t) || !gred_use_ecn(t) ||
225 !INET_ECN_set_ce(skb)) {
226 q->stats.forced_drop++;
227 goto congestion_drop;
228 }
229 q->stats.forced_mark++;
230 break;
Thomas Graf22b33422005-11-05 21:14:16 +0100231 }
232
David Ward145a42b2015-05-09 22:01:47 -0400233 if (gred_backlog(t, q, sch) + qdisc_pkt_len(skb) <= q->limit) {
Jussi Kivilinna0abf77e2008-07-20 00:08:27 -0700234 q->backlog += qdisc_pkt_len(skb);
Thomas Grafedf7a7b2005-11-05 21:14:19 +0100235 return qdisc_enqueue_tail(skb, sch);
Thomas Graf22b33422005-11-05 21:14:16 +0100236 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700237
Thomas Graf22b33422005-11-05 21:14:16 +0100238 q->stats.pdrop++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700239drop:
Thomas Grafedf7a7b2005-11-05 21:14:19 +0100240 return qdisc_drop(skb, sch);
Thomas Grafc3b553c2005-11-05 21:14:18 +0100241
242congestion_drop:
Thomas Grafedf7a7b2005-11-05 21:14:19 +0100243 qdisc_drop(skb, sch);
Thomas Grafc3b553c2005-11-05 21:14:18 +0100244 return NET_XMIT_CN;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245}
246
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000247static struct sk_buff *gred_dequeue(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248{
249 struct sk_buff *skb;
Thomas Graf1e4dfaf92005-11-05 21:14:25 +0100250 struct gred_sched *t = qdisc_priv(sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251
Thomas Grafedf7a7b2005-11-05 21:14:19 +0100252 skb = qdisc_dequeue_head(sch);
253
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254 if (skb) {
Thomas Graf1e4dfaf92005-11-05 21:14:25 +0100255 struct gred_sched_data *q;
Thomas Graf18e3fb842005-11-05 21:14:21 +0100256 u16 dp = tc_index_to_dp(skb);
257
258 if (dp >= t->DPs || (q = t->tab[dp]) == NULL) {
Joe Perchese87cc472012-05-13 21:56:26 +0000259 net_warn_ratelimited("GRED: Unable to relocate VQ 0x%x after dequeue, screwing up backlog\n",
260 tc_index_to_dp(skb));
Thomas Graf18e3fb842005-11-05 21:14:21 +0100261 } else {
Jussi Kivilinna0abf77e2008-07-20 00:08:27 -0700262 q->backlog -= qdisc_pkt_len(skb);
Thomas Graf18e3fb842005-11-05 21:14:21 +0100263
David Wardba1bf472012-09-13 05:22:35 +0000264 if (gred_wred_mode(t)) {
265 if (!sch->qstats.backlog)
266 red_start_of_idle_period(&t->wred_set);
267 } else {
268 if (!q->backlog)
269 red_start_of_idle_period(&q->vars);
270 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700271 }
Thomas Graf18e3fb842005-11-05 21:14:21 +0100272
Linus Torvalds1da177e2005-04-16 15:20:36 -0700273 return skb;
274 }
275
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276 return NULL;
277}
278
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000279static unsigned int gred_drop(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700280{
281 struct sk_buff *skb;
Thomas Graf1e4dfaf92005-11-05 21:14:25 +0100282 struct gred_sched *t = qdisc_priv(sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700283
Thomas Grafedf7a7b2005-11-05 21:14:19 +0100284 skb = qdisc_dequeue_tail(sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700285 if (skb) {
Jussi Kivilinna0abf77e2008-07-20 00:08:27 -0700286 unsigned int len = qdisc_pkt_len(skb);
Thomas Graf1e4dfaf92005-11-05 21:14:25 +0100287 struct gred_sched_data *q;
Thomas Graf18e3fb842005-11-05 21:14:21 +0100288 u16 dp = tc_index_to_dp(skb);
289
290 if (dp >= t->DPs || (q = t->tab[dp]) == NULL) {
Joe Perchese87cc472012-05-13 21:56:26 +0000291 net_warn_ratelimited("GRED: Unable to relocate VQ 0x%x while dropping, screwing up backlog\n",
292 tc_index_to_dp(skb));
Thomas Graf18e3fb842005-11-05 21:14:21 +0100293 } else {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294 q->backlog -= len;
Thomas Graf22b33422005-11-05 21:14:16 +0100295 q->stats.other++;
Thomas Graf18e3fb842005-11-05 21:14:21 +0100296
David Wardba1bf472012-09-13 05:22:35 +0000297 if (gred_wred_mode(t)) {
298 if (!sch->qstats.backlog)
299 red_start_of_idle_period(&t->wred_set);
300 } else {
301 if (!q->backlog)
302 red_start_of_idle_period(&q->vars);
303 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700304 }
305
Thomas Grafedf7a7b2005-11-05 21:14:19 +0100306 qdisc_drop(skb, sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700307 return len;
308 }
309
Linus Torvalds1da177e2005-04-16 15:20:36 -0700310 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700311}
312
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000313static void gred_reset(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700314{
315 int i;
Thomas Graf1e4dfaf92005-11-05 21:14:25 +0100316 struct gred_sched *t = qdisc_priv(sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700317
Thomas Grafedf7a7b2005-11-05 21:14:19 +0100318 qdisc_reset_queue(sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700319
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900320 for (i = 0; i < t->DPs; i++) {
Thomas Graf1e4dfaf92005-11-05 21:14:25 +0100321 struct gred_sched_data *q = t->tab[i];
322
323 if (!q)
324 continue;
325
Eric Dumazeteeca6682012-01-05 02:25:16 +0000326 red_restart(&q->vars);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700327 q->backlog = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700328 }
329}
330
/* Release the memory of one virtual queue. */
static inline void gred_destroy_vq(struct gred_sched_data *q)
{
	kfree(q);
}
335
Patrick McHardy1e904742008-01-22 22:11:17 -0800336static inline int gred_change_table_def(struct Qdisc *sch, struct nlattr *dps)
Thomas Graf66396072005-11-05 21:14:13 +0100337{
338 struct gred_sched *table = qdisc_priv(sch);
339 struct tc_gred_sopt *sopt;
340 int i;
341
Patrick McHardy27a34212008-01-23 20:35:39 -0800342 if (dps == NULL)
Thomas Graf66396072005-11-05 21:14:13 +0100343 return -EINVAL;
344
Patrick McHardy1e904742008-01-22 22:11:17 -0800345 sopt = nla_data(dps);
Thomas Graf66396072005-11-05 21:14:13 +0100346
347 if (sopt->DPs > MAX_DPs || sopt->DPs == 0 || sopt->def_DP >= sopt->DPs)
348 return -EINVAL;
349
350 sch_tree_lock(sch);
351 table->DPs = sopt->DPs;
352 table->def = sopt->def_DP;
Thomas Grafb38c7ee2005-11-05 21:14:27 +0100353 table->red_flags = sopt->flags;
Thomas Graf66396072005-11-05 21:14:13 +0100354
355 /*
356 * Every entry point to GRED is synchronized with the above code
357 * and the DP is checked against DPs, i.e. shadowed VQs can no
358 * longer be found so we can unlock right here.
359 */
360 sch_tree_unlock(sch);
361
362 if (sopt->grio) {
363 gred_enable_rio_mode(table);
364 gred_disable_wred_mode(table);
365 if (gred_wred_mode_check(sch))
366 gred_enable_wred_mode(table);
367 } else {
368 gred_disable_rio_mode(table);
369 gred_disable_wred_mode(table);
370 }
371
372 for (i = table->DPs; i < MAX_DPs; i++) {
373 if (table->tab[i]) {
Yang Yingliangc17988a2013-12-23 17:38:58 +0800374 pr_warn("GRED: Warning: Destroying shadowed VQ 0x%x\n",
375 i);
Thomas Graf66396072005-11-05 21:14:13 +0100376 gred_destroy_vq(table->tab[i]);
377 table->tab[i] = NULL;
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900378 }
Thomas Graf66396072005-11-05 21:14:13 +0100379 }
380
Thomas Graf66396072005-11-05 21:14:13 +0100381 return 0;
382}
383
Thomas Graff62d6b92005-11-05 21:14:15 +0100384static inline int gred_change_vq(struct Qdisc *sch, int dp,
Eric Dumazeta73ed262011-12-09 02:46:45 +0000385 struct tc_gred_qopt *ctl, int prio,
Eric Dumazet869aa412011-12-15 22:09:45 +0000386 u8 *stab, u32 max_P,
387 struct gred_sched_data **prealloc)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700388{
389 struct gred_sched *table = qdisc_priv(sch);
Eric Dumazet869aa412011-12-15 22:09:45 +0000390 struct gred_sched_data *q = table->tab[dp];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700391
Eric Dumazet869aa412011-12-15 22:09:45 +0000392 if (!q) {
393 table->tab[dp] = q = *prealloc;
394 *prealloc = NULL;
395 if (!q)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700396 return -ENOMEM;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700397 }
398
Thomas Graff62d6b92005-11-05 21:14:15 +0100399 q->DP = dp;
400 q->prio = prio;
David Warda3eb95f2015-05-09 22:01:46 -0400401 if (ctl->limit > sch->limit)
402 q->limit = sch->limit;
403 else
404 q->limit = ctl->limit;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700405
Thomas Graf22b33422005-11-05 21:14:16 +0100406 if (q->backlog == 0)
Eric Dumazeteeca6682012-01-05 02:25:16 +0000407 red_end_of_idle_period(&q->vars);
Thomas Graf22b33422005-11-05 21:14:16 +0100408
409 red_set_parms(&q->parms,
410 ctl->qth_min, ctl->qth_max, ctl->Wlog, ctl->Plog,
Eric Dumazeta73ed262011-12-09 02:46:45 +0000411 ctl->Scell_log, stab, max_P);
Eric Dumazeteeca6682012-01-05 02:25:16 +0000412 red_set_vars(&q->vars);
Thomas Graff62d6b92005-11-05 21:14:15 +0100413 return 0;
414}
415
Patrick McHardy27a34212008-01-23 20:35:39 -0800416static const struct nla_policy gred_policy[TCA_GRED_MAX + 1] = {
417 [TCA_GRED_PARMS] = { .len = sizeof(struct tc_gred_qopt) },
418 [TCA_GRED_STAB] = { .len = 256 },
419 [TCA_GRED_DPS] = { .len = sizeof(struct tc_gred_sopt) },
Eric Dumazeta73ed262011-12-09 02:46:45 +0000420 [TCA_GRED_MAX_P] = { .type = NLA_U32 },
David Warda3eb95f2015-05-09 22:01:46 -0400421 [TCA_GRED_LIMIT] = { .type = NLA_U32 },
Patrick McHardy27a34212008-01-23 20:35:39 -0800422};
423
Patrick McHardy1e904742008-01-22 22:11:17 -0800424static int gred_change(struct Qdisc *sch, struct nlattr *opt)
Thomas Graff62d6b92005-11-05 21:14:15 +0100425{
426 struct gred_sched *table = qdisc_priv(sch);
427 struct tc_gred_qopt *ctl;
Patrick McHardy1e904742008-01-22 22:11:17 -0800428 struct nlattr *tb[TCA_GRED_MAX + 1];
Patrick McHardycee63722008-01-23 20:33:32 -0800429 int err, prio = GRED_DEF_PRIO;
Thomas Graff62d6b92005-11-05 21:14:15 +0100430 u8 *stab;
Eric Dumazeta73ed262011-12-09 02:46:45 +0000431 u32 max_P;
Eric Dumazet869aa412011-12-15 22:09:45 +0000432 struct gred_sched_data *prealloc;
Thomas Graff62d6b92005-11-05 21:14:15 +0100433
Patrick McHardycee63722008-01-23 20:33:32 -0800434 if (opt == NULL)
Thomas Graff62d6b92005-11-05 21:14:15 +0100435 return -EINVAL;
436
Patrick McHardy27a34212008-01-23 20:35:39 -0800437 err = nla_parse_nested(tb, TCA_GRED_MAX, opt, gred_policy);
Patrick McHardycee63722008-01-23 20:33:32 -0800438 if (err < 0)
439 return err;
440
David Warda3eb95f2015-05-09 22:01:46 -0400441 if (tb[TCA_GRED_PARMS] == NULL && tb[TCA_GRED_STAB] == NULL) {
442 if (tb[TCA_GRED_LIMIT] != NULL)
443 sch->limit = nla_get_u32(tb[TCA_GRED_LIMIT]);
Thomas Graff62d6b92005-11-05 21:14:15 +0100444 return gred_change_table_def(sch, opt);
David Warda3eb95f2015-05-09 22:01:46 -0400445 }
Thomas Graff62d6b92005-11-05 21:14:15 +0100446
Patrick McHardy1e904742008-01-22 22:11:17 -0800447 if (tb[TCA_GRED_PARMS] == NULL ||
David Warda3eb95f2015-05-09 22:01:46 -0400448 tb[TCA_GRED_STAB] == NULL ||
449 tb[TCA_GRED_LIMIT] != NULL)
Thomas Graff62d6b92005-11-05 21:14:15 +0100450 return -EINVAL;
451
Eric Dumazeta73ed262011-12-09 02:46:45 +0000452 max_P = tb[TCA_GRED_MAX_P] ? nla_get_u32(tb[TCA_GRED_MAX_P]) : 0;
453
Patrick McHardycee63722008-01-23 20:33:32 -0800454 err = -EINVAL;
Patrick McHardy1e904742008-01-22 22:11:17 -0800455 ctl = nla_data(tb[TCA_GRED_PARMS]);
456 stab = nla_data(tb[TCA_GRED_STAB]);
Thomas Graff62d6b92005-11-05 21:14:15 +0100457
458 if (ctl->DP >= table->DPs)
459 goto errout;
460
461 if (gred_rio_mode(table)) {
462 if (ctl->prio == 0) {
463 int def_prio = GRED_DEF_PRIO;
464
465 if (table->tab[table->def])
466 def_prio = table->tab[table->def]->prio;
467
468 printk(KERN_DEBUG "GRED: DP %u does not have a prio "
469 "setting default to %d\n", ctl->DP, def_prio);
470
471 prio = def_prio;
472 } else
473 prio = ctl->prio;
474 }
475
Eric Dumazet869aa412011-12-15 22:09:45 +0000476 prealloc = kzalloc(sizeof(*prealloc), GFP_KERNEL);
Thomas Graff62d6b92005-11-05 21:14:15 +0100477 sch_tree_lock(sch);
478
Eric Dumazet869aa412011-12-15 22:09:45 +0000479 err = gred_change_vq(sch, ctl->DP, ctl, prio, stab, max_P, &prealloc);
Thomas Graff62d6b92005-11-05 21:14:15 +0100480 if (err < 0)
481 goto errout_locked;
482
Thomas Grafd6fd4e92005-11-05 21:14:10 +0100483 if (gred_rio_mode(table)) {
Thomas Grafdea3f622005-11-05 21:14:09 +0100484 gred_disable_wred_mode(table);
485 if (gred_wred_mode_check(sch))
486 gred_enable_wred_mode(table);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700487 }
488
Thomas Graff62d6b92005-11-05 21:14:15 +0100489 err = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490
Thomas Graff62d6b92005-11-05 21:14:15 +0100491errout_locked:
492 sch_tree_unlock(sch);
Eric Dumazet869aa412011-12-15 22:09:45 +0000493 kfree(prealloc);
Thomas Graff62d6b92005-11-05 21:14:15 +0100494errout:
495 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700496}
497
Patrick McHardy1e904742008-01-22 22:11:17 -0800498static int gred_init(struct Qdisc *sch, struct nlattr *opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700499{
Patrick McHardy1e904742008-01-22 22:11:17 -0800500 struct nlattr *tb[TCA_GRED_MAX + 1];
Patrick McHardycee63722008-01-23 20:33:32 -0800501 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700502
Patrick McHardycee63722008-01-23 20:33:32 -0800503 if (opt == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700504 return -EINVAL;
505
Patrick McHardy27a34212008-01-23 20:35:39 -0800506 err = nla_parse_nested(tb, TCA_GRED_MAX, opt, gred_policy);
Patrick McHardycee63722008-01-23 20:33:32 -0800507 if (err < 0)
508 return err;
509
Patrick McHardy1e904742008-01-22 22:11:17 -0800510 if (tb[TCA_GRED_PARMS] || tb[TCA_GRED_STAB])
Thomas Graf66396072005-11-05 21:14:13 +0100511 return -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700512
David Warda3eb95f2015-05-09 22:01:46 -0400513 if (tb[TCA_GRED_LIMIT])
514 sch->limit = nla_get_u32(tb[TCA_GRED_LIMIT]);
Phil Sutter348e3432015-08-18 10:30:49 +0200515 else
516 sch->limit = qdisc_dev(sch)->tx_queue_len
517 * psched_mtu(qdisc_dev(sch));
David Warda3eb95f2015-05-09 22:01:46 -0400518
Patrick McHardy1e904742008-01-22 22:11:17 -0800519 return gred_change_table_def(sch, tb[TCA_GRED_DPS]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700520}
521
522static int gred_dump(struct Qdisc *sch, struct sk_buff *skb)
523{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700524 struct gred_sched *table = qdisc_priv(sch);
Patrick McHardy1e904742008-01-22 22:11:17 -0800525 struct nlattr *parms, *opts = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700526 int i;
Eric Dumazeta73ed262011-12-09 02:46:45 +0000527 u32 max_p[MAX_DPs];
Thomas Grafe0636822005-11-05 21:14:12 +0100528 struct tc_gred_sopt sopt = {
529 .DPs = table->DPs,
530 .def_DP = table->def,
531 .grio = gred_rio_mode(table),
Thomas Grafb38c7ee2005-11-05 21:14:27 +0100532 .flags = table->red_flags,
Thomas Grafe0636822005-11-05 21:14:12 +0100533 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700534
Patrick McHardy1e904742008-01-22 22:11:17 -0800535 opts = nla_nest_start(skb, TCA_OPTIONS);
536 if (opts == NULL)
537 goto nla_put_failure;
David S. Miller1b34ec42012-03-29 05:11:39 -0400538 if (nla_put(skb, TCA_GRED_DPS, sizeof(sopt), &sopt))
539 goto nla_put_failure;
Eric Dumazeta73ed262011-12-09 02:46:45 +0000540
541 for (i = 0; i < MAX_DPs; i++) {
542 struct gred_sched_data *q = table->tab[i];
543
544 max_p[i] = q ? q->parms.max_P : 0;
545 }
David S. Miller1b34ec42012-03-29 05:11:39 -0400546 if (nla_put(skb, TCA_GRED_MAX_P, sizeof(max_p), max_p))
547 goto nla_put_failure;
Eric Dumazeta73ed262011-12-09 02:46:45 +0000548
David Warda3eb95f2015-05-09 22:01:46 -0400549 if (nla_put_u32(skb, TCA_GRED_LIMIT, sch->limit))
550 goto nla_put_failure;
551
Patrick McHardy1e904742008-01-22 22:11:17 -0800552 parms = nla_nest_start(skb, TCA_GRED_PARMS);
553 if (parms == NULL)
554 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700555
Thomas Graf05f1cc02005-11-05 21:14:11 +0100556 for (i = 0; i < MAX_DPs; i++) {
557 struct gred_sched_data *q = table->tab[i];
558 struct tc_gred_qopt opt;
David Ward1fe37b12012-09-13 05:22:34 +0000559 unsigned long qavg;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700560
Thomas Graf05f1cc02005-11-05 21:14:11 +0100561 memset(&opt, 0, sizeof(opt));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700562
563 if (!q) {
564 /* hack -- fix at some point with proper message
565 This is how we indicate to tc that there is no VQ
566 at this DP */
567
Thomas Graf05f1cc02005-11-05 21:14:11 +0100568 opt.DP = MAX_DPs + i;
569 goto append_opt;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700570 }
571
Thomas Graf05f1cc02005-11-05 21:14:11 +0100572 opt.limit = q->limit;
573 opt.DP = q->DP;
David Ward145a42b2015-05-09 22:01:47 -0400574 opt.backlog = gred_backlog(table, q, sch);
Thomas Graf05f1cc02005-11-05 21:14:11 +0100575 opt.prio = q->prio;
Thomas Graf22b33422005-11-05 21:14:16 +0100576 opt.qth_min = q->parms.qth_min >> q->parms.Wlog;
577 opt.qth_max = q->parms.qth_max >> q->parms.Wlog;
578 opt.Wlog = q->parms.Wlog;
579 opt.Plog = q->parms.Plog;
580 opt.Scell_log = q->parms.Scell_log;
581 opt.other = q->stats.other;
582 opt.early = q->stats.prob_drop;
583 opt.forced = q->stats.forced_drop;
584 opt.pdrop = q->stats.pdrop;
Thomas Graf05f1cc02005-11-05 21:14:11 +0100585 opt.packets = q->packetsin;
586 opt.bytesin = q->bytesin;
587
David Ward244b65d2012-04-15 12:31:45 +0000588 if (gred_wred_mode(table))
589 gred_load_wred_set(table, q);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700590
David Ward1fe37b12012-09-13 05:22:34 +0000591 qavg = red_calc_qavg(&q->parms, &q->vars,
592 q->vars.qavg >> q->parms.Wlog);
593 opt.qave = qavg >> q->parms.Wlog;
Thomas Graf22b33422005-11-05 21:14:16 +0100594
Thomas Graf05f1cc02005-11-05 21:14:11 +0100595append_opt:
Patrick McHardy1e904742008-01-22 22:11:17 -0800596 if (nla_append(skb, sizeof(opt), &opt) < 0)
597 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700598 }
599
Patrick McHardy1e904742008-01-22 22:11:17 -0800600 nla_nest_end(skb, parms);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700601
Patrick McHardy1e904742008-01-22 22:11:17 -0800602 return nla_nest_end(skb, opts);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700603
Patrick McHardy1e904742008-01-22 22:11:17 -0800604nla_put_failure:
Thomas Grafbc3ed282008-06-03 16:36:54 -0700605 nla_nest_cancel(skb, opts);
606 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700607}
608
609static void gred_destroy(struct Qdisc *sch)
610{
611 struct gred_sched *table = qdisc_priv(sch);
612 int i;
613
Thomas Graf1e4dfaf92005-11-05 21:14:25 +0100614 for (i = 0; i < table->DPs; i++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700615 if (table->tab[i])
Thomas Graf66396072005-11-05 21:14:13 +0100616 gred_destroy_vq(table->tab[i]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700617 }
618}
619
Eric Dumazet20fea082007-11-14 01:44:41 -0800620static struct Qdisc_ops gred_qdisc_ops __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700621 .id = "gred",
622 .priv_size = sizeof(struct gred_sched),
623 .enqueue = gred_enqueue,
624 .dequeue = gred_dequeue,
Jarek Poplawski8e3af972008-10-31 00:45:55 -0700625 .peek = qdisc_peek_head,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700626 .drop = gred_drop,
627 .init = gred_init,
628 .reset = gred_reset,
629 .destroy = gred_destroy,
630 .change = gred_change,
631 .dump = gred_dump,
632 .owner = THIS_MODULE,
633};
634
635static int __init gred_module_init(void)
636{
637 return register_qdisc(&gred_qdisc_ops);
638}
Thomas Graf1e4dfaf92005-11-05 21:14:25 +0100639
640static void __exit gred_module_exit(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700641{
642 unregister_qdisc(&gred_qdisc_ops);
643}
Thomas Graf1e4dfaf92005-11-05 21:14:25 +0100644
Linus Torvalds1da177e2005-04-16 15:20:36 -0700645module_init(gred_module_init)
646module_exit(gred_module_exit)
Thomas Graf1e4dfaf92005-11-05 21:14:25 +0100647
Linus Torvalds1da177e2005-04-16 15:20:36 -0700648MODULE_LICENSE("GPL");