blob: fcd06e29e8b3828f5d8f13dd8b220194e3b3bac8 [file] [log] [blame]
Stephen Hemminger87990462006-08-10 23:35:16 -07001/*
Linus Torvalds1da177e2005-04-16 15:20:36 -07002 * net/sched/sch_htb.c Hierarchical token bucket, feed tree version
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version
7 * 2 of the License, or (at your option) any later version.
8 *
9 * Authors: Martin Devera, <devik@cdi.cz>
10 *
11 * Credits (in time order) for older HTB versions:
12 * Stef Coene <stef.coene@docum.org>
13 * HTB support at LARTC mailing list
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +090014 * Ondrej Kraus, <krauso@barr.cz>
Linus Torvalds1da177e2005-04-16 15:20:36 -070015 * found missing INIT_QDISC(htb)
16 * Vladimir Smelhaus, Aamer Akhter, Bert Hubert
17 * helped a lot to locate nasty class stall bug
18 * Andi Kleen, Jamal Hadi, Bert Hubert
19 * code review and helpful comments on shaping
20 * Tomasz Wrona, <tw@eter.tym.pl>
21 * created test case so that I was able to fix nasty bug
22 * Wilfried Weissmann
23 * spotted bug in dequeue code and helped with fix
24 * Jiri Fojtasek
25 * fixed requeue routine
26 * and many others. thanks.
Linus Torvalds1da177e2005-04-16 15:20:36 -070027 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070028#include <linux/module.h>
Jesper Dangaard Brouer47083fc2008-06-16 16:39:32 -070029#include <linux/moduleparam.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070030#include <linux/types.h>
31#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#include <linux/string.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070033#include <linux/errno.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070034#include <linux/skbuff.h>
35#include <linux/list.h>
36#include <linux/compiler.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070037#include <linux/rbtree.h>
Patrick McHardy0ba48052007-07-02 22:49:07 -070038#include <net/netlink.h>
39#include <net/pkt_sched.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070040
41/* HTB algorithm.
42 Author: devik@cdi.cz
43 ========================================================================
44 HTB is like TBF with multiple classes. It is also similar to CBQ because
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +090045 it allows to assign priority to each class in hierarchy.
Linus Torvalds1da177e2005-04-16 15:20:36 -070046 In fact it is another implementation of Floyd's formal sharing.
47
48 Levels:
    Each class is assigned a level. A leaf ALWAYS has level 0 and root
    classes have level TC_HTB_MAXDEPTH-1. Interior nodes have a level
    one less than their parent.
52*/
53
Jesper Dangaard Brouer47083fc2008-06-16 16:39:32 -070054static int htb_hysteresis __read_mostly = 0; /* whether to use mode hysteresis for speedup */
Stephen Hemminger87990462006-08-10 23:35:16 -070055#define HTB_VER 0x30011 /* major must be matched with number suplied by TC as version */
Linus Torvalds1da177e2005-04-16 15:20:36 -070056
57#if HTB_VER >> 16 != TC_HTB_PROTOVER
58#error "Mismatched sch_htb.c and pkt_sch.h"
59#endif
60
Jesper Dangaard Brouer47083fc2008-06-16 16:39:32 -070061/* Module parameter and sysfs export */
62module_param (htb_hysteresis, int, 0640);
63MODULE_PARM_DESC(htb_hysteresis, "Hysteresis mode, less CPU load, less accurate");
64
/* Internal send state of a single class. */
enum htb_cmode {
	/* class can neither send nor borrow */
	HTB_CANT_SEND,
	/* class cannot send on its own but may borrow */
	HTB_MAY_BORROW,
	/* class can send */
	HTB_CAN_SEND
};
71
72/* interior & leaf nodes; props specific to leaves are marked L: */
Stephen Hemminger87990462006-08-10 23:35:16 -070073struct htb_class {
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -070074 struct Qdisc_class_common common;
Stephen Hemminger87990462006-08-10 23:35:16 -070075 /* general class parameters */
Stephen Hemminger87990462006-08-10 23:35:16 -070076 struct gnet_stats_basic bstats;
77 struct gnet_stats_queue qstats;
78 struct gnet_stats_rate_est rate_est;
79 struct tc_htb_xstats xstats; /* our special stats */
80 int refcnt; /* usage count of this class */
Linus Torvalds1da177e2005-04-16 15:20:36 -070081
Stephen Hemminger87990462006-08-10 23:35:16 -070082 /* topology */
83 int level; /* our level (see above) */
Patrick McHardy42077592008-07-05 23:22:53 -070084 unsigned int children;
Stephen Hemminger87990462006-08-10 23:35:16 -070085 struct htb_class *parent; /* parent class */
Linus Torvalds1da177e2005-04-16 15:20:36 -070086
Jarek Poplawskic19f7a32008-12-03 21:09:45 -080087 int prio; /* these two are used only by leaves... */
88 int quantum; /* but stored for parent-to-leaf return */
89
Stephen Hemminger87990462006-08-10 23:35:16 -070090 union {
91 struct htb_class_leaf {
92 struct Qdisc *q;
Stephen Hemminger87990462006-08-10 23:35:16 -070093 int deficit[TC_HTB_MAXDEPTH];
94 struct list_head drop_list;
95 } leaf;
96 struct htb_class_inner {
97 struct rb_root feed[TC_HTB_NUMPRIO]; /* feed trees */
98 struct rb_node *ptr[TC_HTB_NUMPRIO]; /* current class ptr */
99 /* When class changes from state 1->2 and disconnects from
100 parent's feed then we lost ptr value and start from the
101 first child again. Here we store classid of the
102 last valid ptr (used when ptr is NULL). */
103 u32 last_ptr_id[TC_HTB_NUMPRIO];
104 } inner;
105 } un;
106 struct rb_node node[TC_HTB_NUMPRIO]; /* node for self or feed tree */
107 struct rb_node pq_node; /* node for event queue */
Patrick McHardyfb983d42007-03-16 01:22:39 -0700108 psched_time_t pq_key;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109
Stephen Hemminger87990462006-08-10 23:35:16 -0700110 int prio_activity; /* for which prios are we active */
111 enum htb_cmode cmode; /* current mode of the class */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112
Stephen Hemminger87990462006-08-10 23:35:16 -0700113 /* class attached filters */
114 struct tcf_proto *filter_list;
115 int filter_cnt;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700116
Stephen Hemminger87990462006-08-10 23:35:16 -0700117 int warned; /* only one warning about non work conserving .. */
118
119 /* token bucket parameters */
120 struct qdisc_rate_table *rate; /* rate table of the class itself */
121 struct qdisc_rate_table *ceil; /* ceiling rate (limits borrows too) */
122 long buffer, cbuffer; /* token bucket depth/rate */
123 psched_tdiff_t mbuffer; /* max wait time */
124 long tokens, ctokens; /* current number of tokens */
125 psched_time_t t_c; /* checkpoint time */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700126};
127
Stephen Hemminger87990462006-08-10 23:35:16 -0700128struct htb_sched {
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -0700129 struct Qdisc_class_hash clhash;
Stephen Hemminger0cef2962006-08-10 23:35:38 -0700130 struct list_head drops[TC_HTB_NUMPRIO];/* active leaves (for drops) */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131
Stephen Hemminger87990462006-08-10 23:35:16 -0700132 /* self list - roots of self generating tree */
133 struct rb_root row[TC_HTB_MAXDEPTH][TC_HTB_NUMPRIO];
134 int row_mask[TC_HTB_MAXDEPTH];
135 struct rb_node *ptr[TC_HTB_MAXDEPTH][TC_HTB_NUMPRIO];
136 u32 last_ptr_id[TC_HTB_MAXDEPTH][TC_HTB_NUMPRIO];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700137
Stephen Hemminger87990462006-08-10 23:35:16 -0700138 /* self wait list - roots of wait PQs per row */
139 struct rb_root wait_pq[TC_HTB_MAXDEPTH];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700140
Stephen Hemminger87990462006-08-10 23:35:16 -0700141 /* time of nearest event per level (row) */
Patrick McHardyfb983d42007-03-16 01:22:39 -0700142 psched_time_t near_ev_cache[TC_HTB_MAXDEPTH];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700143
Stephen Hemminger87990462006-08-10 23:35:16 -0700144 int defcls; /* class where unclassified flows go to */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700145
Stephen Hemminger87990462006-08-10 23:35:16 -0700146 /* filters for qdisc itself */
147 struct tcf_proto *filter_list;
Stephen Hemminger87990462006-08-10 23:35:16 -0700148
149 int rate2quantum; /* quant = rate / rate2quantum */
150 psched_time_t now; /* cached dequeue time */
Patrick McHardyfb983d42007-03-16 01:22:39 -0700151 struct qdisc_watchdog watchdog;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700152
Stephen Hemminger87990462006-08-10 23:35:16 -0700153 /* non shaped skbs; let them go directly thru */
154 struct sk_buff_head direct_queue;
155 int direct_qlen; /* max qlen of above */
156
157 long direct_pkts;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700158};
159
Linus Torvalds1da177e2005-04-16 15:20:36 -0700160/* find class in global hash table using given handle */
Stephen Hemminger87990462006-08-10 23:35:16 -0700161static inline struct htb_class *htb_find(u32 handle, struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700162{
163 struct htb_sched *q = qdisc_priv(sch);
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -0700164 struct Qdisc_class_common *clc;
Stephen Hemminger0cef2962006-08-10 23:35:38 -0700165
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -0700166 clc = qdisc_class_find(&q->clhash, handle);
167 if (clc == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168 return NULL;
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -0700169 return container_of(clc, struct htb_class, common);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700170}
171
172/**
173 * htb_classify - classify a packet into class
174 *
175 * It returns NULL if the packet should be dropped or -1 if the packet
176 * should be passed directly thru. In all other cases leaf class is returned.
177 * We allow direct class selection by classid in priority. The we examine
178 * filters in qdisc and in inner nodes (if higher filter points to the inner
179 * node). If we end up with classid MAJOR:0 we enqueue the skb into special
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900180 * internal fifo (direct). These packets then go directly thru. If we still
Linus Torvalds1da177e2005-04-16 15:20:36 -0700181 * have no valid leaf we try to use MAJOR:default leaf. It still unsuccessfull
182 * then finish and return direct queue.
183 */
184#define HTB_DIRECT (struct htb_class*)-1
Linus Torvalds1da177e2005-04-16 15:20:36 -0700185
Stephen Hemminger87990462006-08-10 23:35:16 -0700186static struct htb_class *htb_classify(struct sk_buff *skb, struct Qdisc *sch,
187 int *qerr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700188{
189 struct htb_sched *q = qdisc_priv(sch);
190 struct htb_class *cl;
191 struct tcf_result res;
192 struct tcf_proto *tcf;
193 int result;
194
195 /* allow to select class by setting skb->priority to valid classid;
196 note that nfmark can be used too by attaching filter fw with no
197 rules in it */
198 if (skb->priority == sch->handle)
Stephen Hemminger87990462006-08-10 23:35:16 -0700199 return HTB_DIRECT; /* X:0 (direct flow) selected */
200 if ((cl = htb_find(skb->priority, sch)) != NULL && cl->level == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700201 return cl;
202
Jarek Poplawskic27f3392008-08-04 22:39:11 -0700203 *qerr = NET_XMIT_SUCCESS | __NET_XMIT_BYPASS;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700204 tcf = q->filter_list;
205 while (tcf && (result = tc_classify(skb, tcf, &res)) >= 0) {
206#ifdef CONFIG_NET_CLS_ACT
207 switch (result) {
208 case TC_ACT_QUEUED:
Stephen Hemminger87990462006-08-10 23:35:16 -0700209 case TC_ACT_STOLEN:
Jarek Poplawski378a2f02008-08-04 22:31:03 -0700210 *qerr = NET_XMIT_SUCCESS | __NET_XMIT_STOLEN;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700211 case TC_ACT_SHOT:
212 return NULL;
213 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700214#endif
Stephen Hemminger87990462006-08-10 23:35:16 -0700215 if ((cl = (void *)res.class) == NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700216 if (res.classid == sch->handle)
Stephen Hemminger87990462006-08-10 23:35:16 -0700217 return HTB_DIRECT; /* X:0 (direct flow) */
218 if ((cl = htb_find(res.classid, sch)) == NULL)
219 break; /* filter selected invalid classid */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220 }
221 if (!cl->level)
Stephen Hemminger87990462006-08-10 23:35:16 -0700222 return cl; /* we hit leaf; return it */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700223
224 /* we have got inner class; apply inner filter chain */
225 tcf = cl->filter_list;
226 }
227 /* classification failed; try to use default class */
Stephen Hemminger87990462006-08-10 23:35:16 -0700228 cl = htb_find(TC_H_MAKE(TC_H_MAJ(sch->handle), q->defcls), sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229 if (!cl || cl->level)
Stephen Hemminger87990462006-08-10 23:35:16 -0700230 return HTB_DIRECT; /* bad default .. this is safe bet */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700231 return cl;
232}
233
Linus Torvalds1da177e2005-04-16 15:20:36 -0700234/**
235 * htb_add_to_id_tree - adds class to the round robin list
236 *
237 * Routine adds class to the list (actually tree) sorted by classid.
238 * Make sure that class is not already on such list for given prio.
239 */
Stephen Hemminger87990462006-08-10 23:35:16 -0700240static void htb_add_to_id_tree(struct rb_root *root,
241 struct htb_class *cl, int prio)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700242{
243 struct rb_node **p = &root->rb_node, *parent = NULL;
Stephen Hemminger3bf72952006-08-10 23:31:08 -0700244
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245 while (*p) {
Stephen Hemminger87990462006-08-10 23:35:16 -0700246 struct htb_class *c;
247 parent = *p;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248 c = rb_entry(parent, struct htb_class, node[prio]);
Stephen Hemminger3bf72952006-08-10 23:31:08 -0700249
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -0700250 if (cl->common.classid > c->common.classid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251 p = &parent->rb_right;
Stephen Hemminger87990462006-08-10 23:35:16 -0700252 else
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253 p = &parent->rb_left;
254 }
255 rb_link_node(&cl->node[prio], parent, p);
256 rb_insert_color(&cl->node[prio], root);
257}
258
259/**
260 * htb_add_to_wait_tree - adds class to the event queue with delay
261 *
262 * The class is added to priority event queue to indicate that class will
263 * change its mode in cl->pq_key microseconds. Make sure that class is not
264 * already in the queue.
265 */
Stephen Hemminger87990462006-08-10 23:35:16 -0700266static void htb_add_to_wait_tree(struct htb_sched *q,
267 struct htb_class *cl, long delay)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268{
269 struct rb_node **p = &q->wait_pq[cl->level].rb_node, *parent = NULL;
Stephen Hemminger3bf72952006-08-10 23:31:08 -0700270
Patrick McHardyfb983d42007-03-16 01:22:39 -0700271 cl->pq_key = q->now + delay;
272 if (cl->pq_key == q->now)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700273 cl->pq_key++;
274
275 /* update the nearest event cache */
Patrick McHardyfb983d42007-03-16 01:22:39 -0700276 if (q->near_ev_cache[cl->level] > cl->pq_key)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700277 q->near_ev_cache[cl->level] = cl->pq_key;
Stephen Hemminger87990462006-08-10 23:35:16 -0700278
Linus Torvalds1da177e2005-04-16 15:20:36 -0700279 while (*p) {
Stephen Hemminger87990462006-08-10 23:35:16 -0700280 struct htb_class *c;
281 parent = *p;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700282 c = rb_entry(parent, struct htb_class, pq_node);
Patrick McHardyfb983d42007-03-16 01:22:39 -0700283 if (cl->pq_key >= c->pq_key)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700284 p = &parent->rb_right;
Stephen Hemminger87990462006-08-10 23:35:16 -0700285 else
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286 p = &parent->rb_left;
287 }
288 rb_link_node(&cl->pq_node, parent, p);
289 rb_insert_color(&cl->pq_node, &q->wait_pq[cl->level]);
290}
291
/**
 * htb_next_rb_node - advance *n to its successor in the rbtree
 *
 * *n is replaced by whatever rb_next() returns for it, which is NULL
 * once the last key has been passed.
 */
static inline void htb_next_rb_node(struct rb_node **n)
{
	struct rb_node *current_node = *n;

	*n = rb_next(current_node);
}
302
303/**
304 * htb_add_class_to_row - add class to its row
305 *
306 * The class is added to row at priorities marked in mask.
307 * It does nothing if mask == 0.
308 */
Stephen Hemminger87990462006-08-10 23:35:16 -0700309static inline void htb_add_class_to_row(struct htb_sched *q,
310 struct htb_class *cl, int mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700311{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312 q->row_mask[cl->level] |= mask;
313 while (mask) {
314 int prio = ffz(~mask);
315 mask &= ~(1 << prio);
Stephen Hemminger87990462006-08-10 23:35:16 -0700316 htb_add_to_id_tree(q->row[cl->level] + prio, cl, prio);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700317 }
318}
319
/* Erase @rb from @root and mark it as unlinked. Being asked to erase a node
 * that is already marked empty indicates a bug in this code; it only
 * triggers a warning because it need not be fatal.
 */
static void htb_safe_rb_erase(struct rb_node *rb, struct rb_root *root)
{
	if (RB_EMPTY_NODE(rb)) {
		WARN_ON(1);
		return;
	}

	rb_erase(rb, root);
	RB_CLEAR_NODE(rb);
}
330
331
Linus Torvalds1da177e2005-04-16 15:20:36 -0700332/**
333 * htb_remove_class_from_row - removes class from its row
334 *
335 * The class is removed from row at priorities marked in mask.
336 * It does nothing if mask == 0.
337 */
Stephen Hemminger87990462006-08-10 23:35:16 -0700338static inline void htb_remove_class_from_row(struct htb_sched *q,
339 struct htb_class *cl, int mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700340{
341 int m = 0;
Stephen Hemminger3bf72952006-08-10 23:31:08 -0700342
Linus Torvalds1da177e2005-04-16 15:20:36 -0700343 while (mask) {
344 int prio = ffz(~mask);
Stephen Hemminger3696f622006-08-10 23:36:01 -0700345
Linus Torvalds1da177e2005-04-16 15:20:36 -0700346 mask &= ~(1 << prio);
Stephen Hemminger87990462006-08-10 23:35:16 -0700347 if (q->ptr[cl->level][prio] == cl->node + prio)
348 htb_next_rb_node(q->ptr[cl->level] + prio);
Stephen Hemminger3696f622006-08-10 23:36:01 -0700349
350 htb_safe_rb_erase(cl->node + prio, q->row[cl->level] + prio);
Stephen Hemminger87990462006-08-10 23:35:16 -0700351 if (!q->row[cl->level][prio].rb_node)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700352 m |= 1 << prio;
353 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700354 q->row_mask[cl->level] &= ~m;
355}
356
357/**
358 * htb_activate_prios - creates active classe's feed chain
359 *
360 * The class is connected to ancestors and/or appropriate rows
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900361 * for priorities it is participating on. cl->cmode must be new
Linus Torvalds1da177e2005-04-16 15:20:36 -0700362 * (activated) mode. It does nothing if cl->prio_activity == 0.
363 */
Stephen Hemminger87990462006-08-10 23:35:16 -0700364static void htb_activate_prios(struct htb_sched *q, struct htb_class *cl)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700365{
366 struct htb_class *p = cl->parent;
Stephen Hemminger87990462006-08-10 23:35:16 -0700367 long m, mask = cl->prio_activity;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700368
369 while (cl->cmode == HTB_MAY_BORROW && p && mask) {
Stephen Hemminger87990462006-08-10 23:35:16 -0700370 m = mask;
371 while (m) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700372 int prio = ffz(~m);
373 m &= ~(1 << prio);
Stephen Hemminger87990462006-08-10 23:35:16 -0700374
Linus Torvalds1da177e2005-04-16 15:20:36 -0700375 if (p->un.inner.feed[prio].rb_node)
376 /* parent already has its feed in use so that
377 reset bit in mask as parent is already ok */
378 mask &= ~(1 << prio);
Stephen Hemminger87990462006-08-10 23:35:16 -0700379
380 htb_add_to_id_tree(p->un.inner.feed + prio, cl, prio);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700381 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700382 p->prio_activity |= mask;
Stephen Hemminger87990462006-08-10 23:35:16 -0700383 cl = p;
384 p = cl->parent;
Stephen Hemminger3bf72952006-08-10 23:31:08 -0700385
Linus Torvalds1da177e2005-04-16 15:20:36 -0700386 }
387 if (cl->cmode == HTB_CAN_SEND && mask)
Stephen Hemminger87990462006-08-10 23:35:16 -0700388 htb_add_class_to_row(q, cl, mask);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700389}
390
391/**
392 * htb_deactivate_prios - remove class from feed chain
393 *
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900394 * cl->cmode must represent old mode (before deactivation). It does
Linus Torvalds1da177e2005-04-16 15:20:36 -0700395 * nothing if cl->prio_activity == 0. Class is removed from all feed
396 * chains and rows.
397 */
398static void htb_deactivate_prios(struct htb_sched *q, struct htb_class *cl)
399{
400 struct htb_class *p = cl->parent;
Stephen Hemminger87990462006-08-10 23:35:16 -0700401 long m, mask = cl->prio_activity;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700402
403 while (cl->cmode == HTB_MAY_BORROW && p && mask) {
Stephen Hemminger87990462006-08-10 23:35:16 -0700404 m = mask;
405 mask = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700406 while (m) {
407 int prio = ffz(~m);
408 m &= ~(1 << prio);
Stephen Hemminger87990462006-08-10 23:35:16 -0700409
410 if (p->un.inner.ptr[prio] == cl->node + prio) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700411 /* we are removing child which is pointed to from
412 parent feed - forget the pointer but remember
413 classid */
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -0700414 p->un.inner.last_ptr_id[prio] = cl->common.classid;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700415 p->un.inner.ptr[prio] = NULL;
416 }
Stephen Hemminger87990462006-08-10 23:35:16 -0700417
Stephen Hemminger3696f622006-08-10 23:36:01 -0700418 htb_safe_rb_erase(cl->node + prio, p->un.inner.feed + prio);
Stephen Hemminger87990462006-08-10 23:35:16 -0700419
420 if (!p->un.inner.feed[prio].rb_node)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700421 mask |= 1 << prio;
422 }
Stephen Hemminger3bf72952006-08-10 23:31:08 -0700423
Linus Torvalds1da177e2005-04-16 15:20:36 -0700424 p->prio_activity &= ~mask;
Stephen Hemminger87990462006-08-10 23:35:16 -0700425 cl = p;
426 p = cl->parent;
Stephen Hemminger3bf72952006-08-10 23:31:08 -0700427
Linus Torvalds1da177e2005-04-16 15:20:36 -0700428 }
Stephen Hemminger87990462006-08-10 23:35:16 -0700429 if (cl->cmode == HTB_CAN_SEND && mask)
430 htb_remove_class_from_row(q, cl, mask);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700431}
432
Stephen Hemminger18a63e82006-08-10 23:34:02 -0700433static inline long htb_lowater(const struct htb_class *cl)
434{
Jesper Dangaard Brouer47083fc2008-06-16 16:39:32 -0700435 if (htb_hysteresis)
436 return cl->cmode != HTB_CANT_SEND ? -cl->cbuffer : 0;
437 else
438 return 0;
Stephen Hemminger18a63e82006-08-10 23:34:02 -0700439}
440static inline long htb_hiwater(const struct htb_class *cl)
441{
Jesper Dangaard Brouer47083fc2008-06-16 16:39:32 -0700442 if (htb_hysteresis)
443 return cl->cmode == HTB_CAN_SEND ? -cl->buffer : 0;
444 else
445 return 0;
Stephen Hemminger18a63e82006-08-10 23:34:02 -0700446}
Jesper Dangaard Brouer47083fc2008-06-16 16:39:32 -0700447
Stephen Hemminger18a63e82006-08-10 23:34:02 -0700448
Linus Torvalds1da177e2005-04-16 15:20:36 -0700449/**
450 * htb_class_mode - computes and returns current class mode
451 *
452 * It computes cl's mode at time cl->t_c+diff and returns it. If mode
453 * is not HTB_CAN_SEND then cl->pq_key is updated to time difference
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900454 * from now to time when cl will change its state.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700455 * Also it is worth to note that class mode doesn't change simply
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900456 * at cl->{c,}tokens == 0 but there can rather be hysteresis of
Linus Torvalds1da177e2005-04-16 15:20:36 -0700457 * 0 .. -cl->{c,}buffer range. It is meant to limit number of
458 * mode transitions per time unit. The speed gain is about 1/6.
459 */
Stephen Hemminger87990462006-08-10 23:35:16 -0700460static inline enum htb_cmode
461htb_class_mode(struct htb_class *cl, long *diff)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700462{
Stephen Hemminger87990462006-08-10 23:35:16 -0700463 long toks;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700464
Stephen Hemminger87990462006-08-10 23:35:16 -0700465 if ((toks = (cl->ctokens + *diff)) < htb_lowater(cl)) {
466 *diff = -toks;
467 return HTB_CANT_SEND;
468 }
Stephen Hemminger18a63e82006-08-10 23:34:02 -0700469
Stephen Hemminger87990462006-08-10 23:35:16 -0700470 if ((toks = (cl->tokens + *diff)) >= htb_hiwater(cl))
471 return HTB_CAN_SEND;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700472
Stephen Hemminger87990462006-08-10 23:35:16 -0700473 *diff = -toks;
474 return HTB_MAY_BORROW;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700475}
476
477/**
478 * htb_change_class_mode - changes classe's mode
479 *
480 * This should be the only way how to change classe's mode under normal
481 * cirsumstances. Routine will update feed lists linkage, change mode
482 * and add class to the wait event queue if appropriate. New mode should
483 * be different from old one and cl->pq_key has to be valid if changing
484 * to mode other than HTB_CAN_SEND (see htb_add_to_wait_tree).
485 */
Stephen Hemminger87990462006-08-10 23:35:16 -0700486static void
Linus Torvalds1da177e2005-04-16 15:20:36 -0700487htb_change_class_mode(struct htb_sched *q, struct htb_class *cl, long *diff)
Stephen Hemminger87990462006-08-10 23:35:16 -0700488{
489 enum htb_cmode new_mode = htb_class_mode(cl, diff);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490
491 if (new_mode == cl->cmode)
Stephen Hemminger87990462006-08-10 23:35:16 -0700492 return;
493
494 if (cl->prio_activity) { /* not necessary: speed optimization */
495 if (cl->cmode != HTB_CANT_SEND)
496 htb_deactivate_prios(q, cl);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700497 cl->cmode = new_mode;
Stephen Hemminger87990462006-08-10 23:35:16 -0700498 if (new_mode != HTB_CANT_SEND)
499 htb_activate_prios(q, cl);
500 } else
Linus Torvalds1da177e2005-04-16 15:20:36 -0700501 cl->cmode = new_mode;
502}
503
504/**
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900505 * htb_activate - inserts leaf cl into appropriate active feeds
Linus Torvalds1da177e2005-04-16 15:20:36 -0700506 *
507 * Routine learns (new) priority of leaf and activates feed chain
508 * for the prio. It can be called on already active leaf safely.
509 * It also adds leaf into droplist.
510 */
Stephen Hemminger87990462006-08-10 23:35:16 -0700511static inline void htb_activate(struct htb_sched *q, struct htb_class *cl)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700512{
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700513 WARN_ON(cl->level || !cl->un.leaf.q || !cl->un.leaf.q->q.qlen);
Stephen Hemminger3bf72952006-08-10 23:31:08 -0700514
Linus Torvalds1da177e2005-04-16 15:20:36 -0700515 if (!cl->prio_activity) {
Jarek Poplawskic19f7a32008-12-03 21:09:45 -0800516 cl->prio_activity = 1 << cl->prio;
Stephen Hemminger87990462006-08-10 23:35:16 -0700517 htb_activate_prios(q, cl);
518 list_add_tail(&cl->un.leaf.drop_list,
Jarek Poplawskic19f7a32008-12-03 21:09:45 -0800519 q->drops + cl->prio);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700520 }
521}
522
523/**
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900524 * htb_deactivate - remove leaf cl from active feeds
Linus Torvalds1da177e2005-04-16 15:20:36 -0700525 *
526 * Make sure that leaf is active. In the other words it can't be called
527 * with non-active leaf. It also removes class from the drop list.
528 */
Stephen Hemminger87990462006-08-10 23:35:16 -0700529static inline void htb_deactivate(struct htb_sched *q, struct htb_class *cl)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700530{
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700531 WARN_ON(!cl->prio_activity);
Stephen Hemminger3bf72952006-08-10 23:31:08 -0700532
Stephen Hemminger87990462006-08-10 23:35:16 -0700533 htb_deactivate_prios(q, cl);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700534 cl->prio_activity = 0;
535 list_del_init(&cl->un.leaf.drop_list);
536}
537
538static int htb_enqueue(struct sk_buff *skb, struct Qdisc *sch)
539{
Jarek Poplawskif30ab412008-11-13 22:56:30 -0800540 int uninitialized_var(ret);
Stephen Hemminger87990462006-08-10 23:35:16 -0700541 struct htb_sched *q = qdisc_priv(sch);
542 struct htb_class *cl = htb_classify(skb, sch, &ret);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700543
Stephen Hemminger87990462006-08-10 23:35:16 -0700544 if (cl == HTB_DIRECT) {
545 /* enqueue to helper queue */
546 if (q->direct_queue.qlen < q->direct_qlen) {
547 __skb_queue_tail(&q->direct_queue, skb);
548 q->direct_pkts++;
549 } else {
550 kfree_skb(skb);
551 sch->qstats.drops++;
552 return NET_XMIT_DROP;
553 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700554#ifdef CONFIG_NET_CLS_ACT
Stephen Hemminger87990462006-08-10 23:35:16 -0700555 } else if (!cl) {
Jarek Poplawskic27f3392008-08-04 22:39:11 -0700556 if (ret & __NET_XMIT_BYPASS)
Stephen Hemminger87990462006-08-10 23:35:16 -0700557 sch->qstats.drops++;
558 kfree_skb(skb);
559 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700560#endif
Jarek Poplawski378a2f02008-08-04 22:31:03 -0700561 } else if ((ret = qdisc_enqueue(skb, cl->un.leaf.q)) != NET_XMIT_SUCCESS) {
562 if (net_xmit_drop_count(ret)) {
563 sch->qstats.drops++;
564 cl->qstats.drops++;
565 }
David S. Miller69747652008-08-17 23:55:36 -0700566 return ret;
Stephen Hemminger87990462006-08-10 23:35:16 -0700567 } else {
Ranjit Manomohanc9726d62007-07-10 22:43:16 -0700568 cl->bstats.packets +=
569 skb_is_gso(skb)?skb_shinfo(skb)->gso_segs:1;
Jussi Kivilinna0abf77e2008-07-20 00:08:27 -0700570 cl->bstats.bytes += qdisc_pkt_len(skb);
Stephen Hemminger87990462006-08-10 23:35:16 -0700571 htb_activate(q, cl);
572 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700573
Stephen Hemminger87990462006-08-10 23:35:16 -0700574 sch->q.qlen++;
Ranjit Manomohanc9726d62007-07-10 22:43:16 -0700575 sch->bstats.packets += skb_is_gso(skb)?skb_shinfo(skb)->gso_segs:1;
Jussi Kivilinna0abf77e2008-07-20 00:08:27 -0700576 sch->bstats.bytes += qdisc_pkt_len(skb);
Stephen Hemminger87990462006-08-10 23:35:16 -0700577 return NET_XMIT_SUCCESS;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700578}
579
Linus Torvalds1da177e2005-04-16 15:20:36 -0700580/**
581 * htb_charge_class - charges amount "bytes" to leaf and ancestors
582 *
583 * Routine assumes that packet "bytes" long was dequeued from leaf cl
584 * borrowing from "level". It accounts bytes to ceil leaky bucket for
585 * leaf and all ancestors and to rate bucket for ancestors at levels
586 * "level" and higher. It also handles possible change of mode resulting
587 * from the update. Note that mode can also increase here (MAY_BORROW to
588 * CAN_SEND) because we can use more precise clock that event queue here.
589 * In such case we remove class from event queue first.
590 */
Stephen Hemminger87990462006-08-10 23:35:16 -0700591static void htb_charge_class(struct htb_sched *q, struct htb_class *cl,
Ranjit Manomohanc9726d62007-07-10 22:43:16 -0700592 int level, struct sk_buff *skb)
Stephen Hemminger87990462006-08-10 23:35:16 -0700593{
Jussi Kivilinna0abf77e2008-07-20 00:08:27 -0700594 int bytes = qdisc_pkt_len(skb);
Stephen Hemminger87990462006-08-10 23:35:16 -0700595 long toks, diff;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700596 enum htb_cmode old_mode;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700597
598#define HTB_ACCNT(T,B,R) toks = diff + cl->T; \
599 if (toks > cl->B) toks = cl->B; \
Jarek Poplawski23cb9132008-12-03 21:16:58 -0800600 toks -= (long) qdisc_l2t(cl->R, bytes); \
Linus Torvalds1da177e2005-04-16 15:20:36 -0700601 if (toks <= -cl->mbuffer) toks = 1-cl->mbuffer; \
602 cl->T = toks
603
604 while (cl) {
Patrick McHardy03cc45c2007-03-23 11:29:11 -0700605 diff = psched_tdiff_bounded(q->now, cl->t_c, cl->mbuffer);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700606 if (cl->level >= level) {
Stephen Hemminger87990462006-08-10 23:35:16 -0700607 if (cl->level == level)
608 cl->xstats.lends++;
609 HTB_ACCNT(tokens, buffer, rate);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700610 } else {
611 cl->xstats.borrows++;
Stephen Hemminger87990462006-08-10 23:35:16 -0700612 cl->tokens += diff; /* we moved t_c; update tokens */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700613 }
Stephen Hemminger87990462006-08-10 23:35:16 -0700614 HTB_ACCNT(ctokens, cbuffer, ceil);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700615 cl->t_c = q->now;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700616
Stephen Hemminger87990462006-08-10 23:35:16 -0700617 old_mode = cl->cmode;
618 diff = 0;
619 htb_change_class_mode(q, cl, &diff);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700620 if (old_mode != cl->cmode) {
621 if (old_mode != HTB_CAN_SEND)
Stephen Hemminger3696f622006-08-10 23:36:01 -0700622 htb_safe_rb_erase(&cl->pq_node, q->wait_pq + cl->level);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700623 if (cl->cmode != HTB_CAN_SEND)
Stephen Hemminger87990462006-08-10 23:35:16 -0700624 htb_add_to_wait_tree(q, cl, diff);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700625 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700626
627 /* update byte stats except for leaves which are already updated */
628 if (cl->level) {
629 cl->bstats.bytes += bytes;
Ranjit Manomohanc9726d62007-07-10 22:43:16 -0700630 cl->bstats.packets += skb_is_gso(skb)?
631 skb_shinfo(skb)->gso_segs:1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700632 }
633 cl = cl->parent;
634 }
635}
636
637/**
638 * htb_do_events - make mode changes to classes at the level
639 *
Patrick McHardyfb983d42007-03-16 01:22:39 -0700640 * Scans event queue for pending events and applies them. Returns time of
Linus Torvalds1da177e2005-04-16 15:20:36 -0700641 * next pending event (0 for no event in pq).
Patrick McHardyfb983d42007-03-16 01:22:39 -0700642 * Note: Applied are events whose have cl->pq_key <= q->now.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700643 */
Patrick McHardyfb983d42007-03-16 01:22:39 -0700644static psched_time_t htb_do_events(struct htb_sched *q, int level)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700645{
Martin Devera8f3ea332008-03-23 22:00:38 -0700646 /* don't run for longer than 2 jiffies; 2 is used instead of
647 1 to simplify things when jiffy is going to be incremented
648 too soon */
649 unsigned long stop_at = jiffies + 2;
650 while (time_before(jiffies, stop_at)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700651 struct htb_class *cl;
652 long diff;
Akinbou Mita30bdbe32006-10-12 01:52:05 -0700653 struct rb_node *p = rb_first(&q->wait_pq[level]);
654
Stephen Hemminger87990462006-08-10 23:35:16 -0700655 if (!p)
656 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700657
658 cl = rb_entry(p, struct htb_class, pq_node);
Patrick McHardyfb983d42007-03-16 01:22:39 -0700659 if (cl->pq_key > q->now)
660 return cl->pq_key;
661
Stephen Hemminger3696f622006-08-10 23:36:01 -0700662 htb_safe_rb_erase(p, q->wait_pq + level);
Patrick McHardy03cc45c2007-03-23 11:29:11 -0700663 diff = psched_tdiff_bounded(q->now, cl->t_c, cl->mbuffer);
Stephen Hemminger87990462006-08-10 23:35:16 -0700664 htb_change_class_mode(q, cl, &diff);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700665 if (cl->cmode != HTB_CAN_SEND)
Stephen Hemminger87990462006-08-10 23:35:16 -0700666 htb_add_to_wait_tree(q, cl, diff);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700667 }
Martin Devera8f3ea332008-03-23 22:00:38 -0700668 /* too much load - let's continue on next jiffie */
669 return q->now + PSCHED_TICKS_PER_SEC / HZ;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700670}
671
672/* Returns class->node+prio from id-tree where classe's id is >= id. NULL
673 is no such one exists. */
Stephen Hemminger87990462006-08-10 23:35:16 -0700674static struct rb_node *htb_id_find_next_upper(int prio, struct rb_node *n,
675 u32 id)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700676{
677 struct rb_node *r = NULL;
678 while (n) {
Stephen Hemminger87990462006-08-10 23:35:16 -0700679 struct htb_class *cl =
680 rb_entry(n, struct htb_class, node[prio]);
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -0700681 if (id == cl->common.classid)
Stephen Hemminger87990462006-08-10 23:35:16 -0700682 return n;
683
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -0700684 if (id > cl->common.classid) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700685 n = n->rb_right;
686 } else {
687 r = n;
688 n = n->rb_left;
689 }
690 }
691 return r;
692}
693
694/**
695 * htb_lookup_leaf - returns next leaf class in DRR order
696 *
697 * Find leaf where current feed pointers points to.
698 */
Stephen Hemminger87990462006-08-10 23:35:16 -0700699static struct htb_class *htb_lookup_leaf(struct rb_root *tree, int prio,
700 struct rb_node **pptr, u32 * pid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700701{
702 int i;
703 struct {
704 struct rb_node *root;
705 struct rb_node **pptr;
706 u32 *pid;
Stephen Hemminger87990462006-08-10 23:35:16 -0700707 } stk[TC_HTB_MAXDEPTH], *sp = stk;
708
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700709 WARN_ON(!tree->rb_node);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700710 sp->root = tree->rb_node;
711 sp->pptr = pptr;
712 sp->pid = pid;
713
714 for (i = 0; i < 65535; i++) {
Stephen Hemminger87990462006-08-10 23:35:16 -0700715 if (!*sp->pptr && *sp->pid) {
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900716 /* ptr was invalidated but id is valid - try to recover
Linus Torvalds1da177e2005-04-16 15:20:36 -0700717 the original or next ptr */
Stephen Hemminger87990462006-08-10 23:35:16 -0700718 *sp->pptr =
719 htb_id_find_next_upper(prio, sp->root, *sp->pid);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700720 }
Stephen Hemminger87990462006-08-10 23:35:16 -0700721 *sp->pid = 0; /* ptr is valid now so that remove this hint as it
722 can become out of date quickly */
723 if (!*sp->pptr) { /* we are at right end; rewind & go up */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700724 *sp->pptr = sp->root;
Stephen Hemminger87990462006-08-10 23:35:16 -0700725 while ((*sp->pptr)->rb_left)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700726 *sp->pptr = (*sp->pptr)->rb_left;
727 if (sp > stk) {
728 sp--;
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700729 WARN_ON(!*sp->pptr);
Stephen Hemminger87990462006-08-10 23:35:16 -0700730 if (!*sp->pptr)
731 return NULL;
732 htb_next_rb_node(sp->pptr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700733 }
734 } else {
735 struct htb_class *cl;
Stephen Hemminger87990462006-08-10 23:35:16 -0700736 cl = rb_entry(*sp->pptr, struct htb_class, node[prio]);
737 if (!cl->level)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700738 return cl;
739 (++sp)->root = cl->un.inner.feed[prio].rb_node;
Stephen Hemminger87990462006-08-10 23:35:16 -0700740 sp->pptr = cl->un.inner.ptr + prio;
741 sp->pid = cl->un.inner.last_ptr_id + prio;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700742 }
743 }
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700744 WARN_ON(1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700745 return NULL;
746}
747
748/* dequeues packet at given priority and level; call only if
749 you are sure that there is active class at prio/level */
Stephen Hemminger87990462006-08-10 23:35:16 -0700750static struct sk_buff *htb_dequeue_tree(struct htb_sched *q, int prio,
751 int level)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700752{
753 struct sk_buff *skb = NULL;
Stephen Hemminger87990462006-08-10 23:35:16 -0700754 struct htb_class *cl, *start;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700755 /* look initial class up in the row */
Stephen Hemminger87990462006-08-10 23:35:16 -0700756 start = cl = htb_lookup_leaf(q->row[level] + prio, prio,
757 q->ptr[level] + prio,
758 q->last_ptr_id[level] + prio);
759
Linus Torvalds1da177e2005-04-16 15:20:36 -0700760 do {
761next:
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700762 WARN_ON(!cl);
Stephen Hemminger87990462006-08-10 23:35:16 -0700763 if (!cl)
764 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700765
766 /* class can be empty - it is unlikely but can be true if leaf
767 qdisc drops packets in enqueue routine or if someone used
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900768 graft operation on the leaf since last dequeue;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700769 simply deactivate and skip such class */
770 if (unlikely(cl->un.leaf.q->q.qlen == 0)) {
771 struct htb_class *next;
Stephen Hemminger87990462006-08-10 23:35:16 -0700772 htb_deactivate(q, cl);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700773
774 /* row/level might become empty */
775 if ((q->row_mask[level] & (1 << prio)) == 0)
Stephen Hemminger87990462006-08-10 23:35:16 -0700776 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700777
Stephen Hemminger87990462006-08-10 23:35:16 -0700778 next = htb_lookup_leaf(q->row[level] + prio,
779 prio, q->ptr[level] + prio,
780 q->last_ptr_id[level] + prio);
781
782 if (cl == start) /* fix start if we just deleted it */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700783 start = next;
784 cl = next;
785 goto next;
786 }
Stephen Hemminger87990462006-08-10 23:35:16 -0700787
788 skb = cl->un.leaf.q->dequeue(cl->un.leaf.q);
789 if (likely(skb != NULL))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700790 break;
791 if (!cl->warned) {
Stephen Hemminger87990462006-08-10 23:35:16 -0700792 printk(KERN_WARNING
793 "htb: class %X isn't work conserving ?!\n",
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -0700794 cl->common.classid);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700795 cl->warned = 1;
796 }
Jarek Poplawski633fe662008-12-03 21:09:10 -0800797
Stephen Hemminger87990462006-08-10 23:35:16 -0700798 htb_next_rb_node((level ? cl->parent->un.inner.ptr : q->
799 ptr[0]) + prio);
800 cl = htb_lookup_leaf(q->row[level] + prio, prio,
801 q->ptr[level] + prio,
802 q->last_ptr_id[level] + prio);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700803
804 } while (cl != start);
805
806 if (likely(skb != NULL)) {
Jussi Kivilinna0abf77e2008-07-20 00:08:27 -0700807 cl->un.leaf.deficit[level] -= qdisc_pkt_len(skb);
808 if (cl->un.leaf.deficit[level] < 0) {
Jarek Poplawskic19f7a32008-12-03 21:09:45 -0800809 cl->un.leaf.deficit[level] += cl->quantum;
Stephen Hemminger87990462006-08-10 23:35:16 -0700810 htb_next_rb_node((level ? cl->parent->un.inner.ptr : q->
811 ptr[0]) + prio);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700812 }
813 /* this used to be after charge_class but this constelation
814 gives us slightly better performance */
815 if (!cl->un.leaf.q->q.qlen)
Stephen Hemminger87990462006-08-10 23:35:16 -0700816 htb_deactivate(q, cl);
Ranjit Manomohanc9726d62007-07-10 22:43:16 -0700817 htb_charge_class(q, cl, level, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700818 }
819 return skb;
820}
821
Linus Torvalds1da177e2005-04-16 15:20:36 -0700822static struct sk_buff *htb_dequeue(struct Qdisc *sch)
823{
824 struct sk_buff *skb = NULL;
825 struct htb_sched *q = qdisc_priv(sch);
826 int level;
Patrick McHardyfb983d42007-03-16 01:22:39 -0700827 psched_time_t next_event;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700828
829 /* try to dequeue direct packets as high prio (!) to minimize cpu work */
Stephen Hemminger87990462006-08-10 23:35:16 -0700830 skb = __skb_dequeue(&q->direct_queue);
831 if (skb != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700832 sch->flags &= ~TCQ_F_THROTTLED;
833 sch->q.qlen--;
834 return skb;
835 }
836
Stephen Hemminger87990462006-08-10 23:35:16 -0700837 if (!sch->q.qlen)
838 goto fin;
Patrick McHardy3bebcda2007-03-23 11:29:25 -0700839 q->now = psched_get_time();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700840
Patrick McHardyfb983d42007-03-16 01:22:39 -0700841 next_event = q->now + 5 * PSCHED_TICKS_PER_SEC;
Jarek Poplawski633fe662008-12-03 21:09:10 -0800842
Linus Torvalds1da177e2005-04-16 15:20:36 -0700843 for (level = 0; level < TC_HTB_MAXDEPTH; level++) {
844 /* common case optimization - skip event handler quickly */
845 int m;
Patrick McHardyfb983d42007-03-16 01:22:39 -0700846 psched_time_t event;
Stephen Hemminger87990462006-08-10 23:35:16 -0700847
Patrick McHardyfb983d42007-03-16 01:22:39 -0700848 if (q->now >= q->near_ev_cache[level]) {
849 event = htb_do_events(q, level);
Patrick McHardy2e4b3b02007-05-23 23:39:54 -0700850 if (!event)
851 event = q->now + PSCHED_TICKS_PER_SEC;
852 q->near_ev_cache[level] = event;
Patrick McHardyfb983d42007-03-16 01:22:39 -0700853 } else
854 event = q->near_ev_cache[level];
855
856 if (event && next_event > event)
857 next_event = event;
858
Linus Torvalds1da177e2005-04-16 15:20:36 -0700859 m = ~q->row_mask[level];
860 while (m != (int)(-1)) {
Stephen Hemminger87990462006-08-10 23:35:16 -0700861 int prio = ffz(m);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700862 m |= 1 << prio;
Stephen Hemminger87990462006-08-10 23:35:16 -0700863 skb = htb_dequeue_tree(q, prio, level);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700864 if (likely(skb != NULL)) {
865 sch->q.qlen--;
866 sch->flags &= ~TCQ_F_THROTTLED;
867 goto fin;
868 }
869 }
870 }
Patrick McHardyfb983d42007-03-16 01:22:39 -0700871 sch->qstats.overlimits++;
872 qdisc_watchdog_schedule(&q->watchdog, next_event);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700873fin:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700874 return skb;
875}
876
877/* try to drop from each class (by prio) until one succeed */
Stephen Hemminger87990462006-08-10 23:35:16 -0700878static unsigned int htb_drop(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700879{
880 struct htb_sched *q = qdisc_priv(sch);
881 int prio;
882
883 for (prio = TC_HTB_NUMPRIO - 1; prio >= 0; prio--) {
884 struct list_head *p;
Stephen Hemminger87990462006-08-10 23:35:16 -0700885 list_for_each(p, q->drops + prio) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700886 struct htb_class *cl = list_entry(p, struct htb_class,
887 un.leaf.drop_list);
888 unsigned int len;
Stephen Hemminger87990462006-08-10 23:35:16 -0700889 if (cl->un.leaf.q->ops->drop &&
890 (len = cl->un.leaf.q->ops->drop(cl->un.leaf.q))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700891 sch->q.qlen--;
892 if (!cl->un.leaf.q->q.qlen)
Stephen Hemminger87990462006-08-10 23:35:16 -0700893 htb_deactivate(q, cl);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700894 return len;
895 }
896 }
897 }
898 return 0;
899}
900
901/* reset all classes */
902/* always caled under BH & queue lock */
Stephen Hemminger87990462006-08-10 23:35:16 -0700903static void htb_reset(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700904{
905 struct htb_sched *q = qdisc_priv(sch);
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -0700906 struct htb_class *cl;
907 struct hlist_node *n;
908 unsigned int i;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700909
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -0700910 for (i = 0; i < q->clhash.hashsize; i++) {
911 hlist_for_each_entry(cl, n, &q->clhash.hash[i], common.hnode) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700912 if (cl->level)
Stephen Hemminger87990462006-08-10 23:35:16 -0700913 memset(&cl->un.inner, 0, sizeof(cl->un.inner));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700914 else {
Stephen Hemminger87990462006-08-10 23:35:16 -0700915 if (cl->un.leaf.q)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700916 qdisc_reset(cl->un.leaf.q);
917 INIT_LIST_HEAD(&cl->un.leaf.drop_list);
918 }
919 cl->prio_activity = 0;
920 cl->cmode = HTB_CAN_SEND;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700921
922 }
923 }
Patrick McHardyfb983d42007-03-16 01:22:39 -0700924 qdisc_watchdog_cancel(&q->watchdog);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700925 __skb_queue_purge(&q->direct_queue);
926 sch->q.qlen = 0;
Stephen Hemminger87990462006-08-10 23:35:16 -0700927 memset(q->row, 0, sizeof(q->row));
928 memset(q->row_mask, 0, sizeof(q->row_mask));
929 memset(q->wait_pq, 0, sizeof(q->wait_pq));
930 memset(q->ptr, 0, sizeof(q->ptr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700931 for (i = 0; i < TC_HTB_NUMPRIO; i++)
Stephen Hemminger87990462006-08-10 23:35:16 -0700932 INIT_LIST_HEAD(q->drops + i);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700933}
934
Patrick McHardy27a34212008-01-23 20:35:39 -0800935static const struct nla_policy htb_policy[TCA_HTB_MAX + 1] = {
936 [TCA_HTB_PARMS] = { .len = sizeof(struct tc_htb_opt) },
937 [TCA_HTB_INIT] = { .len = sizeof(struct tc_htb_glob) },
938 [TCA_HTB_CTAB] = { .type = NLA_BINARY, .len = TC_RTAB_SIZE },
939 [TCA_HTB_RTAB] = { .type = NLA_BINARY, .len = TC_RTAB_SIZE },
940};
941
Patrick McHardy1e904742008-01-22 22:11:17 -0800942static int htb_init(struct Qdisc *sch, struct nlattr *opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700943{
944 struct htb_sched *q = qdisc_priv(sch);
Patrick McHardy1e904742008-01-22 22:11:17 -0800945 struct nlattr *tb[TCA_HTB_INIT + 1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700946 struct tc_htb_glob *gopt;
Patrick McHardycee63722008-01-23 20:33:32 -0800947 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700948 int i;
Patrick McHardycee63722008-01-23 20:33:32 -0800949
950 if (!opt)
951 return -EINVAL;
952
Patrick McHardy27a34212008-01-23 20:35:39 -0800953 err = nla_parse_nested(tb, TCA_HTB_INIT, opt, htb_policy);
Patrick McHardycee63722008-01-23 20:33:32 -0800954 if (err < 0)
955 return err;
956
Patrick McHardy27a34212008-01-23 20:35:39 -0800957 if (tb[TCA_HTB_INIT] == NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700958 printk(KERN_ERR "HTB: hey probably you have bad tc tool ?\n");
959 return -EINVAL;
960 }
Patrick McHardy1e904742008-01-22 22:11:17 -0800961 gopt = nla_data(tb[TCA_HTB_INIT]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700962 if (gopt->version != HTB_VER >> 16) {
Stephen Hemminger87990462006-08-10 23:35:16 -0700963 printk(KERN_ERR
964 "HTB: need tc/htb version %d (minor is %d), you have %d\n",
965 HTB_VER >> 16, HTB_VER & 0xffff, gopt->version);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700966 return -EINVAL;
967 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700968
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -0700969 err = qdisc_class_hash_init(&q->clhash);
970 if (err < 0)
971 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700972 for (i = 0; i < TC_HTB_NUMPRIO; i++)
Stephen Hemminger87990462006-08-10 23:35:16 -0700973 INIT_LIST_HEAD(q->drops + i);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700974
Patrick McHardyfb983d42007-03-16 01:22:39 -0700975 qdisc_watchdog_init(&q->watchdog, sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700976 skb_queue_head_init(&q->direct_queue);
977
David S. Miller5ce2d482008-07-08 17:06:30 -0700978 q->direct_qlen = qdisc_dev(sch)->tx_queue_len;
Stephen Hemminger87990462006-08-10 23:35:16 -0700979 if (q->direct_qlen < 2) /* some devices have zero tx_queue_len */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700980 q->direct_qlen = 2;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700981
Linus Torvalds1da177e2005-04-16 15:20:36 -0700982 if ((q->rate2quantum = gopt->rate2quantum) < 1)
983 q->rate2quantum = 1;
984 q->defcls = gopt->defcls;
985
986 return 0;
987}
988
989static int htb_dump(struct Qdisc *sch, struct sk_buff *skb)
990{
Jarek Poplawski102396a2008-08-29 14:21:52 -0700991 spinlock_t *root_lock = qdisc_root_sleeping_lock(sch);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700992 struct htb_sched *q = qdisc_priv(sch);
Patrick McHardy4b3550ef2008-01-23 20:34:11 -0800993 struct nlattr *nest;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700994 struct tc_htb_glob gopt;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700995
David S. Miller7698b4f2008-07-16 01:42:40 -0700996 spin_lock_bh(root_lock);
Patrick McHardy4b3550ef2008-01-23 20:34:11 -0800997
998 gopt.direct_pkts = q->direct_pkts;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700999 gopt.version = HTB_VER;
1000 gopt.rate2quantum = q->rate2quantum;
1001 gopt.defcls = q->defcls;
Stephen Hemminger3bf72952006-08-10 23:31:08 -07001002 gopt.debug = 0;
Patrick McHardy4b3550ef2008-01-23 20:34:11 -08001003
1004 nest = nla_nest_start(skb, TCA_OPTIONS);
1005 if (nest == NULL)
1006 goto nla_put_failure;
Patrick McHardy1e904742008-01-22 22:11:17 -08001007 NLA_PUT(skb, TCA_HTB_INIT, sizeof(gopt), &gopt);
Patrick McHardy4b3550ef2008-01-23 20:34:11 -08001008 nla_nest_end(skb, nest);
1009
David S. Miller7698b4f2008-07-16 01:42:40 -07001010 spin_unlock_bh(root_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001011 return skb->len;
Patrick McHardy4b3550ef2008-01-23 20:34:11 -08001012
Patrick McHardy1e904742008-01-22 22:11:17 -08001013nla_put_failure:
David S. Miller7698b4f2008-07-16 01:42:40 -07001014 spin_unlock_bh(root_lock);
Patrick McHardy4b3550ef2008-01-23 20:34:11 -08001015 nla_nest_cancel(skb, nest);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001016 return -1;
1017}
1018
1019static int htb_dump_class(struct Qdisc *sch, unsigned long arg,
Stephen Hemminger87990462006-08-10 23:35:16 -07001020 struct sk_buff *skb, struct tcmsg *tcm)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001021{
Stephen Hemminger87990462006-08-10 23:35:16 -07001022 struct htb_class *cl = (struct htb_class *)arg;
Jarek Poplawski102396a2008-08-29 14:21:52 -07001023 spinlock_t *root_lock = qdisc_root_sleeping_lock(sch);
Patrick McHardy4b3550ef2008-01-23 20:34:11 -08001024 struct nlattr *nest;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001025 struct tc_htb_opt opt;
1026
David S. Miller7698b4f2008-07-16 01:42:40 -07001027 spin_lock_bh(root_lock);
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001028 tcm->tcm_parent = cl->parent ? cl->parent->common.classid : TC_H_ROOT;
1029 tcm->tcm_handle = cl->common.classid;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001030 if (!cl->level && cl->un.leaf.q)
1031 tcm->tcm_info = cl->un.leaf.q->handle;
1032
Patrick McHardy4b3550ef2008-01-23 20:34:11 -08001033 nest = nla_nest_start(skb, TCA_OPTIONS);
1034 if (nest == NULL)
1035 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001036
Stephen Hemminger87990462006-08-10 23:35:16 -07001037 memset(&opt, 0, sizeof(opt));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001038
Stephen Hemminger87990462006-08-10 23:35:16 -07001039 opt.rate = cl->rate->rate;
1040 opt.buffer = cl->buffer;
1041 opt.ceil = cl->ceil->rate;
1042 opt.cbuffer = cl->cbuffer;
Jarek Poplawskic19f7a32008-12-03 21:09:45 -08001043 opt.quantum = cl->quantum;
1044 opt.prio = cl->prio;
Stephen Hemminger87990462006-08-10 23:35:16 -07001045 opt.level = cl->level;
Patrick McHardy1e904742008-01-22 22:11:17 -08001046 NLA_PUT(skb, TCA_HTB_PARMS, sizeof(opt), &opt);
Patrick McHardy4b3550ef2008-01-23 20:34:11 -08001047
1048 nla_nest_end(skb, nest);
David S. Miller7698b4f2008-07-16 01:42:40 -07001049 spin_unlock_bh(root_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001050 return skb->len;
Patrick McHardy4b3550ef2008-01-23 20:34:11 -08001051
Patrick McHardy1e904742008-01-22 22:11:17 -08001052nla_put_failure:
David S. Miller7698b4f2008-07-16 01:42:40 -07001053 spin_unlock_bh(root_lock);
Patrick McHardy4b3550ef2008-01-23 20:34:11 -08001054 nla_nest_cancel(skb, nest);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001055 return -1;
1056}
1057
1058static int
Stephen Hemminger87990462006-08-10 23:35:16 -07001059htb_dump_class_stats(struct Qdisc *sch, unsigned long arg, struct gnet_dump *d)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001060{
Stephen Hemminger87990462006-08-10 23:35:16 -07001061 struct htb_class *cl = (struct htb_class *)arg;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001062
Linus Torvalds1da177e2005-04-16 15:20:36 -07001063 if (!cl->level && cl->un.leaf.q)
1064 cl->qstats.qlen = cl->un.leaf.q->q.qlen;
1065 cl->xstats.tokens = cl->tokens;
1066 cl->xstats.ctokens = cl->ctokens;
1067
1068 if (gnet_stats_copy_basic(d, &cl->bstats) < 0 ||
1069 gnet_stats_copy_rate_est(d, &cl->rate_est) < 0 ||
1070 gnet_stats_copy_queue(d, &cl->qstats) < 0)
1071 return -1;
1072
1073 return gnet_stats_copy_app(d, &cl->xstats, sizeof(cl->xstats));
1074}
1075
1076static int htb_graft(struct Qdisc *sch, unsigned long arg, struct Qdisc *new,
Stephen Hemminger87990462006-08-10 23:35:16 -07001077 struct Qdisc **old)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001078{
Stephen Hemminger87990462006-08-10 23:35:16 -07001079 struct htb_class *cl = (struct htb_class *)arg;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001080
1081 if (cl && !cl->level) {
Patrick McHardy9f9afec2006-11-29 17:35:18 -08001082 if (new == NULL &&
David S. Miller5ce2d482008-07-08 17:06:30 -07001083 (new = qdisc_create_dflt(qdisc_dev(sch), sch->dev_queue,
David S. Millerbb949fb2008-07-08 16:55:56 -07001084 &pfifo_qdisc_ops,
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001085 cl->common.classid))
Stephen Hemminger87990462006-08-10 23:35:16 -07001086 == NULL)
1087 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001088 sch_tree_lock(sch);
Patrick McHardyb94c8af2008-11-20 04:11:36 -08001089 *old = cl->un.leaf.q;
1090 cl->un.leaf.q = new;
1091 if (*old != NULL) {
Patrick McHardy256d61b2006-11-29 17:37:05 -08001092 qdisc_tree_decrease_qlen(*old, (*old)->q.qlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001093 qdisc_reset(*old);
1094 }
1095 sch_tree_unlock(sch);
1096 return 0;
1097 }
1098 return -ENOENT;
1099}
1100
Stephen Hemminger87990462006-08-10 23:35:16 -07001101static struct Qdisc *htb_leaf(struct Qdisc *sch, unsigned long arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001102{
Stephen Hemminger87990462006-08-10 23:35:16 -07001103 struct htb_class *cl = (struct htb_class *)arg;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001104 return (cl && !cl->level) ? cl->un.leaf.q : NULL;
1105}
1106
Patrick McHardy256d61b2006-11-29 17:37:05 -08001107static void htb_qlen_notify(struct Qdisc *sch, unsigned long arg)
1108{
1109 struct htb_class *cl = (struct htb_class *)arg;
1110
1111 if (cl->un.leaf.q->q.qlen == 0)
1112 htb_deactivate(qdisc_priv(sch), cl);
1113}
1114
Linus Torvalds1da177e2005-04-16 15:20:36 -07001115static unsigned long htb_get(struct Qdisc *sch, u32 classid)
1116{
Stephen Hemminger87990462006-08-10 23:35:16 -07001117 struct htb_class *cl = htb_find(classid, sch);
1118 if (cl)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001119 cl->refcnt++;
1120 return (unsigned long)cl;
1121}
1122
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001123static inline int htb_parent_last_child(struct htb_class *cl)
1124{
1125 if (!cl->parent)
1126 /* the root class */
1127 return 0;
Patrick McHardy42077592008-07-05 23:22:53 -07001128 if (cl->parent->children > 1)
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001129 /* not the last child */
1130 return 0;
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001131 return 1;
1132}
1133
Jarek Poplawski3ba08b02008-05-03 20:46:29 -07001134static void htb_parent_to_leaf(struct htb_sched *q, struct htb_class *cl,
1135 struct Qdisc *new_q)
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001136{
1137 struct htb_class *parent = cl->parent;
1138
Ilpo Järvinen547b7922008-07-25 21:43:18 -07001139 WARN_ON(cl->level || !cl->un.leaf.q || cl->prio_activity);
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001140
Jarek Poplawski3ba08b02008-05-03 20:46:29 -07001141 if (parent->cmode != HTB_CAN_SEND)
1142 htb_safe_rb_erase(&parent->pq_node, q->wait_pq + parent->level);
1143
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001144 parent->level = 0;
1145 memset(&parent->un.inner, 0, sizeof(parent->un.inner));
1146 INIT_LIST_HEAD(&parent->un.leaf.drop_list);
1147 parent->un.leaf.q = new_q ? new_q : &noop_qdisc;
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001148 parent->tokens = parent->buffer;
1149 parent->ctokens = parent->cbuffer;
Patrick McHardy3bebcda2007-03-23 11:29:25 -07001150 parent->t_c = psched_get_time();
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001151 parent->cmode = HTB_CAN_SEND;
1152}
1153
Stephen Hemminger87990462006-08-10 23:35:16 -07001154static void htb_destroy_class(struct Qdisc *sch, struct htb_class *cl)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001155{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001156 if (!cl->level) {
Ilpo Järvinen547b7922008-07-25 21:43:18 -07001157 WARN_ON(!cl->un.leaf.q);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001158 qdisc_destroy(cl->un.leaf.q);
1159 }
Patrick McHardyee39e102007-07-02 22:48:13 -07001160 gen_kill_estimator(&cl->bstats, &cl->rate_est);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001161 qdisc_put_rtab(cl->rate);
1162 qdisc_put_rtab(cl->ceil);
Stephen Hemminger87990462006-08-10 23:35:16 -07001163
Patrick McHardyff31ab52008-07-01 19:52:38 -07001164 tcf_destroy_chain(&cl->filter_list);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001165 kfree(cl);
1166}
1167
1168/* always caled under BH & queue lock */
Stephen Hemminger87990462006-08-10 23:35:16 -07001169static void htb_destroy(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001170{
1171 struct htb_sched *q = qdisc_priv(sch);
Patrick McHardyfbd8f132008-07-05 23:22:19 -07001172 struct hlist_node *n, *next;
1173 struct htb_class *cl;
1174 unsigned int i;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001175
Patrick McHardyfb983d42007-03-16 01:22:39 -07001176 qdisc_watchdog_cancel(&q->watchdog);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001177 /* This line used to be after htb_destroy_class call below
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +09001178 and surprisingly it worked in 2.4. But it must precede it
Linus Torvalds1da177e2005-04-16 15:20:36 -07001179 because filter need its target class alive to be able to call
1180 unbind_filter on it (without Oops). */
Patrick McHardyff31ab52008-07-01 19:52:38 -07001181 tcf_destroy_chain(&q->filter_list);
Stephen Hemminger87990462006-08-10 23:35:16 -07001182
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001183 for (i = 0; i < q->clhash.hashsize; i++) {
1184 hlist_for_each_entry(cl, n, &q->clhash.hash[i], common.hnode)
Patrick McHardyfbd8f132008-07-05 23:22:19 -07001185 tcf_destroy_chain(&cl->filter_list);
1186 }
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001187 for (i = 0; i < q->clhash.hashsize; i++) {
1188 hlist_for_each_entry_safe(cl, n, next, &q->clhash.hash[i],
1189 common.hnode)
Patrick McHardyfbd8f132008-07-05 23:22:19 -07001190 htb_destroy_class(sch, cl);
1191 }
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001192 qdisc_class_hash_destroy(&q->clhash);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001193 __skb_queue_purge(&q->direct_queue);
1194}
1195
1196static int htb_delete(struct Qdisc *sch, unsigned long arg)
1197{
1198 struct htb_sched *q = qdisc_priv(sch);
Stephen Hemminger87990462006-08-10 23:35:16 -07001199 struct htb_class *cl = (struct htb_class *)arg;
Patrick McHardy256d61b2006-11-29 17:37:05 -08001200 unsigned int qlen;
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001201 struct Qdisc *new_q = NULL;
1202 int last_child = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001203
1204 // TODO: why don't allow to delete subtree ? references ? does
1205 // tc subsys quarantee us that in htb_destroy it holds no class
1206 // refs so that we can remove children safely there ?
Patrick McHardy42077592008-07-05 23:22:53 -07001207 if (cl->children || cl->filter_cnt)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001208 return -EBUSY;
Stephen Hemminger87990462006-08-10 23:35:16 -07001209
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001210 if (!cl->level && htb_parent_last_child(cl)) {
David S. Miller5ce2d482008-07-08 17:06:30 -07001211 new_q = qdisc_create_dflt(qdisc_dev(sch), sch->dev_queue,
David S. Millerbb949fb2008-07-08 16:55:56 -07001212 &pfifo_qdisc_ops,
1213 cl->parent->common.classid);
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001214 last_child = 1;
1215 }
1216
Linus Torvalds1da177e2005-04-16 15:20:36 -07001217 sch_tree_lock(sch);
Stephen Hemminger87990462006-08-10 23:35:16 -07001218
Patrick McHardy814a175e2006-11-29 17:34:50 -08001219 if (!cl->level) {
Patrick McHardy256d61b2006-11-29 17:37:05 -08001220 qlen = cl->un.leaf.q->q.qlen;
Patrick McHardy814a175e2006-11-29 17:34:50 -08001221 qdisc_reset(cl->un.leaf.q);
Patrick McHardy256d61b2006-11-29 17:37:05 -08001222 qdisc_tree_decrease_qlen(cl->un.leaf.q, qlen);
Patrick McHardy814a175e2006-11-29 17:34:50 -08001223 }
1224
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001225 /* delete from hash and active; remainder in destroy_class */
1226 qdisc_class_hash_remove(&q->clhash, &cl->common);
Jarek Poplawski26b284d2008-08-13 15:16:43 -07001227 if (cl->parent)
1228 cl->parent->children--;
Patrick McHardyc38c83c2007-03-27 14:04:24 -07001229
Linus Torvalds1da177e2005-04-16 15:20:36 -07001230 if (cl->prio_activity)
Stephen Hemminger87990462006-08-10 23:35:16 -07001231 htb_deactivate(q, cl);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001232
Patrick McHardyfbd8f132008-07-05 23:22:19 -07001233 if (cl->cmode != HTB_CAN_SEND)
1234 htb_safe_rb_erase(&cl->pq_node, q->wait_pq + cl->level);
1235
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001236 if (last_child)
Jarek Poplawski3ba08b02008-05-03 20:46:29 -07001237 htb_parent_to_leaf(q, cl, new_q);
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001238
Linus Torvalds1da177e2005-04-16 15:20:36 -07001239 if (--cl->refcnt == 0)
Stephen Hemminger87990462006-08-10 23:35:16 -07001240 htb_destroy_class(sch, cl);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001241
1242 sch_tree_unlock(sch);
1243 return 0;
1244}
1245
1246static void htb_put(struct Qdisc *sch, unsigned long arg)
1247{
Stephen Hemminger87990462006-08-10 23:35:16 -07001248 struct htb_class *cl = (struct htb_class *)arg;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001249
1250 if (--cl->refcnt == 0)
Stephen Hemminger87990462006-08-10 23:35:16 -07001251 htb_destroy_class(sch, cl);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001252}
1253
Stephen Hemminger87990462006-08-10 23:35:16 -07001254static int htb_change_class(struct Qdisc *sch, u32 classid,
Patrick McHardy1e904742008-01-22 22:11:17 -08001255 u32 parentid, struct nlattr **tca,
Stephen Hemminger87990462006-08-10 23:35:16 -07001256 unsigned long *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001257{
1258 int err = -EINVAL;
1259 struct htb_sched *q = qdisc_priv(sch);
Stephen Hemminger87990462006-08-10 23:35:16 -07001260 struct htb_class *cl = (struct htb_class *)*arg, *parent;
Patrick McHardy1e904742008-01-22 22:11:17 -08001261 struct nlattr *opt = tca[TCA_OPTIONS];
Linus Torvalds1da177e2005-04-16 15:20:36 -07001262 struct qdisc_rate_table *rtab = NULL, *ctab = NULL;
Patrick McHardy1e904742008-01-22 22:11:17 -08001263 struct nlattr *tb[TCA_HTB_RTAB + 1];
Linus Torvalds1da177e2005-04-16 15:20:36 -07001264 struct tc_htb_opt *hopt;
1265
1266 /* extract all subattrs from opt attr */
Patrick McHardycee63722008-01-23 20:33:32 -08001267 if (!opt)
1268 goto failure;
1269
Patrick McHardy27a34212008-01-23 20:35:39 -08001270 err = nla_parse_nested(tb, TCA_HTB_RTAB, opt, htb_policy);
Patrick McHardycee63722008-01-23 20:33:32 -08001271 if (err < 0)
1272 goto failure;
1273
1274 err = -EINVAL;
Patrick McHardy27a34212008-01-23 20:35:39 -08001275 if (tb[TCA_HTB_PARMS] == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001276 goto failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001277
Stephen Hemminger87990462006-08-10 23:35:16 -07001278 parent = parentid == TC_H_ROOT ? NULL : htb_find(parentid, sch);
Stephen Hemminger3bf72952006-08-10 23:31:08 -07001279
Patrick McHardy1e904742008-01-22 22:11:17 -08001280 hopt = nla_data(tb[TCA_HTB_PARMS]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001281
Patrick McHardy1e904742008-01-22 22:11:17 -08001282 rtab = qdisc_get_rtab(&hopt->rate, tb[TCA_HTB_RTAB]);
1283 ctab = qdisc_get_rtab(&hopt->ceil, tb[TCA_HTB_CTAB]);
Stephen Hemminger87990462006-08-10 23:35:16 -07001284 if (!rtab || !ctab)
1285 goto failure;
1286
1287 if (!cl) { /* new class */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001288 struct Qdisc *new_q;
Stephen Hemminger3696f622006-08-10 23:36:01 -07001289 int prio;
Patrick McHardyee39e102007-07-02 22:48:13 -07001290 struct {
Patrick McHardy1e904742008-01-22 22:11:17 -08001291 struct nlattr nla;
Patrick McHardyee39e102007-07-02 22:48:13 -07001292 struct gnet_estimator opt;
1293 } est = {
Patrick McHardy1e904742008-01-22 22:11:17 -08001294 .nla = {
1295 .nla_len = nla_attr_size(sizeof(est.opt)),
1296 .nla_type = TCA_RATE,
Patrick McHardyee39e102007-07-02 22:48:13 -07001297 },
1298 .opt = {
1299 /* 4s interval, 16s averaging constant */
1300 .interval = 2,
1301 .ewma_log = 2,
1302 },
1303 };
Stephen Hemminger3696f622006-08-10 23:36:01 -07001304
Linus Torvalds1da177e2005-04-16 15:20:36 -07001305 /* check for valid classid */
Stephen Hemminger87990462006-08-10 23:35:16 -07001306 if (!classid || TC_H_MAJ(classid ^ sch->handle)
1307 || htb_find(classid, sch))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001308 goto failure;
1309
1310 /* check maximal depth */
1311 if (parent && parent->parent && parent->parent->level < 2) {
1312 printk(KERN_ERR "htb: tree is too deep\n");
1313 goto failure;
1314 }
1315 err = -ENOBUFS;
Panagiotis Issaris0da974f2006-07-21 14:51:30 -07001316 if ((cl = kzalloc(sizeof(*cl), GFP_KERNEL)) == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001317 goto failure;
Stephen Hemminger87990462006-08-10 23:35:16 -07001318
Stephen Hemminger71bcb092008-11-25 21:13:31 -08001319 err = gen_new_estimator(&cl->bstats, &cl->rate_est,
1320 qdisc_root_sleeping_lock(sch),
1321 tca[TCA_RATE] ? : &est.nla);
1322 if (err) {
1323 kfree(cl);
1324 goto failure;
1325 }
1326
Linus Torvalds1da177e2005-04-16 15:20:36 -07001327 cl->refcnt = 1;
Patrick McHardy42077592008-07-05 23:22:53 -07001328 cl->children = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001329 INIT_LIST_HEAD(&cl->un.leaf.drop_list);
Stephen Hemminger3696f622006-08-10 23:36:01 -07001330 RB_CLEAR_NODE(&cl->pq_node);
1331
1332 for (prio = 0; prio < TC_HTB_NUMPRIO; prio++)
1333 RB_CLEAR_NODE(&cl->node[prio]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001334
1335 /* create leaf qdisc early because it uses kmalloc(GFP_KERNEL)
1336 so that can't be used inside of sch_tree_lock
1337 -- thanks to Karlis Peisenieks */
David S. Miller5ce2d482008-07-08 17:06:30 -07001338 new_q = qdisc_create_dflt(qdisc_dev(sch), sch->dev_queue,
David S. Millerbb949fb2008-07-08 16:55:56 -07001339 &pfifo_qdisc_ops, classid);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001340 sch_tree_lock(sch);
1341 if (parent && !parent->level) {
Patrick McHardy256d61b2006-11-29 17:37:05 -08001342 unsigned int qlen = parent->un.leaf.q->q.qlen;
1343
Linus Torvalds1da177e2005-04-16 15:20:36 -07001344 /* turn parent into inner node */
Patrick McHardy256d61b2006-11-29 17:37:05 -08001345 qdisc_reset(parent->un.leaf.q);
1346 qdisc_tree_decrease_qlen(parent->un.leaf.q, qlen);
Stephen Hemminger87990462006-08-10 23:35:16 -07001347 qdisc_destroy(parent->un.leaf.q);
1348 if (parent->prio_activity)
1349 htb_deactivate(q, parent);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001350
1351 /* remove from evt list because of level change */
1352 if (parent->cmode != HTB_CAN_SEND) {
Stephen Hemminger3696f622006-08-10 23:36:01 -07001353 htb_safe_rb_erase(&parent->pq_node, q->wait_pq);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001354 parent->cmode = HTB_CAN_SEND;
1355 }
1356 parent->level = (parent->parent ? parent->parent->level
Stephen Hemminger87990462006-08-10 23:35:16 -07001357 : TC_HTB_MAXDEPTH) - 1;
1358 memset(&parent->un.inner, 0, sizeof(parent->un.inner));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001359 }
1360 /* leaf (we) needs elementary qdisc */
1361 cl->un.leaf.q = new_q ? new_q : &noop_qdisc;
1362
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001363 cl->common.classid = classid;
Stephen Hemminger87990462006-08-10 23:35:16 -07001364 cl->parent = parent;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001365
1366 /* set class to be in HTB_CAN_SEND state */
1367 cl->tokens = hopt->buffer;
1368 cl->ctokens = hopt->cbuffer;
Patrick McHardy00c04af2007-03-16 01:23:02 -07001369 cl->mbuffer = 60 * PSCHED_TICKS_PER_SEC; /* 1min */
Patrick McHardy3bebcda2007-03-23 11:29:25 -07001370 cl->t_c = psched_get_time();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001371 cl->cmode = HTB_CAN_SEND;
1372
1373 /* attach to the hash list and parent's family */
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001374 qdisc_class_hash_insert(&q->clhash, &cl->common);
Patrick McHardy42077592008-07-05 23:22:53 -07001375 if (parent)
1376 parent->children++;
Patrick McHardyee39e102007-07-02 22:48:13 -07001377 } else {
Stephen Hemminger71bcb092008-11-25 21:13:31 -08001378 if (tca[TCA_RATE]) {
1379 err = gen_replace_estimator(&cl->bstats, &cl->rate_est,
1380 qdisc_root_sleeping_lock(sch),
1381 tca[TCA_RATE]);
1382 if (err)
1383 return err;
1384 }
Stephen Hemminger87990462006-08-10 23:35:16 -07001385 sch_tree_lock(sch);
Patrick McHardyee39e102007-07-02 22:48:13 -07001386 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001387
1388 /* it used to be a nasty bug here, we have to check that node
Stephen Hemminger87990462006-08-10 23:35:16 -07001389 is really leaf before changing cl->un.leaf ! */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001390 if (!cl->level) {
Jarek Poplawskic19f7a32008-12-03 21:09:45 -08001391 cl->quantum = rtab->rate.rate / q->rate2quantum;
1392 if (!hopt->quantum && cl->quantum < 1000) {
Stephen Hemminger87990462006-08-10 23:35:16 -07001393 printk(KERN_WARNING
1394 "HTB: quantum of class %X is small. Consider r2q change.\n",
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001395 cl->common.classid);
Jarek Poplawskic19f7a32008-12-03 21:09:45 -08001396 cl->quantum = 1000;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001397 }
Jarek Poplawskic19f7a32008-12-03 21:09:45 -08001398 if (!hopt->quantum && cl->quantum > 200000) {
Stephen Hemminger87990462006-08-10 23:35:16 -07001399 printk(KERN_WARNING
1400 "HTB: quantum of class %X is big. Consider r2q change.\n",
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001401 cl->common.classid);
Jarek Poplawskic19f7a32008-12-03 21:09:45 -08001402 cl->quantum = 200000;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001403 }
1404 if (hopt->quantum)
Jarek Poplawskic19f7a32008-12-03 21:09:45 -08001405 cl->quantum = hopt->quantum;
1406 if ((cl->prio = hopt->prio) >= TC_HTB_NUMPRIO)
1407 cl->prio = TC_HTB_NUMPRIO - 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001408 }
1409
1410 cl->buffer = hopt->buffer;
1411 cl->cbuffer = hopt->cbuffer;
Stephen Hemminger87990462006-08-10 23:35:16 -07001412 if (cl->rate)
1413 qdisc_put_rtab(cl->rate);
1414 cl->rate = rtab;
1415 if (cl->ceil)
1416 qdisc_put_rtab(cl->ceil);
1417 cl->ceil = ctab;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001418 sch_tree_unlock(sch);
1419
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001420 qdisc_class_hash_grow(sch, &q->clhash);
1421
Linus Torvalds1da177e2005-04-16 15:20:36 -07001422 *arg = (unsigned long)cl;
1423 return 0;
1424
1425failure:
Stephen Hemminger87990462006-08-10 23:35:16 -07001426 if (rtab)
1427 qdisc_put_rtab(rtab);
1428 if (ctab)
1429 qdisc_put_rtab(ctab);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001430 return err;
1431}
1432
1433static struct tcf_proto **htb_find_tcf(struct Qdisc *sch, unsigned long arg)
1434{
1435 struct htb_sched *q = qdisc_priv(sch);
1436 struct htb_class *cl = (struct htb_class *)arg;
1437 struct tcf_proto **fl = cl ? &cl->filter_list : &q->filter_list;
Stephen Hemminger3bf72952006-08-10 23:31:08 -07001438
Linus Torvalds1da177e2005-04-16 15:20:36 -07001439 return fl;
1440}
1441
1442static unsigned long htb_bind_filter(struct Qdisc *sch, unsigned long parent,
Stephen Hemminger87990462006-08-10 23:35:16 -07001443 u32 classid)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001444{
Stephen Hemminger87990462006-08-10 23:35:16 -07001445 struct htb_class *cl = htb_find(classid, sch);
Stephen Hemminger3bf72952006-08-10 23:31:08 -07001446
Linus Torvalds1da177e2005-04-16 15:20:36 -07001447 /*if (cl && !cl->level) return 0;
Stephen Hemminger87990462006-08-10 23:35:16 -07001448 The line above used to be there to prevent attaching filters to
1449 leaves. But at least tc_index filter uses this just to get class
1450 for other reasons so that we have to allow for it.
1451 ----
1452 19.6.2002 As Werner explained it is ok - bind filter is just
1453 another way to "lock" the class - unlike "get" this lock can
1454 be broken by class during destroy IIUC.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001455 */
Stephen Hemminger87990462006-08-10 23:35:16 -07001456 if (cl)
1457 cl->filter_cnt++;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001458 return (unsigned long)cl;
1459}
1460
1461static void htb_unbind_filter(struct Qdisc *sch, unsigned long arg)
1462{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001463 struct htb_class *cl = (struct htb_class *)arg;
Stephen Hemminger3bf72952006-08-10 23:31:08 -07001464
Stephen Hemminger87990462006-08-10 23:35:16 -07001465 if (cl)
1466 cl->filter_cnt--;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001467}
1468
1469static void htb_walk(struct Qdisc *sch, struct qdisc_walker *arg)
1470{
1471 struct htb_sched *q = qdisc_priv(sch);
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001472 struct htb_class *cl;
1473 struct hlist_node *n;
1474 unsigned int i;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001475
1476 if (arg->stop)
1477 return;
1478
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001479 for (i = 0; i < q->clhash.hashsize; i++) {
1480 hlist_for_each_entry(cl, n, &q->clhash.hash[i], common.hnode) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001481 if (arg->count < arg->skip) {
1482 arg->count++;
1483 continue;
1484 }
1485 if (arg->fn(sch, (unsigned long)cl, arg) < 0) {
1486 arg->stop = 1;
1487 return;
1488 }
1489 arg->count++;
1490 }
1491 }
1492}
1493
Eric Dumazet20fea082007-11-14 01:44:41 -08001494static const struct Qdisc_class_ops htb_class_ops = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001495 .graft = htb_graft,
1496 .leaf = htb_leaf,
Patrick McHardy256d61b2006-11-29 17:37:05 -08001497 .qlen_notify = htb_qlen_notify,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001498 .get = htb_get,
1499 .put = htb_put,
1500 .change = htb_change_class,
1501 .delete = htb_delete,
1502 .walk = htb_walk,
1503 .tcf_chain = htb_find_tcf,
1504 .bind_tcf = htb_bind_filter,
1505 .unbind_tcf = htb_unbind_filter,
1506 .dump = htb_dump_class,
1507 .dump_stats = htb_dump_class_stats,
1508};
1509
Eric Dumazet20fea082007-11-14 01:44:41 -08001510static struct Qdisc_ops htb_qdisc_ops __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001511 .next = NULL,
1512 .cl_ops = &htb_class_ops,
1513 .id = "htb",
1514 .priv_size = sizeof(struct htb_sched),
1515 .enqueue = htb_enqueue,
1516 .dequeue = htb_dequeue,
Jarek Poplawski77be1552008-10-31 00:47:01 -07001517 .peek = qdisc_peek_dequeued,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001518 .drop = htb_drop,
1519 .init = htb_init,
1520 .reset = htb_reset,
1521 .destroy = htb_destroy,
1522 .change = NULL /* htb_change */,
1523 .dump = htb_dump,
1524 .owner = THIS_MODULE,
1525};
1526
1527static int __init htb_module_init(void)
1528{
Stephen Hemminger87990462006-08-10 23:35:16 -07001529 return register_qdisc(&htb_qdisc_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001530}
Stephen Hemminger87990462006-08-10 23:35:16 -07001531static void __exit htb_module_exit(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001532{
Stephen Hemminger87990462006-08-10 23:35:16 -07001533 unregister_qdisc(&htb_qdisc_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001534}
Stephen Hemminger87990462006-08-10 23:35:16 -07001535
Linus Torvalds1da177e2005-04-16 15:20:36 -07001536module_init(htb_module_init)
1537module_exit(htb_module_exit)
1538MODULE_LICENSE("GPL");