/*
 * net/sched/sch_htb.c	Hierarchical token bucket, feed tree version
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 *
 * Authors:	Martin Devera, <devik@cdi.cz>
 *
 * Credits (in time order) for older HTB versions:
 *		Stef Coene <stef.coene@docum.org>
 *			HTB support at LARTC mailing list
 *		Ondrej Kraus, <krauso@barr.cz>
 *			found missing INIT_QDISC(htb)
 *		Vladimir Smelhaus, Aamer Akhter, Bert Hubert
 *			helped a lot to locate nasty class stall bug
 *		Andi Kleen, Jamal Hadi, Bert Hubert
 *			code review and helpful comments on shaping
 *		Tomasz Wrona, <tw@eter.tym.pl>
 *			created test case so that I was able to fix nasty bug
 *		Wilfried Weissmann
 *			spotted bug in dequeue code and helped with fix
 *		Jiri Fojtasek
 *			fixed requeue routine
 *		and many others. thanks.
 */
#include <linux/module.h>
#include <linux/moduleparam.h>
#include <linux/types.h>
#include <linux/kernel.h>
#include <linux/string.h>
#include <linux/errno.h>
#include <linux/skbuff.h>
#include <linux/list.h>
#include <linux/compiler.h>
#include <linux/rbtree.h>
#include <net/netlink.h>
#include <net/pkt_sched.h>

/* HTB algorithm.
 Author: devik@cdi.cz
 ========================================================================
 HTB is like TBF with multiple classes. It is also similar to CBQ because
 it allows assigning a priority to each class in the hierarchy.
 In fact it is another implementation of Floyd's formal sharing.

 Levels:
 Each class is assigned a level. A leaf ALWAYS has level 0, root
 classes have level TC_HTB_MAXDEPTH-1, and interior nodes have a level
 one less than their parent.
*/
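/* Illustrative sketch (added commentary, not part of the original text):
 with TC_HTB_MAXDEPTH assumed to be 8 as in pkt_sched.h, a hierarchy such
 as

	1:1 (root, level 7) -> 1:10 (interior, level 6) -> 1:100 (leaf, level 0)

 keeps packets only in leaves; interior classes exist purely so that
 their children can borrow unused rate from them.
*/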

static int htb_hysteresis __read_mostly = 0; /* whether to use mode hysteresis for speedup */
#define HTB_VER 0x30011		/* major must be matched with number supplied by TC as version */

#if HTB_VER >> 16 != TC_HTB_PROTOVER
#error "Mismatched sch_htb.c and pkt_sch.h"
#endif

/* Module parameter and sysfs export */
module_param(htb_hysteresis, int, 0640);
MODULE_PARM_DESC(htb_hysteresis, "Hysteresis mode, less CPU load, less accurate");
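/* Note (added, illustrative): because module_param() above uses mode 0640,
 * the knob can be set at load time ("modprobe sch_htb htb_hysteresis=1")
 * or flipped at runtime via /sys/module/sch_htb/parameters/htb_hysteresis.
 */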

/* used internally to keep the status of a single class */
enum htb_cmode {
	HTB_CANT_SEND,		/* class can't send and can't borrow */
	HTB_MAY_BORROW,		/* class can't send but may borrow */
	HTB_CAN_SEND		/* class can send */
};

/* interior & leaf nodes; props specific to leaves are marked L: */
struct htb_class {
	struct Qdisc_class_common common;
	/* general class parameters */
	struct gnet_stats_basic bstats;
	struct gnet_stats_queue qstats;
	struct gnet_stats_rate_est rate_est;
	struct tc_htb_xstats xstats;	/* our special stats */
	int refcnt;		/* usage count of this class */

	/* topology */
	int level;		/* our level (see above) */
	unsigned int children;
	struct htb_class *parent;	/* parent class */

	int prio;		/* these two are used only by leaves... */
	int quantum;		/* but stored for parent-to-leaf return */

	union {
		struct htb_class_leaf {
			struct Qdisc *q;
			int deficit[TC_HTB_MAXDEPTH];
			struct list_head drop_list;
		} leaf;
		struct htb_class_inner {
			struct rb_root feed[TC_HTB_NUMPRIO];	/* feed trees */
			struct rb_node *ptr[TC_HTB_NUMPRIO];	/* current class ptr */
			/* When a class changes from state 1->2 and disconnects
			   from its parent's feed, we lose the ptr value and
			   have to start from the first child again. Here we
			   store the classid of the last valid ptr (used when
			   ptr is NULL). */
			u32 last_ptr_id[TC_HTB_NUMPRIO];
		} inner;
	} un;
	struct rb_node node[TC_HTB_NUMPRIO];	/* node for self or feed tree */
	struct rb_node pq_node;	/* node for event queue */
	psched_time_t pq_key;

	int prio_activity;	/* for which prios are we active */
	enum htb_cmode cmode;	/* current mode of the class */

	/* class attached filters */
	struct tcf_proto *filter_list;
	int filter_cnt;

	/* token bucket parameters */
	struct qdisc_rate_table *rate;	/* rate table of the class itself */
	struct qdisc_rate_table *ceil;	/* ceiling rate (limits borrows too) */
	long buffer, cbuffer;	/* token bucket depth/rate */
	psched_tdiff_t mbuffer;	/* max wait time */
	long tokens, ctokens;	/* current number of tokens */
	psched_time_t t_c;	/* checkpoint time */
};

struct htb_sched {
	struct Qdisc_class_hash clhash;
	struct list_head drops[TC_HTB_NUMPRIO];/* active leaves (for drops) */

	/* self list - roots of self generating tree */
	struct rb_root row[TC_HTB_MAXDEPTH][TC_HTB_NUMPRIO];
	int row_mask[TC_HTB_MAXDEPTH];
	struct rb_node *ptr[TC_HTB_MAXDEPTH][TC_HTB_NUMPRIO];
	u32 last_ptr_id[TC_HTB_MAXDEPTH][TC_HTB_NUMPRIO];

	/* self wait list - roots of wait PQs per row */
	struct rb_root wait_pq[TC_HTB_MAXDEPTH];

	/* time of nearest event per level (row) */
	psched_time_t near_ev_cache[TC_HTB_MAXDEPTH];

	int defcls;		/* class where unclassified flows go to */

	/* filters for qdisc itself */
	struct tcf_proto *filter_list;

	int rate2quantum;	/* quant = rate / rate2quantum */
	psched_time_t now;	/* cached dequeue time */
	struct qdisc_watchdog watchdog;

	/* non shaped skbs; let them go directly thru */
	struct sk_buff_head direct_queue;
	int direct_qlen;	/* max qlen of above */

	long direct_pkts;
};

/* find class in global hash table using given handle */
static inline struct htb_class *htb_find(u32 handle, struct Qdisc *sch)
{
	struct htb_sched *q = qdisc_priv(sch);
	struct Qdisc_class_common *clc;

	clc = qdisc_class_find(&q->clhash, handle);
	if (clc == NULL)
		return NULL;
	return container_of(clc, struct htb_class, common);
}

/**
 * htb_classify - classify a packet into class
 *
 * It returns NULL if the packet should be dropped or -1 if the packet
 * should be passed directly through. In all other cases a leaf class is
 * returned. We allow direct class selection by classid in skb->priority.
 * Then we examine filters in the qdisc and in inner nodes (if a higher
 * filter points to the inner node). If we end up with classid MAJOR:0
 * we enqueue the skb into the special internal fifo (direct). These
 * packets then go directly through. If we still have no valid leaf we
 * try to use the MAJOR:default leaf. If that is still unsuccessful we
 * finish and return the direct queue.
 */
#define HTB_DIRECT ((struct htb_class *)-1)

static struct htb_class *htb_classify(struct sk_buff *skb, struct Qdisc *sch,
				      int *qerr)
{
	struct htb_sched *q = qdisc_priv(sch);
	struct htb_class *cl;
	struct tcf_result res;
	struct tcf_proto *tcf;
	int result;

	/* allow selecting a class by setting skb->priority to a valid classid;
	   note that nfmark can be used too by attaching filter fw with no
	   rules in it */
	if (skb->priority == sch->handle)
		return HTB_DIRECT;	/* X:0 (direct flow) selected */
	if ((cl = htb_find(skb->priority, sch)) != NULL && cl->level == 0)
		return cl;

	*qerr = NET_XMIT_SUCCESS | __NET_XMIT_BYPASS;
	tcf = q->filter_list;
	while (tcf && (result = tc_classify(skb, tcf, &res)) >= 0) {
#ifdef CONFIG_NET_CLS_ACT
		switch (result) {
		case TC_ACT_QUEUED:
		case TC_ACT_STOLEN:
			*qerr = NET_XMIT_SUCCESS | __NET_XMIT_STOLEN;
		case TC_ACT_SHOT:
			return NULL;
		}
#endif
		if ((cl = (void *)res.class) == NULL) {
			if (res.classid == sch->handle)
				return HTB_DIRECT;	/* X:0 (direct flow) */
			if ((cl = htb_find(res.classid, sch)) == NULL)
				break;	/* filter selected invalid classid */
		}
		if (!cl->level)
			return cl;	/* we hit leaf; return it */

		/* we have got inner class; apply inner filter chain */
		tcf = cl->filter_list;
	}
	/* classification failed; try to use default class */
	cl = htb_find(TC_H_MAKE(TC_H_MAJ(sch->handle), q->defcls), sch);
	if (!cl || cl->level)
		return HTB_DIRECT;	/* bad default .. this is a safe bet */
	return cl;
}
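/* Usage sketch (added, illustrative): the skb->priority shortcut above can
 * be exercised from user space without any tc filter, e.g.
 *
 *	int prio = 0x10010;	// tc notation 1:10, assuming such a leaf exists
 *	setsockopt(fd, SOL_SOCKET, SO_PRIORITY, &prio, sizeof(prio));
 *
 * htb_find() then resolves the classid directly and tc_classify() is
 * never consulted for those packets.
 */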

/**
 * htb_add_to_id_tree - adds class to the round robin list
 *
 * Routine adds class to the list (actually tree) sorted by classid.
 * Make sure that class is not already on such list for given prio.
 */
static void htb_add_to_id_tree(struct rb_root *root,
			       struct htb_class *cl, int prio)
{
	struct rb_node **p = &root->rb_node, *parent = NULL;

	while (*p) {
		struct htb_class *c;
		parent = *p;
		c = rb_entry(parent, struct htb_class, node[prio]);

		if (cl->common.classid > c->common.classid)
			p = &parent->rb_right;
		else
			p = &parent->rb_left;
	}
	rb_link_node(&cl->node[prio], parent, p);
	rb_insert_color(&cl->node[prio], root);
}

/**
 * htb_add_to_wait_tree - adds class to the event queue with delay
 *
 * The class is added to priority event queue to indicate that class will
 * change its mode in cl->pq_key microseconds. Make sure that class is not
 * already in the queue.
 */
static void htb_add_to_wait_tree(struct htb_sched *q,
				 struct htb_class *cl, long delay)
{
	struct rb_node **p = &q->wait_pq[cl->level].rb_node, *parent = NULL;

	cl->pq_key = q->now + delay;
	if (cl->pq_key == q->now)
		cl->pq_key++;

	/* update the nearest event cache */
	if (q->near_ev_cache[cl->level] > cl->pq_key)
		q->near_ev_cache[cl->level] = cl->pq_key;

	while (*p) {
		struct htb_class *c;
		parent = *p;
		c = rb_entry(parent, struct htb_class, pq_node);
		if (cl->pq_key >= c->pq_key)
			p = &parent->rb_right;
		else
			p = &parent->rb_left;
	}
	rb_link_node(&cl->pq_node, parent, p);
	rb_insert_color(&cl->pq_node, &q->wait_pq[cl->level]);
}

/**
 * htb_next_rb_node - finds next node in binary tree
 *
 * When we are past last key we return NULL.
 * Average complexity is 2 steps per call.
 */
static inline void htb_next_rb_node(struct rb_node **n)
{
	*n = rb_next(*n);
}

/**
 * htb_add_class_to_row - add class to its row
 *
 * The class is added to row at priorities marked in mask.
 * It does nothing if mask == 0.
 */
static inline void htb_add_class_to_row(struct htb_sched *q,
					struct htb_class *cl, int mask)
{
	q->row_mask[cl->level] |= mask;
	while (mask) {
		int prio = ffz(~mask);
		mask &= ~(1 << prio);
		htb_add_to_id_tree(q->row[cl->level] + prio, cl, prio);
	}
}

/* If this triggers, it is a bug in this code, but it need not be fatal */
static void htb_safe_rb_erase(struct rb_node *rb, struct rb_root *root)
{
	if (RB_EMPTY_NODE(rb)) {
		WARN_ON(1);
	} else {
		rb_erase(rb, root);
		RB_CLEAR_NODE(rb);
	}
}

/**
 * htb_remove_class_from_row - removes class from its row
 *
 * The class is removed from row at priorities marked in mask.
 * It does nothing if mask == 0.
 */
static inline void htb_remove_class_from_row(struct htb_sched *q,
					     struct htb_class *cl, int mask)
{
	int m = 0;

	while (mask) {
		int prio = ffz(~mask);

		mask &= ~(1 << prio);
		if (q->ptr[cl->level][prio] == cl->node + prio)
			htb_next_rb_node(q->ptr[cl->level] + prio);

		htb_safe_rb_erase(cl->node + prio, q->row[cl->level] + prio);
		if (!q->row[cl->level][prio].rb_node)
			m |= 1 << prio;
	}
	q->row_mask[cl->level] &= ~m;
}

/**
 * htb_activate_prios - creates active class's feed chain
 *
 * The class is connected to ancestors and/or appropriate rows
 * for priorities it is participating in. cl->cmode must be the new
 * (activated) mode. It does nothing if cl->prio_activity == 0.
 */
static void htb_activate_prios(struct htb_sched *q, struct htb_class *cl)
{
	struct htb_class *p = cl->parent;
	long m, mask = cl->prio_activity;

	while (cl->cmode == HTB_MAY_BORROW && p && mask) {
		m = mask;
		while (m) {
			int prio = ffz(~m);
			m &= ~(1 << prio);

			if (p->un.inner.feed[prio].rb_node)
				/* parent already has its feed in use so
				   reset the bit in mask as parent is
				   already ok */
				mask &= ~(1 << prio);

			htb_add_to_id_tree(p->un.inner.feed + prio, cl, prio);
		}
		p->prio_activity |= mask;
		cl = p;
		p = cl->parent;

	}
	if (cl->cmode == HTB_CAN_SEND && mask)
		htb_add_class_to_row(q, cl, mask);
}

/**
 * htb_deactivate_prios - remove class from feed chain
 *
 * cl->cmode must represent the old mode (before deactivation). It does
 * nothing if cl->prio_activity == 0. Class is removed from all feed
 * chains and rows.
 */
static void htb_deactivate_prios(struct htb_sched *q, struct htb_class *cl)
{
	struct htb_class *p = cl->parent;
	long m, mask = cl->prio_activity;

	while (cl->cmode == HTB_MAY_BORROW && p && mask) {
		m = mask;
		mask = 0;
		while (m) {
			int prio = ffz(~m);
			m &= ~(1 << prio);

			if (p->un.inner.ptr[prio] == cl->node + prio) {
				/* we are removing a child which the parent
				   feed points to - forget the pointer but
				   remember the classid */
				p->un.inner.last_ptr_id[prio] = cl->common.classid;
				p->un.inner.ptr[prio] = NULL;
			}

			htb_safe_rb_erase(cl->node + prio, p->un.inner.feed + prio);

			if (!p->un.inner.feed[prio].rb_node)
				mask |= 1 << prio;
		}

		p->prio_activity &= ~mask;
		cl = p;
		p = cl->parent;

	}
	if (cl->cmode == HTB_CAN_SEND && mask)
		htb_remove_class_from_row(q, cl, mask);
}

static inline long htb_lowater(const struct htb_class *cl)
{
	if (htb_hysteresis)
		return cl->cmode != HTB_CANT_SEND ? -cl->cbuffer : 0;
	else
		return 0;
}

static inline long htb_hiwater(const struct htb_class *cl)
{
	if (htb_hysteresis)
		return cl->cmode == HTB_CAN_SEND ? -cl->buffer : 0;
	else
		return 0;
}

/**
 * htb_class_mode - computes and returns current class mode
 *
 * It computes cl's mode at time cl->t_c+diff and returns it. If mode
 * is not HTB_CAN_SEND then cl->pq_key is updated to the time difference
 * from now to the time when cl will change its state.
 * It is also worth noting that class mode doesn't change simply
 * at cl->{c,}tokens == 0; rather there can be hysteresis in the
 * 0 .. -cl->{c,}buffer range. It is meant to limit the number of
 * mode transitions per time unit. The speed gain is about 1/6.
 */
static inline enum htb_cmode
htb_class_mode(struct htb_class *cl, long *diff)
{
	long toks;

	if ((toks = (cl->ctokens + *diff)) < htb_lowater(cl)) {
		*diff = -toks;
		return HTB_CANT_SEND;
	}

	if ((toks = (cl->tokens + *diff)) >= htb_hiwater(cl))
		return HTB_CAN_SEND;

	*diff = -toks;
	return HTB_MAY_BORROW;
}
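/* Worked example (added, illustrative): take a class currently in
 * HTB_CAN_SEND with buffer == 2000, ample ctokens, tokens == -500 and
 * *diff == 100. With htb_hysteresis enabled, htb_hiwater() returns
 * -buffer == -2000, so tokens + *diff == -400 still qualifies as
 * HTB_CAN_SEND; with hysteresis off, hiwater is 0 and the same class
 * flips to HTB_MAY_BORROW with *diff set to 400. The dead band keeps
 * classes from flapping between modes around the zero-token point.
 */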

/**
 * htb_change_class_mode - changes class's mode
 *
 * This should be the only way to change a class's mode under normal
 * circumstances. The routine will update the feed list linkage, change
 * the mode and add the class to the wait event queue if appropriate.
 * The new mode should be different from the old one and cl->pq_key has
 * to be valid if changing to a mode other than HTB_CAN_SEND
 * (see htb_add_to_wait_tree).
 */
static void
htb_change_class_mode(struct htb_sched *q, struct htb_class *cl, long *diff)
{
	enum htb_cmode new_mode = htb_class_mode(cl, diff);

	if (new_mode == cl->cmode)
		return;

	if (cl->prio_activity) {	/* not necessary: speed optimization */
		if (cl->cmode != HTB_CANT_SEND)
			htb_deactivate_prios(q, cl);
		cl->cmode = new_mode;
		if (new_mode != HTB_CANT_SEND)
			htb_activate_prios(q, cl);
	} else
		cl->cmode = new_mode;
}

/**
 * htb_activate - inserts leaf cl into appropriate active feeds
 *
 * Routine learns (new) priority of leaf and activates feed chain
 * for the prio. It can be called on already active leaf safely.
 * It also adds leaf into droplist.
 */
static inline void htb_activate(struct htb_sched *q, struct htb_class *cl)
{
	WARN_ON(cl->level || !cl->un.leaf.q || !cl->un.leaf.q->q.qlen);

	if (!cl->prio_activity) {
		cl->prio_activity = 1 << cl->prio;
		htb_activate_prios(q, cl);
		list_add_tail(&cl->un.leaf.drop_list,
			      q->drops + cl->prio);
	}
}

/**
 * htb_deactivate - remove leaf cl from active feeds
 *
 * Make sure that leaf is active. In other words, it can't be called
 * with a non-active leaf. It also removes the class from the drop list.
 */
static inline void htb_deactivate(struct htb_sched *q, struct htb_class *cl)
{
	WARN_ON(!cl->prio_activity);

	htb_deactivate_prios(q, cl);
	cl->prio_activity = 0;
	list_del_init(&cl->un.leaf.drop_list);
}

static int htb_enqueue(struct sk_buff *skb, struct Qdisc *sch)
{
	int uninitialized_var(ret);
	struct htb_sched *q = qdisc_priv(sch);
	struct htb_class *cl = htb_classify(skb, sch, &ret);

	if (cl == HTB_DIRECT) {
		/* enqueue to helper queue */
		if (q->direct_queue.qlen < q->direct_qlen) {
			__skb_queue_tail(&q->direct_queue, skb);
			q->direct_pkts++;
		} else {
			kfree_skb(skb);
			sch->qstats.drops++;
			return NET_XMIT_DROP;
		}
#ifdef CONFIG_NET_CLS_ACT
	} else if (!cl) {
		if (ret & __NET_XMIT_BYPASS)
			sch->qstats.drops++;
		kfree_skb(skb);
		return ret;
#endif
	} else if ((ret = qdisc_enqueue(skb, cl->un.leaf.q)) != NET_XMIT_SUCCESS) {
		if (net_xmit_drop_count(ret)) {
			sch->qstats.drops++;
			cl->qstats.drops++;
		}
		return ret;
	} else {
		cl->bstats.packets +=
			skb_is_gso(skb) ? skb_shinfo(skb)->gso_segs : 1;
		cl->bstats.bytes += qdisc_pkt_len(skb);
		htb_activate(q, cl);
	}

	sch->q.qlen++;
	sch->bstats.packets += skb_is_gso(skb) ? skb_shinfo(skb)->gso_segs : 1;
	sch->bstats.bytes += qdisc_pkt_len(skb);
	return NET_XMIT_SUCCESS;
}
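/* Accounting note (added, illustrative): for a GSO skb carrying, say,
 * three segments, the counters above grow packets by gso_segs == 3 but
 * bytes by a single qdisc_pkt_len() of the aggregate skb, i.e. packets
 * counts wire segments while bytes counts the queued length.
 */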

static inline void htb_accnt_tokens(struct htb_class *cl, int bytes, long diff)
{
	long toks = diff + cl->tokens;

	if (toks > cl->buffer)
		toks = cl->buffer;
	toks -= (long) qdisc_l2t(cl->rate, bytes);
	if (toks <= -cl->mbuffer)
		toks = 1 - cl->mbuffer;

	cl->tokens = toks;
}

static inline void htb_accnt_ctokens(struct htb_class *cl, int bytes, long diff)
{
	long toks = diff + cl->ctokens;

	if (toks > cl->cbuffer)
		toks = cl->cbuffer;
	toks -= (long) qdisc_l2t(cl->ceil, bytes);
	if (toks <= -cl->mbuffer)
		toks = 1 - cl->mbuffer;

	cl->ctokens = toks;
}
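/* Numeric sketch (added, illustrative): with diff == 300, cl->tokens ==
 * -100, buffer == 1000 and qdisc_l2t() charging 250 ticks for the packet,
 * htb_accnt_tokens() computes toks = 300 + (-100) = 200 (below the buffer
 * cap), subtracts 250 and stores cl->tokens = -50. The final clamp to
 * 1 - mbuffer bounds how deep a backlogged class can go into debt,
 * mirroring the buffer cap on the credit side.
 */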

/**
 * htb_charge_class - charges amount "bytes" to leaf and ancestors
 *
 * Routine assumes that packet "bytes" long was dequeued from leaf cl
 * borrowing from "level". It accounts bytes to ceil leaky bucket for
 * leaf and all ancestors and to rate bucket for ancestors at levels
 * "level" and higher. It also handles possible change of mode resulting
 * from the update. Note that mode can also increase here (MAY_BORROW to
 * CAN_SEND) because we can use a more precise clock than the event queue
 * here. In such a case we remove the class from the event queue first.
 */
static void htb_charge_class(struct htb_sched *q, struct htb_class *cl,
			     int level, struct sk_buff *skb)
{
	int bytes = qdisc_pkt_len(skb);
	enum htb_cmode old_mode;
	long diff;

	while (cl) {
		diff = psched_tdiff_bounded(q->now, cl->t_c, cl->mbuffer);
		if (cl->level >= level) {
			if (cl->level == level)
				cl->xstats.lends++;
			htb_accnt_tokens(cl, bytes, diff);
		} else {
			cl->xstats.borrows++;
			cl->tokens += diff;	/* we moved t_c; update tokens */
		}
		htb_accnt_ctokens(cl, bytes, diff);
		cl->t_c = q->now;

		old_mode = cl->cmode;
		diff = 0;
		htb_change_class_mode(q, cl, &diff);
		if (old_mode != cl->cmode) {
			if (old_mode != HTB_CAN_SEND)
				htb_safe_rb_erase(&cl->pq_node, q->wait_pq + cl->level);
			if (cl->cmode != HTB_CAN_SEND)
				htb_add_to_wait_tree(q, cl, diff);
		}

		/* update byte stats except for leaves which are already updated */
		if (cl->level) {
			cl->bstats.bytes += bytes;
			cl->bstats.packets += skb_is_gso(skb) ?
					skb_shinfo(skb)->gso_segs : 1;
		}
		cl = cl->parent;
	}
}

/**
 * htb_do_events - make mode changes to classes at the level
 *
 * Scans event queue for pending events and applies them. Returns time of
 * next pending event (0 for no event in pq).
 * Note: only events with cl->pq_key <= q->now are applied.
 */
static psched_time_t htb_do_events(struct htb_sched *q, int level,
				   unsigned long start)
{
	/* don't run for longer than 2 jiffies; 2 is used instead of
	   1 to simplify things when jiffy is going to be incremented
	   too soon */
	unsigned long stop_at = start + 2;
	while (time_before(jiffies, stop_at)) {
		struct htb_class *cl;
		long diff;
		struct rb_node *p = rb_first(&q->wait_pq[level]);

		if (!p)
			return 0;

		cl = rb_entry(p, struct htb_class, pq_node);
		if (cl->pq_key > q->now)
			return cl->pq_key;

		htb_safe_rb_erase(p, q->wait_pq + level);
		diff = psched_tdiff_bounded(q->now, cl->t_c, cl->mbuffer);
		htb_change_class_mode(q, cl, &diff);
		if (cl->cmode != HTB_CAN_SEND)
			htb_add_to_wait_tree(q, cl, diff);
	}
	/* too much load - let's continue on next jiffy (including above) */
	return q->now + 2 * PSCHED_TICKS_PER_SEC / HZ;
}
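/* Timing note (added, illustrative): the overload return value above is
 * 2 jiffies expressed in psched ticks, so at HZ == 1000 the watchdog
 * retries roughly 2 ms later; pending events are never dropped, only
 * deferred to a later htb_do_events() pass.
 */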

/* Returns class->node+prio from id-tree where the class's id is >= id.
   NULL if no such one exists. */
static struct rb_node *htb_id_find_next_upper(int prio, struct rb_node *n,
					      u32 id)
{
	struct rb_node *r = NULL;
	while (n) {
		struct htb_class *cl =
			rb_entry(n, struct htb_class, node[prio]);

		if (id > cl->common.classid) {
			n = n->rb_right;
		} else if (id < cl->common.classid) {
			r = n;
			n = n->rb_left;
		} else {
			return n;
		}
	}
	return r;
}
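/* Example (added, illustrative): in an id-tree holding classids
 * {0x10001, 0x10003, 0x10007}, a lookup for id 0x10004 walks right past
 * 0x10003, records 0x10007 as the smallest id not below the target and
 * returns its node; a lookup for 0x10008 falls off the tree and
 * returns NULL.
 */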

/**
 * htb_lookup_leaf - returns next leaf class in DRR order
 *
 * Find the leaf that the current feed pointers point to.
 */
static struct htb_class *htb_lookup_leaf(struct rb_root *tree, int prio,
					 struct rb_node **pptr, u32 *pid)
{
	int i;
	struct {
		struct rb_node *root;
		struct rb_node **pptr;
		u32 *pid;
	} stk[TC_HTB_MAXDEPTH], *sp = stk;

	BUG_ON(!tree->rb_node);
	sp->root = tree->rb_node;
	sp->pptr = pptr;
	sp->pid = pid;

	for (i = 0; i < 65535; i++) {
		if (!*sp->pptr && *sp->pid) {
			/* ptr was invalidated but id is valid - try to recover
			   the original or next ptr */
			*sp->pptr =
			    htb_id_find_next_upper(prio, sp->root, *sp->pid);
		}
		*sp->pid = 0;	/* ptr is valid now; remove this hint as it
				   can become out of date quickly */
		if (!*sp->pptr) {	/* we are at right end; rewind & go up */
			*sp->pptr = sp->root;
			while ((*sp->pptr)->rb_left)
				*sp->pptr = (*sp->pptr)->rb_left;
			if (sp > stk) {
				sp--;
				if (!*sp->pptr) {
					WARN_ON(1);
					return NULL;
				}
				htb_next_rb_node(sp->pptr);
			}
		} else {
			struct htb_class *cl;
			cl = rb_entry(*sp->pptr, struct htb_class, node[prio]);
			if (!cl->level)
				return cl;
			(++sp)->root = cl->un.inner.feed[prio].rb_node;
			sp->pptr = cl->un.inner.ptr + prio;
			sp->pid = cl->un.inner.last_ptr_id + prio;
		}
	}
	WARN_ON(1);
	return NULL;
}

/* dequeues packet at given priority and level; call only if
   you are sure that there is an active class at prio/level */
static struct sk_buff *htb_dequeue_tree(struct htb_sched *q, int prio,
					int level)
{
	struct sk_buff *skb = NULL;
	struct htb_class *cl, *start;
	/* look initial class up in the row */
	start = cl = htb_lookup_leaf(q->row[level] + prio, prio,
				     q->ptr[level] + prio,
				     q->last_ptr_id[level] + prio);

	do {
next:
		if (unlikely(!cl))
			return NULL;

		/* class can be empty - it is unlikely but can be true if leaf
		   qdisc drops packets in enqueue routine or if someone used
		   graft operation on the leaf since last dequeue;
		   simply deactivate and skip such class */
		if (unlikely(cl->un.leaf.q->q.qlen == 0)) {
			struct htb_class *next;
			htb_deactivate(q, cl);

			/* row/level might become empty */
			if ((q->row_mask[level] & (1 << prio)) == 0)
				return NULL;

			next = htb_lookup_leaf(q->row[level] + prio,
					       prio, q->ptr[level] + prio,
					       q->last_ptr_id[level] + prio);

			if (cl == start)	/* fix start if we just deleted it */
				start = next;
			cl = next;
			goto next;
		}

		skb = cl->un.leaf.q->dequeue(cl->un.leaf.q);
		if (likely(skb != NULL))
			break;

		qdisc_warn_nonwc("htb", cl->un.leaf.q);
		htb_next_rb_node((level ? cl->parent->un.inner.ptr : q->ptr[0]) + prio);
		cl = htb_lookup_leaf(q->row[level] + prio, prio,
				     q->ptr[level] + prio,
				     q->last_ptr_id[level] + prio);

	} while (cl != start);

	if (likely(skb != NULL)) {
		cl->un.leaf.deficit[level] -= qdisc_pkt_len(skb);
		if (cl->un.leaf.deficit[level] < 0) {
			cl->un.leaf.deficit[level] += cl->quantum;
			htb_next_rb_node((level ? cl->parent->un.inner.ptr : q->ptr[0]) + prio);
		}
		/* this used to be after charge_class but this constellation
		   gives us slightly better performance */
		if (!cl->un.leaf.q->q.qlen)
			htb_deactivate(q, cl);
		htb_charge_class(q, cl, level, skb);
	}
	return skb;
}
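/* DRR sketch (added, illustrative): with quantum == 1500, a leaf that
 * dequeues a 4000 byte packet drives deficit[level] to -4000, receives a
 * single +1500 grant and hands the round-robin pointer to the next leaf;
 * it repays the rest of the debt one grant per visit. Once its deficit
 * is non-negative again, a leaf sending small packets keeps the pointer
 * and dequeues back-to-back until the deficit next dips below zero.
 */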

static struct sk_buff *htb_dequeue(struct Qdisc *sch)
{
	struct sk_buff *skb = NULL;
	struct htb_sched *q = qdisc_priv(sch);
	int level;
	psched_time_t next_event;
	unsigned long start_at;

	/* try to dequeue direct packets as high prio (!) to minimize cpu work */
	skb = __skb_dequeue(&q->direct_queue);
	if (skb != NULL) {
		sch->flags &= ~TCQ_F_THROTTLED;
		sch->q.qlen--;
		return skb;
	}

	if (!sch->q.qlen)
		goto fin;
	q->now = psched_get_time();
	start_at = jiffies;

	next_event = q->now + 5 * PSCHED_TICKS_PER_SEC;

	for (level = 0; level < TC_HTB_MAXDEPTH; level++) {
		/* common case optimization - skip event handler quickly */
		int m;
		psched_time_t event;

		if (q->now >= q->near_ev_cache[level]) {
			event = htb_do_events(q, level, start_at);
			if (!event)
				event = q->now + PSCHED_TICKS_PER_SEC;
			q->near_ev_cache[level] = event;
		} else
			event = q->near_ev_cache[level];

		if (next_event > event)
			next_event = event;

		m = ~q->row_mask[level];
		while (m != (int)(-1)) {
			int prio = ffz(m);
			m |= 1 << prio;
			skb = htb_dequeue_tree(q, prio, level);
			if (likely(skb != NULL)) {
				sch->q.qlen--;
				sch->flags &= ~TCQ_F_THROTTLED;
				goto fin;
			}
		}
	}
	sch->qstats.overlimits++;
	qdisc_watchdog_schedule(&q->watchdog, next_event);
fin:
	return skb;
}

/* try to drop from each class (by prio) until one succeeds */
static unsigned int htb_drop(struct Qdisc *sch)
{
	struct htb_sched *q = qdisc_priv(sch);
	int prio;

	for (prio = TC_HTB_NUMPRIO - 1; prio >= 0; prio--) {
		struct list_head *p;
		list_for_each(p, q->drops + prio) {
			struct htb_class *cl = list_entry(p, struct htb_class,
							  un.leaf.drop_list);
			unsigned int len;
			if (cl->un.leaf.q->ops->drop &&
			    (len = cl->un.leaf.q->ops->drop(cl->un.leaf.q))) {
				sch->q.qlen--;
				if (!cl->un.leaf.q->q.qlen)
					htb_deactivate(q, cl);
				return len;
			}
		}
	}
	return 0;
}

/* reset all classes */
/* always called under BH & queue lock */
static void htb_reset(struct Qdisc *sch)
{
	struct htb_sched *q = qdisc_priv(sch);
	struct htb_class *cl;
	struct hlist_node *n;
	unsigned int i;

	for (i = 0; i < q->clhash.hashsize; i++) {
		hlist_for_each_entry(cl, n, &q->clhash.hash[i], common.hnode) {
			if (cl->level)
				memset(&cl->un.inner, 0, sizeof(cl->un.inner));
			else {
				if (cl->un.leaf.q)
					qdisc_reset(cl->un.leaf.q);
				INIT_LIST_HEAD(&cl->un.leaf.drop_list);
			}
			cl->prio_activity = 0;
			cl->cmode = HTB_CAN_SEND;

		}
	}
	qdisc_watchdog_cancel(&q->watchdog);
	__skb_queue_purge(&q->direct_queue);
	sch->q.qlen = 0;
	memset(q->row, 0, sizeof(q->row));
	memset(q->row_mask, 0, sizeof(q->row_mask));
	memset(q->wait_pq, 0, sizeof(q->wait_pq));
	memset(q->ptr, 0, sizeof(q->ptr));
	for (i = 0; i < TC_HTB_NUMPRIO; i++)
		INIT_LIST_HEAD(q->drops + i);
}

static const struct nla_policy htb_policy[TCA_HTB_MAX + 1] = {
	[TCA_HTB_PARMS] = { .len = sizeof(struct tc_htb_opt) },
	[TCA_HTB_INIT]  = { .len = sizeof(struct tc_htb_glob) },
	[TCA_HTB_CTAB]  = { .type = NLA_BINARY, .len = TC_RTAB_SIZE },
	[TCA_HTB_RTAB]  = { .type = NLA_BINARY, .len = TC_RTAB_SIZE },
};

static int htb_init(struct Qdisc *sch, struct nlattr *opt)
{
	struct htb_sched *q = qdisc_priv(sch);
	struct nlattr *tb[TCA_HTB_INIT + 1];
	struct tc_htb_glob *gopt;
	int err;
	int i;

	if (!opt)
		return -EINVAL;

	err = nla_parse_nested(tb, TCA_HTB_INIT, opt, htb_policy);
	if (err < 0)
		return err;

	if (tb[TCA_HTB_INIT] == NULL) {
		printk(KERN_ERR "HTB: hey probably you have bad tc tool ?\n");
		return -EINVAL;
	}
	gopt = nla_data(tb[TCA_HTB_INIT]);
	if (gopt->version != HTB_VER >> 16) {
		printk(KERN_ERR
		       "HTB: need tc/htb version %d (minor is %d), you have %d\n",
		       HTB_VER >> 16, HTB_VER & 0xffff, gopt->version);
		return -EINVAL;
	}

	err = qdisc_class_hash_init(&q->clhash);
	if (err < 0)
		return err;
	for (i = 0; i < TC_HTB_NUMPRIO; i++)
		INIT_LIST_HEAD(q->drops + i);

	qdisc_watchdog_init(&q->watchdog, sch);
	skb_queue_head_init(&q->direct_queue);

	q->direct_qlen = qdisc_dev(sch)->tx_queue_len;
	if (q->direct_qlen < 2)	/* some devices have zero tx_queue_len */
		q->direct_qlen = 2;

	if ((q->rate2quantum = gopt->rate2quantum) < 1)
		q->rate2quantum = 1;
	q->defcls = gopt->defcls;

	return 0;
}
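/* Setup sketch (added, illustrative): the globals parsed above correspond
 * to a tc invocation along the lines of
 *
 *	tc qdisc add dev eth0 root handle 1: htb default 20 r2q 10
 *
 * where "default 20" lands in q->defcls and "r2q 10" in q->rate2quantum.
 */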

static int htb_dump(struct Qdisc *sch, struct sk_buff *skb)
{
	spinlock_t *root_lock = qdisc_root_sleeping_lock(sch);
	struct htb_sched *q = qdisc_priv(sch);
	struct nlattr *nest;
	struct tc_htb_glob gopt;

	spin_lock_bh(root_lock);

	gopt.direct_pkts = q->direct_pkts;
	gopt.version = HTB_VER;
	gopt.rate2quantum = q->rate2quantum;
	gopt.defcls = q->defcls;
	gopt.debug = 0;

	nest = nla_nest_start(skb, TCA_OPTIONS);
	if (nest == NULL)
		goto nla_put_failure;
	NLA_PUT(skb, TCA_HTB_INIT, sizeof(gopt), &gopt);
	nla_nest_end(skb, nest);

	spin_unlock_bh(root_lock);
	return skb->len;

nla_put_failure:
	spin_unlock_bh(root_lock);
	nla_nest_cancel(skb, nest);
	return -1;
}

static int htb_dump_class(struct Qdisc *sch, unsigned long arg,
			  struct sk_buff *skb, struct tcmsg *tcm)
{
	struct htb_class *cl = (struct htb_class *)arg;
	spinlock_t *root_lock = qdisc_root_sleeping_lock(sch);
	struct nlattr *nest;
	struct tc_htb_opt opt;

	spin_lock_bh(root_lock);
	tcm->tcm_parent = cl->parent ? cl->parent->common.classid : TC_H_ROOT;
	tcm->tcm_handle = cl->common.classid;
	if (!cl->level && cl->un.leaf.q)
		tcm->tcm_info = cl->un.leaf.q->handle;

	nest = nla_nest_start(skb, TCA_OPTIONS);
	if (nest == NULL)
		goto nla_put_failure;

	memset(&opt, 0, sizeof(opt));

	opt.rate = cl->rate->rate;
	opt.buffer = cl->buffer;
	opt.ceil = cl->ceil->rate;
	opt.cbuffer = cl->cbuffer;
	opt.quantum = cl->quantum;
	opt.prio = cl->prio;
	opt.level = cl->level;
	NLA_PUT(skb, TCA_HTB_PARMS, sizeof(opt), &opt);

	nla_nest_end(skb, nest);
	spin_unlock_bh(root_lock);
	return skb->len;

nla_put_failure:
	spin_unlock_bh(root_lock);
	nla_nest_cancel(skb, nest);
	return -1;
}

static int
htb_dump_class_stats(struct Qdisc *sch, unsigned long arg, struct gnet_dump *d)
{
	struct htb_class *cl = (struct htb_class *)arg;

	if (!cl->level && cl->un.leaf.q)
		cl->qstats.qlen = cl->un.leaf.q->q.qlen;
	cl->xstats.tokens = cl->tokens;
	cl->xstats.ctokens = cl->ctokens;

	if (gnet_stats_copy_basic(d, &cl->bstats) < 0 ||
	    gnet_stats_copy_rate_est(d, &cl->rate_est) < 0 ||
	    gnet_stats_copy_queue(d, &cl->qstats) < 0)
		return -1;

	return gnet_stats_copy_app(d, &cl->xstats, sizeof(cl->xstats));
}

1092static int htb_graft(struct Qdisc *sch, unsigned long arg, struct Qdisc *new,
Stephen Hemminger87990462006-08-10 23:35:16 -07001093 struct Qdisc **old)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001094{
Stephen Hemminger87990462006-08-10 23:35:16 -07001095 struct htb_class *cl = (struct htb_class *)arg;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001096
1097 if (cl && !cl->level) {
Patrick McHardy9f9afec2006-11-29 17:35:18 -08001098 if (new == NULL &&
David S. Miller5ce2d482008-07-08 17:06:30 -07001099 (new = qdisc_create_dflt(qdisc_dev(sch), sch->dev_queue,
David S. Millerbb949fb2008-07-08 16:55:56 -07001100 &pfifo_qdisc_ops,
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001101 cl->common.classid))
Stephen Hemminger87990462006-08-10 23:35:16 -07001102 == NULL)
1103 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001104 sch_tree_lock(sch);
Patrick McHardyb94c8af2008-11-20 04:11:36 -08001105 *old = cl->un.leaf.q;
1106 cl->un.leaf.q = new;
1107 if (*old != NULL) {
Patrick McHardy256d61b2006-11-29 17:37:05 -08001108 qdisc_tree_decrease_qlen(*old, (*old)->q.qlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001109 qdisc_reset(*old);
1110 }
1111 sch_tree_unlock(sch);
1112 return 0;
1113 }
1114 return -ENOENT;
1115}
1116
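/* Return the qdisc attached to a leaf class, or NULL for inner classes. */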
Stephen Hemminger87990462006-08-10 23:35:16 -07001117static struct Qdisc *htb_leaf(struct Qdisc *sch, unsigned long arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001118{
Stephen Hemminger87990462006-08-10 23:35:16 -07001119 struct htb_class *cl = (struct htb_class *)arg;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001120 return (cl && !cl->level) ? cl->un.leaf.q : NULL;
1121}
1122
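/* Called after the class's queue length dropped; once the leaf qdisc
 * is empty the class must leave the active feeds so that dequeue never
 * selects an empty leaf.
 */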
Patrick McHardy256d61b2006-11-29 17:37:05 -08001123static void htb_qlen_notify(struct Qdisc *sch, unsigned long arg)
1124{
1125 struct htb_class *cl = (struct htb_class *)arg;
1126
1127 if (cl->un.leaf.q->q.qlen == 0)
1128 htb_deactivate(qdisc_priv(sch), cl);
1129}
1130
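/* Look up a class by classid and take a reference on it. */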
Linus Torvalds1da177e2005-04-16 15:20:36 -07001131static unsigned long htb_get(struct Qdisc *sch, u32 classid)
1132{
Stephen Hemminger87990462006-08-10 23:35:16 -07001133 struct htb_class *cl = htb_find(classid, sch);
1134 if (cl)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001135 cl->refcnt++;
1136 return (unsigned long)cl;
1137}
1138
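/* True when cl is its parent's only remaining child, i.e. deleting it
 * would leave the parent childless; the root class never qualifies.
 */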
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001139static inline int htb_parent_last_child(struct htb_class *cl)
1140{
1141 if (!cl->parent)
1142 /* the root class */
1143 return 0;
Patrick McHardy42077592008-07-05 23:22:53 -07001144 if (cl->parent->children > 1)
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001145 /* not the last child */
1146 return 0;
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001147 return 1;
1148}
1149
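/* Demote an inner class back to a leaf after its last child is gone:
 * drop it from the event queue if it was throttled, attach new_q (or
 * the noop qdisc), refill its tokens and mark it HTB_CAN_SEND again.
 */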
Jarek Poplawski3ba08b02008-05-03 20:46:29 -07001150static void htb_parent_to_leaf(struct htb_sched *q, struct htb_class *cl,
1151 struct Qdisc *new_q)
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001152{
1153 struct htb_class *parent = cl->parent;
1154
Ilpo Järvinen547b7922008-07-25 21:43:18 -07001155 WARN_ON(cl->level || !cl->un.leaf.q || cl->prio_activity);
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001156
Jarek Poplawski3ba08b02008-05-03 20:46:29 -07001157 if (parent->cmode != HTB_CAN_SEND)
1158 htb_safe_rb_erase(&parent->pq_node, q->wait_pq + parent->level);
1159
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001160 parent->level = 0;
1161 memset(&parent->un.inner, 0, sizeof(parent->un.inner));
1162 INIT_LIST_HEAD(&parent->un.leaf.drop_list);
1163 parent->un.leaf.q = new_q ? new_q : &noop_qdisc;
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001164 parent->tokens = parent->buffer;
1165 parent->ctokens = parent->cbuffer;
Patrick McHardy3bebcda2007-03-23 11:29:25 -07001166 parent->t_c = psched_get_time();
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001167 parent->cmode = HTB_CAN_SEND;
1168}
1169
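/* Free one class: the attached leaf qdisc, its rate estimator, both
 * rate tables and the filter chain go with it.
 */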
Stephen Hemminger87990462006-08-10 23:35:16 -07001170static void htb_destroy_class(struct Qdisc *sch, struct htb_class *cl)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001171{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001172 if (!cl->level) {
Ilpo Järvinen547b7922008-07-25 21:43:18 -07001173 WARN_ON(!cl->un.leaf.q);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001174 qdisc_destroy(cl->un.leaf.q);
1175 }
Patrick McHardyee39e102007-07-02 22:48:13 -07001176 gen_kill_estimator(&cl->bstats, &cl->rate_est);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001177 qdisc_put_rtab(cl->rate);
1178 qdisc_put_rtab(cl->ceil);
Stephen Hemminger87990462006-08-10 23:35:16 -07001179
Patrick McHardyff31ab52008-07-01 19:52:38 -07001180 tcf_destroy_chain(&cl->filter_list);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001181 kfree(cl);
1182}
1183
 1184/* always called under BH & queue lock */
Stephen Hemminger87990462006-08-10 23:35:16 -07001185static void htb_destroy(struct Qdisc *sch)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001186{
1187 struct htb_sched *q = qdisc_priv(sch);
Patrick McHardyfbd8f132008-07-05 23:22:19 -07001188 struct hlist_node *n, *next;
1189 struct htb_class *cl;
1190 unsigned int i;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001191
Patrick McHardyfb983d42007-03-16 01:22:39 -07001192 qdisc_watchdog_cancel(&q->watchdog);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001193	/* This line used to be after the htb_destroy_class call below,
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +09001194	   and surprisingly it worked in 2.4. But it must precede it
Linus Torvalds1da177e2005-04-16 15:20:36 -07001195	   because filters need their target class alive to be able to call
 1196	   unbind_filter on it (without an Oops). */
Patrick McHardyff31ab52008-07-01 19:52:38 -07001197 tcf_destroy_chain(&q->filter_list);
Stephen Hemminger87990462006-08-10 23:35:16 -07001198
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001199 for (i = 0; i < q->clhash.hashsize; i++) {
1200 hlist_for_each_entry(cl, n, &q->clhash.hash[i], common.hnode)
Patrick McHardyfbd8f132008-07-05 23:22:19 -07001201 tcf_destroy_chain(&cl->filter_list);
1202 }
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001203 for (i = 0; i < q->clhash.hashsize; i++) {
1204 hlist_for_each_entry_safe(cl, n, next, &q->clhash.hash[i],
1205 common.hnode)
Patrick McHardyfbd8f132008-07-05 23:22:19 -07001206 htb_destroy_class(sch, cl);
1207 }
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001208 qdisc_class_hash_destroy(&q->clhash);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001209 __skb_queue_purge(&q->direct_queue);
1210}
1211
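/* Delete a single class. Classes that still have children or are held
 * by filters stay; a leaf is drained first, unlinked from the hash,
 * and if it was the parent's last child the parent is converted back
 * into a leaf.
 */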
1212static int htb_delete(struct Qdisc *sch, unsigned long arg)
1213{
1214 struct htb_sched *q = qdisc_priv(sch);
Stephen Hemminger87990462006-08-10 23:35:16 -07001215 struct htb_class *cl = (struct htb_class *)arg;
Patrick McHardy256d61b2006-11-29 17:37:05 -08001216 unsigned int qlen;
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001217 struct Qdisc *new_q = NULL;
1218 int last_child = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001219
 1220	// TODO: why don't we allow deleting a subtree? references? does
 1221	// the tc subsystem guarantee us that in htb_destroy it holds no
 1222	// class refs so that we can remove children safely there?
Patrick McHardy42077592008-07-05 23:22:53 -07001223 if (cl->children || cl->filter_cnt)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001224 return -EBUSY;
Stephen Hemminger87990462006-08-10 23:35:16 -07001225
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001226 if (!cl->level && htb_parent_last_child(cl)) {
David S. Miller5ce2d482008-07-08 17:06:30 -07001227 new_q = qdisc_create_dflt(qdisc_dev(sch), sch->dev_queue,
David S. Millerbb949fb2008-07-08 16:55:56 -07001228 &pfifo_qdisc_ops,
1229 cl->parent->common.classid);
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001230 last_child = 1;
1231 }
1232
Linus Torvalds1da177e2005-04-16 15:20:36 -07001233 sch_tree_lock(sch);
Stephen Hemminger87990462006-08-10 23:35:16 -07001234
Patrick McHardy814a175e2006-11-29 17:34:50 -08001235 if (!cl->level) {
Patrick McHardy256d61b2006-11-29 17:37:05 -08001236 qlen = cl->un.leaf.q->q.qlen;
Patrick McHardy814a175e2006-11-29 17:34:50 -08001237 qdisc_reset(cl->un.leaf.q);
Patrick McHardy256d61b2006-11-29 17:37:05 -08001238 qdisc_tree_decrease_qlen(cl->un.leaf.q, qlen);
Patrick McHardy814a175e2006-11-29 17:34:50 -08001239 }
1240
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001241 /* delete from hash and active; remainder in destroy_class */
1242 qdisc_class_hash_remove(&q->clhash, &cl->common);
Jarek Poplawski26b284d2008-08-13 15:16:43 -07001243 if (cl->parent)
1244 cl->parent->children--;
Patrick McHardyc38c83c2007-03-27 14:04:24 -07001245
Linus Torvalds1da177e2005-04-16 15:20:36 -07001246 if (cl->prio_activity)
Stephen Hemminger87990462006-08-10 23:35:16 -07001247 htb_deactivate(q, cl);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001248
Patrick McHardyfbd8f132008-07-05 23:22:19 -07001249 if (cl->cmode != HTB_CAN_SEND)
1250 htb_safe_rb_erase(&cl->pq_node, q->wait_pq + cl->level);
1251
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001252 if (last_child)
Jarek Poplawski3ba08b02008-05-03 20:46:29 -07001253 htb_parent_to_leaf(q, cl, new_q);
Jarek Poplawski160d5e12006-12-08 00:26:56 -08001254
Linus Torvalds1da177e2005-04-16 15:20:36 -07001255 if (--cl->refcnt == 0)
Stephen Hemminger87990462006-08-10 23:35:16 -07001256 htb_destroy_class(sch, cl);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001257
1258 sch_tree_unlock(sch);
1259 return 0;
1260}
1261
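/* Release a reference taken by htb_get; the last put frees the class. */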
1262static void htb_put(struct Qdisc *sch, unsigned long arg)
1263{
Stephen Hemminger87990462006-08-10 23:35:16 -07001264 struct htb_class *cl = (struct htb_class *)arg;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001265
1266 if (--cl->refcnt == 0)
Stephen Hemminger87990462006-08-10 23:35:16 -07001267 htb_destroy_class(sch, cl);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001268}
1269
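/* Create a new class or change an existing one. This is the kernel
 * side of, for example (illustrative userspace commands):
 *
 *   tc qdisc add dev eth0 root handle 1: htb default 20
 *   tc class add dev eth0 parent 1: classid 1:1 htb rate 1mbit ceil 1mbit
 *   tc class add dev eth0 parent 1:1 classid 1:10 htb rate 600kbit ceil 1mbit
 *
 * which arrive here as TCA_HTB_PARMS plus the RTAB/CTAB rate tables.
 */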
Stephen Hemminger87990462006-08-10 23:35:16 -07001270static int htb_change_class(struct Qdisc *sch, u32 classid,
Patrick McHardy1e904742008-01-22 22:11:17 -08001271 u32 parentid, struct nlattr **tca,
Stephen Hemminger87990462006-08-10 23:35:16 -07001272 unsigned long *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001273{
1274 int err = -EINVAL;
1275 struct htb_sched *q = qdisc_priv(sch);
Stephen Hemminger87990462006-08-10 23:35:16 -07001276 struct htb_class *cl = (struct htb_class *)*arg, *parent;
Patrick McHardy1e904742008-01-22 22:11:17 -08001277 struct nlattr *opt = tca[TCA_OPTIONS];
Linus Torvalds1da177e2005-04-16 15:20:36 -07001278 struct qdisc_rate_table *rtab = NULL, *ctab = NULL;
Patrick McHardy1e904742008-01-22 22:11:17 -08001279 struct nlattr *tb[TCA_HTB_RTAB + 1];
Linus Torvalds1da177e2005-04-16 15:20:36 -07001280 struct tc_htb_opt *hopt;
1281
1282 /* extract all subattrs from opt attr */
Patrick McHardycee63722008-01-23 20:33:32 -08001283 if (!opt)
1284 goto failure;
1285
Patrick McHardy27a34212008-01-23 20:35:39 -08001286 err = nla_parse_nested(tb, TCA_HTB_RTAB, opt, htb_policy);
Patrick McHardycee63722008-01-23 20:33:32 -08001287 if (err < 0)
1288 goto failure;
1289
1290 err = -EINVAL;
Patrick McHardy27a34212008-01-23 20:35:39 -08001291 if (tb[TCA_HTB_PARMS] == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001292 goto failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001293
Stephen Hemminger87990462006-08-10 23:35:16 -07001294 parent = parentid == TC_H_ROOT ? NULL : htb_find(parentid, sch);
Stephen Hemminger3bf72952006-08-10 23:31:08 -07001295
Patrick McHardy1e904742008-01-22 22:11:17 -08001296 hopt = nla_data(tb[TCA_HTB_PARMS]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001297
Patrick McHardy1e904742008-01-22 22:11:17 -08001298 rtab = qdisc_get_rtab(&hopt->rate, tb[TCA_HTB_RTAB]);
1299 ctab = qdisc_get_rtab(&hopt->ceil, tb[TCA_HTB_CTAB]);
Stephen Hemminger87990462006-08-10 23:35:16 -07001300 if (!rtab || !ctab)
1301 goto failure;
1302
1303 if (!cl) { /* new class */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001304 struct Qdisc *new_q;
Stephen Hemminger3696f622006-08-10 23:36:01 -07001305 int prio;
Patrick McHardyee39e102007-07-02 22:48:13 -07001306 struct {
Patrick McHardy1e904742008-01-22 22:11:17 -08001307 struct nlattr nla;
Patrick McHardyee39e102007-07-02 22:48:13 -07001308 struct gnet_estimator opt;
1309 } est = {
Patrick McHardy1e904742008-01-22 22:11:17 -08001310 .nla = {
1311 .nla_len = nla_attr_size(sizeof(est.opt)),
1312 .nla_type = TCA_RATE,
Patrick McHardyee39e102007-07-02 22:48:13 -07001313 },
1314 .opt = {
1315 /* 4s interval, 16s averaging constant */
1316 .interval = 2,
1317 .ewma_log = 2,
1318 },
1319 };
Stephen Hemminger3696f622006-08-10 23:36:01 -07001320
Linus Torvalds1da177e2005-04-16 15:20:36 -07001321 /* check for valid classid */
Stephen Hemminger87990462006-08-10 23:35:16 -07001322 if (!classid || TC_H_MAJ(classid ^ sch->handle)
1323 || htb_find(classid, sch))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001324 goto failure;
1325
1326 /* check maximal depth */
1327 if (parent && parent->parent && parent->parent->level < 2) {
1328 printk(KERN_ERR "htb: tree is too deep\n");
1329 goto failure;
1330 }
1331 err = -ENOBUFS;
Panagiotis Issaris0da974f2006-07-21 14:51:30 -07001332 if ((cl = kzalloc(sizeof(*cl), GFP_KERNEL)) == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001333 goto failure;
Stephen Hemminger87990462006-08-10 23:35:16 -07001334
Stephen Hemminger71bcb092008-11-25 21:13:31 -08001335 err = gen_new_estimator(&cl->bstats, &cl->rate_est,
1336 qdisc_root_sleeping_lock(sch),
1337 tca[TCA_RATE] ? : &est.nla);
1338 if (err) {
1339 kfree(cl);
1340 goto failure;
1341 }
1342
Linus Torvalds1da177e2005-04-16 15:20:36 -07001343 cl->refcnt = 1;
Patrick McHardy42077592008-07-05 23:22:53 -07001344 cl->children = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001345 INIT_LIST_HEAD(&cl->un.leaf.drop_list);
Stephen Hemminger3696f622006-08-10 23:36:01 -07001346 RB_CLEAR_NODE(&cl->pq_node);
1347
1348 for (prio = 0; prio < TC_HTB_NUMPRIO; prio++)
1349 RB_CLEAR_NODE(&cl->node[prio]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001350
1351 /* create leaf qdisc early because it uses kmalloc(GFP_KERNEL)
 1352		   which can't be used inside of sch_tree_lock
1353 -- thanks to Karlis Peisenieks */
David S. Miller5ce2d482008-07-08 17:06:30 -07001354 new_q = qdisc_create_dflt(qdisc_dev(sch), sch->dev_queue,
David S. Millerbb949fb2008-07-08 16:55:56 -07001355 &pfifo_qdisc_ops, classid);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001356 sch_tree_lock(sch);
1357 if (parent && !parent->level) {
Patrick McHardy256d61b2006-11-29 17:37:05 -08001358 unsigned int qlen = parent->un.leaf.q->q.qlen;
1359
Linus Torvalds1da177e2005-04-16 15:20:36 -07001360 /* turn parent into inner node */
Patrick McHardy256d61b2006-11-29 17:37:05 -08001361 qdisc_reset(parent->un.leaf.q);
1362 qdisc_tree_decrease_qlen(parent->un.leaf.q, qlen);
Stephen Hemminger87990462006-08-10 23:35:16 -07001363 qdisc_destroy(parent->un.leaf.q);
1364 if (parent->prio_activity)
1365 htb_deactivate(q, parent);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001366
1367 /* remove from evt list because of level change */
1368 if (parent->cmode != HTB_CAN_SEND) {
Stephen Hemminger3696f622006-08-10 23:36:01 -07001369 htb_safe_rb_erase(&parent->pq_node, q->wait_pq);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001370 parent->cmode = HTB_CAN_SEND;
1371 }
1372 parent->level = (parent->parent ? parent->parent->level
Stephen Hemminger87990462006-08-10 23:35:16 -07001373 : TC_HTB_MAXDEPTH) - 1;
1374 memset(&parent->un.inner, 0, sizeof(parent->un.inner));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001375 }
 1376		/* the leaf (this class) needs an elementary qdisc */
1377 cl->un.leaf.q = new_q ? new_q : &noop_qdisc;
1378
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001379 cl->common.classid = classid;
Stephen Hemminger87990462006-08-10 23:35:16 -07001380 cl->parent = parent;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001381
1382 /* set class to be in HTB_CAN_SEND state */
1383 cl->tokens = hopt->buffer;
1384 cl->ctokens = hopt->cbuffer;
Patrick McHardy00c04af2007-03-16 01:23:02 -07001385 cl->mbuffer = 60 * PSCHED_TICKS_PER_SEC; /* 1min */
Patrick McHardy3bebcda2007-03-23 11:29:25 -07001386 cl->t_c = psched_get_time();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001387 cl->cmode = HTB_CAN_SEND;
1388
1389 /* attach to the hash list and parent's family */
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001390 qdisc_class_hash_insert(&q->clhash, &cl->common);
Patrick McHardy42077592008-07-05 23:22:53 -07001391 if (parent)
1392 parent->children++;
Patrick McHardyee39e102007-07-02 22:48:13 -07001393 } else {
Stephen Hemminger71bcb092008-11-25 21:13:31 -08001394 if (tca[TCA_RATE]) {
1395 err = gen_replace_estimator(&cl->bstats, &cl->rate_est,
1396 qdisc_root_sleeping_lock(sch),
1397 tca[TCA_RATE]);
1398 if (err)
1399 return err;
1400 }
Stephen Hemminger87990462006-08-10 23:35:16 -07001401 sch_tree_lock(sch);
Patrick McHardyee39e102007-07-02 22:48:13 -07001402 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001403
 1404	/* there used to be a nasty bug here: we have to check that the
Stephen Hemminger87990462006-08-10 23:35:16 -07001405	   node is really a leaf before changing cl->un.leaf! */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001406 if (!cl->level) {
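		/* quantum bounds how many bytes a leaf may dequeue in one
		 * round of the per-priority DRR; if not set explicitly it
		 * is derived from the rate. E.g. with tc's default r2q of
		 * 10, a 1 mbit class (125000 bytes/s) would get a 12500
		 * byte quantum; the clamps below keep it in [1000, 200000].
		 */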
Jarek Poplawskic19f7a32008-12-03 21:09:45 -08001407 cl->quantum = rtab->rate.rate / q->rate2quantum;
1408 if (!hopt->quantum && cl->quantum < 1000) {
Stephen Hemminger87990462006-08-10 23:35:16 -07001409 printk(KERN_WARNING
1410 "HTB: quantum of class %X is small. Consider r2q change.\n",
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001411 cl->common.classid);
Jarek Poplawskic19f7a32008-12-03 21:09:45 -08001412 cl->quantum = 1000;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001413 }
Jarek Poplawskic19f7a32008-12-03 21:09:45 -08001414 if (!hopt->quantum && cl->quantum > 200000) {
Stephen Hemminger87990462006-08-10 23:35:16 -07001415 printk(KERN_WARNING
1416 "HTB: quantum of class %X is big. Consider r2q change.\n",
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001417 cl->common.classid);
Jarek Poplawskic19f7a32008-12-03 21:09:45 -08001418 cl->quantum = 200000;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001419 }
1420 if (hopt->quantum)
Jarek Poplawskic19f7a32008-12-03 21:09:45 -08001421 cl->quantum = hopt->quantum;
1422 if ((cl->prio = hopt->prio) >= TC_HTB_NUMPRIO)
1423 cl->prio = TC_HTB_NUMPRIO - 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001424 }
1425
1426 cl->buffer = hopt->buffer;
1427 cl->cbuffer = hopt->cbuffer;
Stephen Hemminger87990462006-08-10 23:35:16 -07001428 if (cl->rate)
1429 qdisc_put_rtab(cl->rate);
1430 cl->rate = rtab;
1431 if (cl->ceil)
1432 qdisc_put_rtab(cl->ceil);
1433 cl->ceil = ctab;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001434 sch_tree_unlock(sch);
1435
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001436 qdisc_class_hash_grow(sch, &q->clhash);
1437
Linus Torvalds1da177e2005-04-16 15:20:36 -07001438 *arg = (unsigned long)cl;
1439 return 0;
1440
1441failure:
Stephen Hemminger87990462006-08-10 23:35:16 -07001442 if (rtab)
1443 qdisc_put_rtab(rtab);
1444 if (ctab)
1445 qdisc_put_rtab(ctab);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001446 return err;
1447}
1448
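/* Return the filter chain of a class, or the qdisc-level chain when no
 * class is given.
 */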
1449static struct tcf_proto **htb_find_tcf(struct Qdisc *sch, unsigned long arg)
1450{
1451 struct htb_sched *q = qdisc_priv(sch);
1452 struct htb_class *cl = (struct htb_class *)arg;
1453 struct tcf_proto **fl = cl ? &cl->filter_list : &q->filter_list;
Stephen Hemminger3bf72952006-08-10 23:31:08 -07001454
Linus Torvalds1da177e2005-04-16 15:20:36 -07001455 return fl;
1456}
1457
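/* A filter referencing this class is being attached; count it so the
 * class cannot be deleted from under the filter.
 */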
1458static unsigned long htb_bind_filter(struct Qdisc *sch, unsigned long parent,
Stephen Hemminger87990462006-08-10 23:35:16 -07001459 u32 classid)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001460{
Stephen Hemminger87990462006-08-10 23:35:16 -07001461 struct htb_class *cl = htb_find(classid, sch);
Stephen Hemminger3bf72952006-08-10 23:31:08 -07001462
Linus Torvalds1da177e2005-04-16 15:20:36 -07001463 /*if (cl && !cl->level) return 0;
Stephen Hemminger87990462006-08-10 23:35:16 -07001464 The line above used to be there to prevent attaching filters to
 1465	   leaves. But at least the tc_index filter uses this just to get
 1466	   the class for other reasons, so we have to allow it.
1467 ----
1468 19.6.2002 As Werner explained it is ok - bind filter is just
1469 another way to "lock" the class - unlike "get" this lock can
 1470	   be broken by the class during destroy, IIUC.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001471 */
Stephen Hemminger87990462006-08-10 23:35:16 -07001472 if (cl)
1473 cl->filter_cnt++;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001474 return (unsigned long)cl;
1475}
1476
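/* Drop the reference taken in htb_bind_filter. */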
1477static void htb_unbind_filter(struct Qdisc *sch, unsigned long arg)
1478{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001479 struct htb_class *cl = (struct htb_class *)arg;
Stephen Hemminger3bf72952006-08-10 23:31:08 -07001480
Stephen Hemminger87990462006-08-10 23:35:16 -07001481 if (cl)
1482 cl->filter_cnt--;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001483}
1484
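/* Walk every class in the hash, honouring the walker's skip/stop
 * bookkeeping; this backs 'tc class show'-style dumps.
 */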
1485static void htb_walk(struct Qdisc *sch, struct qdisc_walker *arg)
1486{
1487 struct htb_sched *q = qdisc_priv(sch);
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001488 struct htb_class *cl;
1489 struct hlist_node *n;
1490 unsigned int i;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001491
1492 if (arg->stop)
1493 return;
1494
Patrick McHardyf4c1f3e2008-07-05 23:22:35 -07001495 for (i = 0; i < q->clhash.hashsize; i++) {
1496 hlist_for_each_entry(cl, n, &q->clhash.hash[i], common.hnode) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001497 if (arg->count < arg->skip) {
1498 arg->count++;
1499 continue;
1500 }
1501 if (arg->fn(sch, (unsigned long)cl, arg) < 0) {
1502 arg->stop = 1;
1503 return;
1504 }
1505 arg->count++;
1506 }
1507 }
1508}
1509
Eric Dumazet20fea082007-11-14 01:44:41 -08001510static const struct Qdisc_class_ops htb_class_ops = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001511 .graft = htb_graft,
1512 .leaf = htb_leaf,
Patrick McHardy256d61b2006-11-29 17:37:05 -08001513 .qlen_notify = htb_qlen_notify,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001514 .get = htb_get,
1515 .put = htb_put,
1516 .change = htb_change_class,
1517 .delete = htb_delete,
1518 .walk = htb_walk,
1519 .tcf_chain = htb_find_tcf,
1520 .bind_tcf = htb_bind_filter,
1521 .unbind_tcf = htb_unbind_filter,
1522 .dump = htb_dump_class,
1523 .dump_stats = htb_dump_class_stats,
1524};
1525
Eric Dumazet20fea082007-11-14 01:44:41 -08001526static struct Qdisc_ops htb_qdisc_ops __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001527 .next = NULL,
1528 .cl_ops = &htb_class_ops,
1529 .id = "htb",
1530 .priv_size = sizeof(struct htb_sched),
1531 .enqueue = htb_enqueue,
1532 .dequeue = htb_dequeue,
Jarek Poplawski77be1552008-10-31 00:47:01 -07001533 .peek = qdisc_peek_dequeued,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001534 .drop = htb_drop,
1535 .init = htb_init,
1536 .reset = htb_reset,
1537 .destroy = htb_destroy,
1538 .change = NULL /* htb_change */,
1539 .dump = htb_dump,
1540 .owner = THIS_MODULE,
1541};
1542
1543static int __init htb_module_init(void)
1544{
Stephen Hemminger87990462006-08-10 23:35:16 -07001545 return register_qdisc(&htb_qdisc_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001546}
Stephen Hemminger87990462006-08-10 23:35:16 -07001547static void __exit htb_module_exit(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001548{
Stephen Hemminger87990462006-08-10 23:35:16 -07001549 unregister_qdisc(&htb_qdisc_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001550}
Stephen Hemminger87990462006-08-10 23:35:16 -07001551
Linus Torvalds1da177e2005-04-16 15:20:36 -07001552module_init(htb_module_init)
1553module_exit(htb_module_exit)
1554MODULE_LICENSE("GPL");