blob: 02fa82792dab8334d1dc14408f7ed42a4db0c141 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * net/sched/cls_rsvp.h Template file for RSVPv[46] classifiers.
3 *
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version
7 * 2 of the License, or (at your option) any later version.
8 *
9 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
10 */
11
12/*
13 Compared to the general packet classification problem,
14 RSVP needs only several relatively simple rules:
15
16 * (dst, protocol) are always specified,
17 so that we are able to hash them.
18 * src may be exact, or may be wildcard, so that
19 we can keep a hash table plus one wildcard entry.
20 * source port (or flow label) is important only if src is given.
21
22 IMPLEMENTATION.
23
24 We use a two level hash table: The top level is keyed by
25 destination address and protocol ID, every bucket contains a list
26 of "rsvp sessions", identified by destination address, protocol and
27 DPI(="Destination Port ID"): triple (key, mask, offset).
28
29 Every bucket has a smaller hash table keyed by source address
30 (cf. RSVP flowspec) and one wildcard entry for wildcard reservations.
31 Every bucket is again a list of "RSVP flows", selected by
32 source address and SPI(="Source Port ID" here rather than
33 "security parameter index"): triple (key, mask, offset).
34
35
36 NOTE 1. All the packets with IPv6 extension headers (but AH and ESP)
37 and all fragmented packets go to the best-effort traffic class.
38
39
40 NOTE 2. Two "port id"'s seems to be redundant, rfc2207 requires
41 only one "Generalized Port Identifier". So that for classic
42 ah, esp (and udp,tcp) both *pi should coincide or one of them
43 should be wildcard.
44
45 At first sight, this redundancy is just a waste of CPU
46 resources. But DPI and SPI add the possibility to assign different
47 priorities to GPIs. Look also at note 4 about tunnels below.
48
49
50 NOTE 3. One complication is the case of tunneled packets.
51 We implement it as follows: if the first lookup
52 matches a special session with "tunnelhdr" value not zero,
53 flowid doesn't contain the true flow ID, but the tunnel ID (1...255).
54 In this case, we pull tunnelhdr bytes and restart lookup
55 with tunnel ID added to the list of keys. Simple and stupid 8)8)
56 It's enough for PIMREG and IPIP.
57
58
59 NOTE 4. Two GPIs make it possible to parse even GRE packets.
60 F.e. DPI can select ETH_P_IP (and necessary flags to make
61 tunnelhdr correct) in GRE protocol field and SPI matches
62 GRE key. Is it not nice? 8)8)
63
64
65 Well, as a result, despite its simplicity, we get a pretty
66 powerful classification engine. */
67
Linus Torvalds1da177e2005-04-16 15:20:36 -070068
Eric Dumazetcc7ec452011-01-19 19:26:56 +000069struct rsvp_head {
Linus Torvalds1da177e2005-04-16 15:20:36 -070070 u32 tmap[256/32];
71 u32 hgenerator;
72 u8 tgenerator;
John Fastabendb929d862014-09-12 20:09:49 -070073 struct rsvp_session __rcu *ht[256];
74 struct rcu_head rcu;
Linus Torvalds1da177e2005-04-16 15:20:36 -070075};
76
Eric Dumazetcc7ec452011-01-19 19:26:56 +000077struct rsvp_session {
John Fastabendb929d862014-09-12 20:09:49 -070078 struct rsvp_session __rcu *next;
79 __be32 dst[RSVP_DST_LEN];
80 struct tc_rsvp_gpi dpi;
81 u8 protocol;
82 u8 tunnelid;
Linus Torvalds1da177e2005-04-16 15:20:36 -070083 /* 16 (src,sport) hash slots, and one wildcard source slot */
John Fastabendb929d862014-09-12 20:09:49 -070084 struct rsvp_filter __rcu *ht[16 + 1];
85 struct rcu_head rcu;
Linus Torvalds1da177e2005-04-16 15:20:36 -070086};
87
88
Eric Dumazetcc7ec452011-01-19 19:26:56 +000089struct rsvp_filter {
John Fastabendb929d862014-09-12 20:09:49 -070090 struct rsvp_filter __rcu *next;
91 __be32 src[RSVP_DST_LEN];
92 struct tc_rsvp_gpi spi;
93 u8 tunnelhdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -070094
John Fastabendb929d862014-09-12 20:09:49 -070095 struct tcf_result res;
96 struct tcf_exts exts;
Linus Torvalds1da177e2005-04-16 15:20:36 -070097
John Fastabendb929d862014-09-12 20:09:49 -070098 u32 handle;
99 struct rsvp_session *sess;
100 struct rcu_head rcu;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700101};
102
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000103static inline unsigned int hash_dst(__be32 *dst, u8 protocol, u8 tunnelid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700104{
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000105 unsigned int h = (__force __u32)dst[RSVP_DST_LEN - 1];
106
Linus Torvalds1da177e2005-04-16 15:20:36 -0700107 h ^= h>>16;
108 h ^= h>>8;
109 return (h ^ protocol ^ tunnelid) & 0xFF;
110}
111
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000112static inline unsigned int hash_src(__be32 *src)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700113{
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000114 unsigned int h = (__force __u32)src[RSVP_DST_LEN-1];
115
Linus Torvalds1da177e2005-04-16 15:20:36 -0700116 h ^= h>>16;
117 h ^= h>>8;
118 h ^= h>>4;
119 return h & 0xF;
120}
121
/*
 * Run the extensions attached to filter 'f' on 'skb'.
 *
 * Must be expanded directly inside a loop body of a function returning
 * int, with 'skb', 'f' and 'res' in scope: a negative result moves on to
 * the next loop iteration, a positive result is returned to the caller,
 * and zero falls through to the code after the macro.  The body is
 * deliberately a bare block rather than do { } while (0), which would
 * capture the 'continue'.
 */
#define RSVP_APPLY_RESULT()					\
{								\
	int rsvp_rc = tcf_exts_exec(skb, &f->exts, res);	\
								\
	if (rsvp_rc < 0)					\
		continue;					\
	if (rsvp_rc > 0)					\
		return rsvp_rc;					\
}
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900130
Eric Dumazetdc7f9f62011-07-05 23:25:42 +0000131static int rsvp_classify(struct sk_buff *skb, const struct tcf_proto *tp,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700132 struct tcf_result *res)
133{
John Fastabendb929d862014-09-12 20:09:49 -0700134 struct rsvp_head *head = rcu_dereference_bh(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700135 struct rsvp_session *s;
136 struct rsvp_filter *f;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000137 unsigned int h1, h2;
Al Viro66c6f522006-11-20 18:07:51 -0800138 __be32 *dst, *src;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700139 u8 protocol;
140 u8 tunnelid = 0;
141 u8 *xprt;
142#if RSVP_DST_LEN == 4
Changli Gao12dc96d2010-08-04 04:55:40 +0000143 struct ipv6hdr *nhptr;
144
145 if (!pskb_network_may_pull(skb, sizeof(*nhptr)))
146 return -1;
147 nhptr = ipv6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700148#else
Changli Gao12dc96d2010-08-04 04:55:40 +0000149 struct iphdr *nhptr;
150
151 if (!pskb_network_may_pull(skb, sizeof(*nhptr)))
152 return -1;
153 nhptr = ip_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700154#endif
155
156restart:
157
158#if RSVP_DST_LEN == 4
159 src = &nhptr->saddr.s6_addr32[0];
160 dst = &nhptr->daddr.s6_addr32[0];
161 protocol = nhptr->nexthdr;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000162 xprt = ((u8 *)nhptr) + sizeof(struct ipv6hdr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700163#else
164 src = &nhptr->saddr;
165 dst = &nhptr->daddr;
166 protocol = nhptr->protocol;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000167 xprt = ((u8 *)nhptr) + (nhptr->ihl<<2);
Paul Gortmaker56f8a752011-06-21 20:33:34 -0700168 if (ip_is_fragment(nhptr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700169 return -1;
170#endif
171
172 h1 = hash_dst(dst, protocol, tunnelid);
173 h2 = hash_src(src);
174
John Fastabendb929d862014-09-12 20:09:49 -0700175 for (s = rcu_dereference_bh(head->ht[h1]); s;
176 s = rcu_dereference_bh(s->next)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000177 if (dst[RSVP_DST_LEN-1] == s->dst[RSVP_DST_LEN - 1] &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700178 protocol == s->protocol &&
Joe Perchesf64f9e72009-11-29 16:55:45 -0800179 !(s->dpi.mask &
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000180 (*(u32 *)(xprt + s->dpi.offset) ^ s->dpi.key)) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700181#if RSVP_DST_LEN == 4
Joe Perchesf64f9e72009-11-29 16:55:45 -0800182 dst[0] == s->dst[0] &&
183 dst[1] == s->dst[1] &&
184 dst[2] == s->dst[2] &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700185#endif
Joe Perchesf64f9e72009-11-29 16:55:45 -0800186 tunnelid == s->tunnelid) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700187
John Fastabendb929d862014-09-12 20:09:49 -0700188 for (f = rcu_dereference_bh(s->ht[h2]); f;
189 f = rcu_dereference_bh(f->next)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000190 if (src[RSVP_DST_LEN-1] == f->src[RSVP_DST_LEN - 1] &&
191 !(f->spi.mask & (*(u32 *)(xprt + f->spi.offset) ^ f->spi.key))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700192#if RSVP_DST_LEN == 4
Joe Perchesf64f9e72009-11-29 16:55:45 -0800193 &&
194 src[0] == f->src[0] &&
195 src[1] == f->src[1] &&
196 src[2] == f->src[2]
Linus Torvalds1da177e2005-04-16 15:20:36 -0700197#endif
198 ) {
199 *res = f->res;
200 RSVP_APPLY_RESULT();
201
202matched:
203 if (f->tunnelhdr == 0)
204 return 0;
205
206 tunnelid = f->res.classid;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000207 nhptr = (void *)(xprt + f->tunnelhdr - sizeof(*nhptr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700208 goto restart;
209 }
210 }
211
212 /* And wildcard bucket... */
John Fastabendb929d862014-09-12 20:09:49 -0700213 for (f = rcu_dereference_bh(s->ht[16]); f;
214 f = rcu_dereference_bh(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700215 *res = f->res;
216 RSVP_APPLY_RESULT();
217 goto matched;
218 }
219 return -1;
220 }
221 }
222 return -1;
223}
224
John Fastabend53dfd502014-09-26 10:02:50 -0700225static void rsvp_replace(struct tcf_proto *tp, struct rsvp_filter *n, u32 h)
226{
227 struct rsvp_head *head = rtnl_dereference(tp->root);
228 struct rsvp_session *s;
229 struct rsvp_filter __rcu **ins;
230 struct rsvp_filter *pins;
231 unsigned int h1 = h & 0xFF;
232 unsigned int h2 = (h >> 8) & 0xFF;
233
234 for (s = rtnl_dereference(head->ht[h1]); s;
235 s = rtnl_dereference(s->next)) {
236 for (ins = &s->ht[h2], pins = rtnl_dereference(*ins); ;
237 ins = &pins->next, pins = rtnl_dereference(*ins)) {
238 if (pins->handle == h) {
239 RCU_INIT_POINTER(n->next, pins->next);
240 rcu_assign_pointer(*ins, n);
241 return;
242 }
243 }
244 }
245
246 /* Something went wrong if we are trying to replace a non-existant
247 * node. Mind as well halt instead of silently failing.
248 */
249 BUG_ON(1);
250}
251
Linus Torvalds1da177e2005-04-16 15:20:36 -0700252static unsigned long rsvp_get(struct tcf_proto *tp, u32 handle)
253{
John Fastabendb929d862014-09-12 20:09:49 -0700254 struct rsvp_head *head = rtnl_dereference(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255 struct rsvp_session *s;
256 struct rsvp_filter *f;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000257 unsigned int h1 = handle & 0xFF;
258 unsigned int h2 = (handle >> 8) & 0xFF;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700259
260 if (h2 > 16)
261 return 0;
262
John Fastabendb929d862014-09-12 20:09:49 -0700263 for (s = rtnl_dereference(head->ht[h1]); s;
264 s = rtnl_dereference(s->next)) {
265 for (f = rtnl_dereference(s->ht[h2]); f;
266 f = rtnl_dereference(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700267 if (f->handle == handle)
268 return (unsigned long)f;
269 }
270 }
271 return 0;
272}
273
Linus Torvalds1da177e2005-04-16 15:20:36 -0700274static int rsvp_init(struct tcf_proto *tp)
275{
276 struct rsvp_head *data;
277
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700278 data = kzalloc(sizeof(struct rsvp_head), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700279 if (data) {
John Fastabendb929d862014-09-12 20:09:49 -0700280 rcu_assign_pointer(tp->root, data);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700281 return 0;
282 }
283 return -ENOBUFS;
284}
285
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000286static void
Linus Torvalds1da177e2005-04-16 15:20:36 -0700287rsvp_delete_filter(struct tcf_proto *tp, struct rsvp_filter *f)
288{
289 tcf_unbind_filter(tp, &f->res);
WANG Cong18d02642014-09-25 10:26:37 -0700290 tcf_exts_destroy(&f->exts);
John Fastabendb929d862014-09-12 20:09:49 -0700291 kfree_rcu(f, rcu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700292}
293
Cong Wang1e052be2015-03-06 11:47:59 -0800294static bool rsvp_destroy(struct tcf_proto *tp, bool force)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700295{
John Fastabendb929d862014-09-12 20:09:49 -0700296 struct rsvp_head *data = rtnl_dereference(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297 int h1, h2;
298
299 if (data == NULL)
Cong Wang1e052be2015-03-06 11:47:59 -0800300 return true;
301
302 if (!force) {
303 for (h1 = 0; h1 < 256; h1++) {
304 if (rcu_access_pointer(data->ht[h1]))
305 return false;
306 }
307 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700308
John Fastabendb929d862014-09-12 20:09:49 -0700309 RCU_INIT_POINTER(tp->root, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700310
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000311 for (h1 = 0; h1 < 256; h1++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312 struct rsvp_session *s;
313
John Fastabendb929d862014-09-12 20:09:49 -0700314 while ((s = rtnl_dereference(data->ht[h1])) != NULL) {
315 RCU_INIT_POINTER(data->ht[h1], s->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700316
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000317 for (h2 = 0; h2 <= 16; h2++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700318 struct rsvp_filter *f;
319
John Fastabendb929d862014-09-12 20:09:49 -0700320 while ((f = rtnl_dereference(s->ht[h2])) != NULL) {
321 rcu_assign_pointer(s->ht[h2], f->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700322 rsvp_delete_filter(tp, f);
323 }
324 }
John Fastabendb929d862014-09-12 20:09:49 -0700325 kfree_rcu(s, rcu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700326 }
327 }
John Fastabendb929d862014-09-12 20:09:49 -0700328 kfree_rcu(data, rcu);
Cong Wang1e052be2015-03-06 11:47:59 -0800329 return true;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700330}
331
332static int rsvp_delete(struct tcf_proto *tp, unsigned long arg)
333{
John Fastabendb929d862014-09-12 20:09:49 -0700334 struct rsvp_head *head = rtnl_dereference(tp->root);
335 struct rsvp_filter *nfp, *f = (struct rsvp_filter *)arg;
336 struct rsvp_filter __rcu **fp;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000337 unsigned int h = f->handle;
John Fastabendb929d862014-09-12 20:09:49 -0700338 struct rsvp_session __rcu **sp;
339 struct rsvp_session *nsp, *s = f->sess;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700340 int i;
341
John Fastabendb929d862014-09-12 20:09:49 -0700342 fp = &s->ht[(h >> 8) & 0xFF];
343 for (nfp = rtnl_dereference(*fp); nfp;
344 fp = &nfp->next, nfp = rtnl_dereference(*fp)) {
345 if (nfp == f) {
346 RCU_INIT_POINTER(*fp, f->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700347 rsvp_delete_filter(tp, f);
348
349 /* Strip tree */
350
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000351 for (i = 0; i <= 16; i++)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700352 if (s->ht[i])
353 return 0;
354
355 /* OK, session has no flows */
John Fastabendb929d862014-09-12 20:09:49 -0700356 sp = &head->ht[h & 0xFF];
357 for (nsp = rtnl_dereference(*sp); nsp;
358 sp = &nsp->next, nsp = rtnl_dereference(*sp)) {
359 if (nsp == s) {
360 RCU_INIT_POINTER(*sp, s->next);
361 kfree_rcu(s, rcu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700362 return 0;
363 }
364 }
365
366 return 0;
367 }
368 }
369 return 0;
370}
371
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000372static unsigned int gen_handle(struct tcf_proto *tp, unsigned salt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700373{
John Fastabendb929d862014-09-12 20:09:49 -0700374 struct rsvp_head *data = rtnl_dereference(tp->root);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700375 int i = 0xFFFF;
376
377 while (i-- > 0) {
378 u32 h;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000379
Linus Torvalds1da177e2005-04-16 15:20:36 -0700380 if ((data->hgenerator += 0x10000) == 0)
381 data->hgenerator = 0x10000;
382 h = data->hgenerator|salt;
383 if (rsvp_get(tp, h) == 0)
384 return h;
385 }
386 return 0;
387}
388
389static int tunnel_bts(struct rsvp_head *data)
390{
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000391 int n = data->tgenerator >> 5;
392 u32 b = 1 << (data->tgenerator & 0x1F);
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900393
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000394 if (data->tmap[n] & b)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700395 return 0;
396 data->tmap[n] |= b;
397 return 1;
398}
399
400static void tunnel_recycle(struct rsvp_head *data)
401{
John Fastabendb929d862014-09-12 20:09:49 -0700402 struct rsvp_session __rcu **sht = data->ht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700403 u32 tmap[256/32];
404 int h1, h2;
405
406 memset(tmap, 0, sizeof(tmap));
407
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000408 for (h1 = 0; h1 < 256; h1++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700409 struct rsvp_session *s;
John Fastabendb929d862014-09-12 20:09:49 -0700410 for (s = rtnl_dereference(sht[h1]); s;
411 s = rtnl_dereference(s->next)) {
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000412 for (h2 = 0; h2 <= 16; h2++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700413 struct rsvp_filter *f;
414
John Fastabendb929d862014-09-12 20:09:49 -0700415 for (f = rtnl_dereference(s->ht[h2]); f;
416 f = rtnl_dereference(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417 if (f->tunnelhdr == 0)
418 continue;
419 data->tgenerator = f->res.classid;
420 tunnel_bts(data);
421 }
422 }
423 }
424 }
425
426 memcpy(data->tmap, tmap, sizeof(tmap));
427}
428
429static u32 gen_tunnel(struct rsvp_head *data)
430{
431 int i, k;
432
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000433 for (k = 0; k < 2; k++) {
434 for (i = 255; i > 0; i--) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700435 if (++data->tgenerator == 0)
436 data->tgenerator = 1;
437 if (tunnel_bts(data))
438 return data->tgenerator;
439 }
440 tunnel_recycle(data);
441 }
442 return 0;
443}
444
Patrick McHardy6fa8c012008-01-23 20:36:12 -0800445static const struct nla_policy rsvp_policy[TCA_RSVP_MAX + 1] = {
446 [TCA_RSVP_CLASSID] = { .type = NLA_U32 },
447 [TCA_RSVP_DST] = { .type = NLA_BINARY,
448 .len = RSVP_DST_LEN * sizeof(u32) },
449 [TCA_RSVP_SRC] = { .type = NLA_BINARY,
450 .len = RSVP_DST_LEN * sizeof(u32) },
451 [TCA_RSVP_PINFO] = { .len = sizeof(struct tc_rsvp_pinfo) },
452};
453
Benjamin LaHaisec1b52732013-01-14 05:15:39 +0000454static int rsvp_change(struct net *net, struct sk_buff *in_skb,
Eric W. Biedermanaf4c6642012-05-25 13:42:45 -0600455 struct tcf_proto *tp, unsigned long base,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700456 u32 handle,
Patrick McHardyadd93b62008-01-22 22:11:33 -0800457 struct nlattr **tca,
Cong Wang2f7ef2f2014-04-25 13:54:06 -0700458 unsigned long *arg, bool ovr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700459{
John Fastabendb929d862014-09-12 20:09:49 -0700460 struct rsvp_head *data = rtnl_dereference(tp->root);
461 struct rsvp_filter *f, *nfp;
462 struct rsvp_filter __rcu **fp;
463 struct rsvp_session *nsp, *s;
464 struct rsvp_session __rcu **sp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700465 struct tc_rsvp_pinfo *pinfo = NULL;
Igor Maravić27e95a82011-08-30 03:12:55 +0000466 struct nlattr *opt = tca[TCA_OPTIONS];
Patrick McHardyadd93b62008-01-22 22:11:33 -0800467 struct nlattr *tb[TCA_RSVP_MAX + 1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700468 struct tcf_exts e;
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000469 unsigned int h1, h2;
Al Viro66c6f522006-11-20 18:07:51 -0800470 __be32 *dst;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700471 int err;
472
473 if (opt == NULL)
474 return handle ? -EINVAL : 0;
475
Patrick McHardy6fa8c012008-01-23 20:36:12 -0800476 err = nla_parse_nested(tb, TCA_RSVP_MAX, opt, rsvp_policy);
Patrick McHardycee63722008-01-23 20:33:32 -0800477 if (err < 0)
478 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700479
WANG Cong5da57f42013-12-15 20:15:07 -0800480 tcf_exts_init(&e, TCA_RSVP_ACT, TCA_RSVP_POLICE);
Cong Wang2f7ef2f2014-04-25 13:54:06 -0700481 err = tcf_exts_validate(net, tp, tb, tca[TCA_RATE], &e, ovr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700482 if (err < 0)
483 return err;
484
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000485 f = (struct rsvp_filter *)*arg;
486 if (f) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700487 /* Node exists: adjust only classid */
John Fastabend53dfd502014-09-26 10:02:50 -0700488 struct rsvp_filter *n;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700489
490 if (f->handle != handle && handle)
491 goto errout2;
John Fastabend53dfd502014-09-26 10:02:50 -0700492
493 n = kmemdup(f, sizeof(*f), GFP_KERNEL);
494 if (!n) {
495 err = -ENOMEM;
496 goto errout2;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700497 }
498
John Fastabend53dfd502014-09-26 10:02:50 -0700499 tcf_exts_init(&n->exts, TCA_RSVP_ACT, TCA_RSVP_POLICE);
500
501 if (tb[TCA_RSVP_CLASSID]) {
502 n->res.classid = nla_get_u32(tb[TCA_RSVP_CLASSID]);
503 tcf_bind_filter(tp, &n->res, base);
504 }
505
506 tcf_exts_change(tp, &n->exts, &e);
507 rsvp_replace(tp, n, handle);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508 return 0;
509 }
510
511 /* Now more serious part... */
512 err = -EINVAL;
513 if (handle)
514 goto errout2;
Igor Maravić27e95a82011-08-30 03:12:55 +0000515 if (tb[TCA_RSVP_DST] == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700516 goto errout2;
517
518 err = -ENOBUFS;
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700519 f = kzalloc(sizeof(struct rsvp_filter), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700520 if (f == NULL)
521 goto errout2;
522
WANG Cong5da57f42013-12-15 20:15:07 -0800523 tcf_exts_init(&f->exts, TCA_RSVP_ACT, TCA_RSVP_POLICE);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700524 h2 = 16;
Igor Maravić27e95a82011-08-30 03:12:55 +0000525 if (tb[TCA_RSVP_SRC]) {
526 memcpy(f->src, nla_data(tb[TCA_RSVP_SRC]), sizeof(f->src));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700527 h2 = hash_src(f->src);
528 }
Igor Maravić27e95a82011-08-30 03:12:55 +0000529 if (tb[TCA_RSVP_PINFO]) {
530 pinfo = nla_data(tb[TCA_RSVP_PINFO]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700531 f->spi = pinfo->spi;
532 f->tunnelhdr = pinfo->tunnelhdr;
533 }
Igor Maravić27e95a82011-08-30 03:12:55 +0000534 if (tb[TCA_RSVP_CLASSID])
535 f->res.classid = nla_get_u32(tb[TCA_RSVP_CLASSID]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700536
Igor Maravić27e95a82011-08-30 03:12:55 +0000537 dst = nla_data(tb[TCA_RSVP_DST]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700538 h1 = hash_dst(dst, pinfo ? pinfo->protocol : 0, pinfo ? pinfo->tunnelid : 0);
539
540 err = -ENOMEM;
541 if ((f->handle = gen_handle(tp, h1 | (h2<<8))) == 0)
542 goto errout;
543
544 if (f->tunnelhdr) {
545 err = -EINVAL;
546 if (f->res.classid > 255)
547 goto errout;
548
549 err = -ENOMEM;
550 if (f->res.classid == 0 &&
551 (f->res.classid = gen_tunnel(data)) == 0)
552 goto errout;
553 }
554
John Fastabendb929d862014-09-12 20:09:49 -0700555 for (sp = &data->ht[h1];
556 (s = rtnl_dereference(*sp)) != NULL;
557 sp = &s->next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700558 if (dst[RSVP_DST_LEN-1] == s->dst[RSVP_DST_LEN-1] &&
559 pinfo && pinfo->protocol == s->protocol &&
Joe Perchesf64f9e72009-11-29 16:55:45 -0800560 memcmp(&pinfo->dpi, &s->dpi, sizeof(s->dpi)) == 0 &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700561#if RSVP_DST_LEN == 4
Joe Perchesf64f9e72009-11-29 16:55:45 -0800562 dst[0] == s->dst[0] &&
563 dst[1] == s->dst[1] &&
564 dst[2] == s->dst[2] &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700565#endif
Joe Perchesf64f9e72009-11-29 16:55:45 -0800566 pinfo->tunnelid == s->tunnelid) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700567
568insert:
569 /* OK, we found appropriate session */
570
571 fp = &s->ht[h2];
572
573 f->sess = s;
574 if (f->tunnelhdr == 0)
575 tcf_bind_filter(tp, &f->res, base);
576
577 tcf_exts_change(tp, &f->exts, &e);
578
John Fastabendb929d862014-09-12 20:09:49 -0700579 fp = &s->ht[h2];
580 for (nfp = rtnl_dereference(*fp); nfp;
581 fp = &nfp->next, nfp = rtnl_dereference(*fp)) {
582 __u32 mask = nfp->spi.mask & f->spi.mask;
583
584 if (mask != f->spi.mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700585 break;
John Fastabendb929d862014-09-12 20:09:49 -0700586 }
587 RCU_INIT_POINTER(f->next, nfp);
588 rcu_assign_pointer(*fp, f);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700589
590 *arg = (unsigned long)f;
591 return 0;
592 }
593 }
594
595 /* No session found. Create new one. */
596
597 err = -ENOBUFS;
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700598 s = kzalloc(sizeof(struct rsvp_session), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700599 if (s == NULL)
600 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700601 memcpy(s->dst, dst, sizeof(s->dst));
602
603 if (pinfo) {
604 s->dpi = pinfo->dpi;
605 s->protocol = pinfo->protocol;
606 s->tunnelid = pinfo->tunnelid;
607 }
John Fastabendb929d862014-09-12 20:09:49 -0700608 sp = &data->ht[h1];
609 for (nsp = rtnl_dereference(*sp); nsp;
610 sp = &nsp->next, nsp = rtnl_dereference(*sp)) {
611 if ((nsp->dpi.mask & s->dpi.mask) != s->dpi.mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700612 break;
613 }
John Fastabendb929d862014-09-12 20:09:49 -0700614 RCU_INIT_POINTER(s->next, nsp);
615 rcu_assign_pointer(*sp, s);
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900616
Linus Torvalds1da177e2005-04-16 15:20:36 -0700617 goto insert;
618
619errout:
Jesper Juhla51482b2005-11-08 09:41:34 -0800620 kfree(f);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700621errout2:
WANG Cong18d02642014-09-25 10:26:37 -0700622 tcf_exts_destroy(&e);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700623 return err;
624}
625
626static void rsvp_walk(struct tcf_proto *tp, struct tcf_walker *arg)
627{
John Fastabendb929d862014-09-12 20:09:49 -0700628 struct rsvp_head *head = rtnl_dereference(tp->root);
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000629 unsigned int h, h1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700630
631 if (arg->stop)
632 return;
633
634 for (h = 0; h < 256; h++) {
635 struct rsvp_session *s;
636
John Fastabendb929d862014-09-12 20:09:49 -0700637 for (s = rtnl_dereference(head->ht[h]); s;
638 s = rtnl_dereference(s->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700639 for (h1 = 0; h1 <= 16; h1++) {
640 struct rsvp_filter *f;
641
John Fastabendb929d862014-09-12 20:09:49 -0700642 for (f = rtnl_dereference(s->ht[h1]); f;
643 f = rtnl_dereference(f->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700644 if (arg->count < arg->skip) {
645 arg->count++;
646 continue;
647 }
648 if (arg->fn(tp, (unsigned long)f, arg) < 0) {
649 arg->stop = 1;
650 return;
651 }
652 arg->count++;
653 }
654 }
655 }
656 }
657}
658
WANG Cong832d1d52014-01-09 16:14:01 -0800659static int rsvp_dump(struct net *net, struct tcf_proto *tp, unsigned long fh,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700660 struct sk_buff *skb, struct tcmsg *t)
661{
Eric Dumazetcc7ec452011-01-19 19:26:56 +0000662 struct rsvp_filter *f = (struct rsvp_filter *)fh;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700663 struct rsvp_session *s;
Patrick McHardy4b3550ef2008-01-23 20:34:11 -0800664 struct nlattr *nest;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700665 struct tc_rsvp_pinfo pinfo;
666
667 if (f == NULL)
668 return skb->len;
669 s = f->sess;
670
671 t->tcm_handle = f->handle;
672
Patrick McHardy4b3550ef2008-01-23 20:34:11 -0800673 nest = nla_nest_start(skb, TCA_OPTIONS);
674 if (nest == NULL)
675 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700676
David S. Miller1b34ec42012-03-29 05:11:39 -0400677 if (nla_put(skb, TCA_RSVP_DST, sizeof(s->dst), &s->dst))
678 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700679 pinfo.dpi = s->dpi;
680 pinfo.spi = f->spi;
681 pinfo.protocol = s->protocol;
682 pinfo.tunnelid = s->tunnelid;
683 pinfo.tunnelhdr = f->tunnelhdr;
Patrick McHardy8a470772005-06-28 12:56:45 -0700684 pinfo.pad = 0;
David S. Miller1b34ec42012-03-29 05:11:39 -0400685 if (nla_put(skb, TCA_RSVP_PINFO, sizeof(pinfo), &pinfo))
686 goto nla_put_failure;
687 if (f->res.classid &&
688 nla_put_u32(skb, TCA_RSVP_CLASSID, f->res.classid))
689 goto nla_put_failure;
690 if (((f->handle >> 8) & 0xFF) != 16 &&
691 nla_put(skb, TCA_RSVP_SRC, sizeof(f->src), f->src))
692 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700693
WANG Cong5da57f42013-12-15 20:15:07 -0800694 if (tcf_exts_dump(skb, &f->exts) < 0)
Patrick McHardyadd93b62008-01-22 22:11:33 -0800695 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700696
Patrick McHardy4b3550ef2008-01-23 20:34:11 -0800697 nla_nest_end(skb, nest);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700698
WANG Cong5da57f42013-12-15 20:15:07 -0800699 if (tcf_exts_dump_stats(skb, &f->exts) < 0)
Patrick McHardyadd93b62008-01-22 22:11:33 -0800700 goto nla_put_failure;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700701 return skb->len;
702
Patrick McHardyadd93b62008-01-22 22:11:33 -0800703nla_put_failure:
Jiri Pirko6ea3b442014-12-09 22:23:29 +0100704 nla_nest_cancel(skb, nest);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700705 return -1;
706}
707
Igor Maravić27e95a82011-08-30 03:12:55 +0000708static struct tcf_proto_ops RSVP_OPS __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700709 .kind = RSVP_ID,
710 .classify = rsvp_classify,
711 .init = rsvp_init,
712 .destroy = rsvp_destroy,
713 .get = rsvp_get,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700714 .change = rsvp_change,
715 .delete = rsvp_delete,
716 .walk = rsvp_walk,
717 .dump = rsvp_dump,
718 .owner = THIS_MODULE,
719};
720
721static int __init init_rsvp(void)
722{
723 return register_tcf_proto_ops(&RSVP_OPS);
724}
725
YOSHIFUJI Hideaki10297b92007-02-09 23:25:16 +0900726static void __exit exit_rsvp(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700727{
728 unregister_tcf_proto_ops(&RSVP_OPS);
729}
730
731module_init(init_rsvp)
732module_exit(exit_rsvp)