blob: 1010b469d7d3440a4f9980c13bfaf280fd6a3e0e [file] [log] [blame]
Robert Olsson19baf832005-06-21 12:43:18 -07001/*
2 * This program is free software; you can redistribute it and/or
3 * modify it under the terms of the GNU General Public License
4 * as published by the Free Software Foundation; either version
5 * 2 of the License, or (at your option) any later version.
6 *
7 * Robert Olsson <robert.olsson@its.uu.se> Uppsala Universitet
8 * & Swedish University of Agricultural Sciences.
9 *
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090010 * Jens Laas <jens.laas@data.slu.se> Swedish University of
Robert Olsson19baf832005-06-21 12:43:18 -070011 * Agricultural Sciences.
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090012 *
Robert Olsson19baf832005-06-21 12:43:18 -070013 * Hans Liss <hans.liss@its.uu.se> Uppsala Universitet
14 *
15 * This work is based on the LPC-trie which is originally descibed in:
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090016 *
Robert Olsson19baf832005-06-21 12:43:18 -070017 * An experimental study of compression methods for dynamic tries
18 * Stefan Nilsson and Matti Tikkanen. Algorithmica, 33(1):19-33, 2002.
19 * http://www.nada.kth.se/~snilsson/public/papers/dyntrie2/
20 *
21 *
22 * IP-address lookup using LC-tries. Stefan Nilsson and Gunnar Karlsson
23 * IEEE Journal on Selected Areas in Communications, 17(6):1083-1092, June 1999
24 *
25 * Version: $Id: fib_trie.c,v 1.3 2005/06/08 14:20:01 robert Exp $
26 *
27 *
28 * Code from fib_hash has been reused which includes the following header:
29 *
30 *
31 * INET An implementation of the TCP/IP protocol suite for the LINUX
32 * operating system. INET is implemented using the BSD Socket
33 * interface as the means of communication with the user level.
34 *
35 * IPv4 FIB: lookup engine and maintenance routines.
36 *
37 *
38 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
39 *
40 * This program is free software; you can redistribute it and/or
41 * modify it under the terms of the GNU General Public License
42 * as published by the Free Software Foundation; either version
43 * 2 of the License, or (at your option) any later version.
Robert Olssonfd966252005-12-22 11:25:10 -080044 *
45 * Substantial contributions to this work comes from:
46 *
47 * David S. Miller, <davem@davemloft.net>
48 * Stephen Hemminger <shemminger@osdl.org>
49 * Paul E. McKenney <paulmck@us.ibm.com>
50 * Patrick McHardy <kaber@trash.net>
Robert Olsson19baf832005-06-21 12:43:18 -070051 */
52
Robert Olsson05eee482007-03-19 16:27:37 -070053#define VERSION "0.408"
Robert Olsson19baf832005-06-21 12:43:18 -070054
Robert Olsson19baf832005-06-21 12:43:18 -070055#include <asm/uaccess.h>
56#include <asm/system.h>
Jiri Slaby1977f032007-10-18 23:40:25 -070057#include <linux/bitops.h>
Robert Olsson19baf832005-06-21 12:43:18 -070058#include <linux/types.h>
59#include <linux/kernel.h>
Robert Olsson19baf832005-06-21 12:43:18 -070060#include <linux/mm.h>
61#include <linux/string.h>
62#include <linux/socket.h>
63#include <linux/sockios.h>
64#include <linux/errno.h>
65#include <linux/in.h>
66#include <linux/inet.h>
Stephen Hemmingercd8787a2006-01-03 14:38:34 -080067#include <linux/inetdevice.h>
Robert Olsson19baf832005-06-21 12:43:18 -070068#include <linux/netdevice.h>
69#include <linux/if_arp.h>
70#include <linux/proc_fs.h>
Robert Olsson2373ce12005-08-25 13:01:29 -070071#include <linux/rcupdate.h>
Robert Olsson19baf832005-06-21 12:43:18 -070072#include <linux/skbuff.h>
73#include <linux/netlink.h>
74#include <linux/init.h>
75#include <linux/list.h>
Eric W. Biederman457c4cb2007-09-12 12:01:34 +020076#include <net/net_namespace.h>
Robert Olsson19baf832005-06-21 12:43:18 -070077#include <net/ip.h>
78#include <net/protocol.h>
79#include <net/route.h>
80#include <net/tcp.h>
81#include <net/sock.h>
82#include <net/ip_fib.h>
83#include "fib_lookup.h"
84
85#undef CONFIG_IP_FIB_TRIE_STATS
Robert Olsson06ef9212006-03-20 21:35:01 -080086#define MAX_STAT_DEPTH 32
Robert Olsson19baf832005-06-21 12:43:18 -070087
Robert Olsson19baf832005-06-21 12:43:18 -070088#define KEYLENGTH (8*sizeof(t_key))
Robert Olsson19baf832005-06-21 12:43:18 -070089
Robert Olsson19baf832005-06-21 12:43:18 -070090typedef unsigned int t_key;
91
92#define T_TNODE 0
93#define T_LEAF 1
94#define NODE_TYPE_MASK 0x1UL
Robert Olsson2373ce12005-08-25 13:01:29 -070095#define NODE_TYPE(node) ((node)->parent & NODE_TYPE_MASK)
96
Olof Johansson91b9a272005-08-09 20:24:39 -070097#define IS_TNODE(n) (!(n->parent & T_LEAF))
98#define IS_LEAF(n) (n->parent & T_LEAF)
Robert Olsson19baf832005-06-21 12:43:18 -070099
100struct node {
Olof Johansson91b9a272005-08-09 20:24:39 -0700101 t_key key;
102 unsigned long parent;
Robert Olsson19baf832005-06-21 12:43:18 -0700103};
104
105struct leaf {
Olof Johansson91b9a272005-08-09 20:24:39 -0700106 t_key key;
107 unsigned long parent;
Robert Olsson19baf832005-06-21 12:43:18 -0700108 struct hlist_head list;
Robert Olsson2373ce12005-08-25 13:01:29 -0700109 struct rcu_head rcu;
Robert Olsson19baf832005-06-21 12:43:18 -0700110};
111
112struct leaf_info {
113 struct hlist_node hlist;
Robert Olsson2373ce12005-08-25 13:01:29 -0700114 struct rcu_head rcu;
Robert Olsson19baf832005-06-21 12:43:18 -0700115 int plen;
116 struct list_head falh;
117};
118
119struct tnode {
Olof Johansson91b9a272005-08-09 20:24:39 -0700120 t_key key;
121 unsigned long parent;
122 unsigned short pos:5; /* 2log(KEYLENGTH) bits needed */
123 unsigned short bits:5; /* 2log(KEYLENGTH) bits needed */
124 unsigned short full_children; /* KEYLENGTH bits needed */
125 unsigned short empty_children; /* KEYLENGTH bits needed */
Robert Olsson2373ce12005-08-25 13:01:29 -0700126 struct rcu_head rcu;
Olof Johansson91b9a272005-08-09 20:24:39 -0700127 struct node *child[0];
Robert Olsson19baf832005-06-21 12:43:18 -0700128};
129
130#ifdef CONFIG_IP_FIB_TRIE_STATS
131struct trie_use_stats {
132 unsigned int gets;
133 unsigned int backtrack;
134 unsigned int semantic_match_passed;
135 unsigned int semantic_match_miss;
136 unsigned int null_node_hit;
Robert Olsson2f368952005-07-05 15:02:40 -0700137 unsigned int resize_node_skipped;
Robert Olsson19baf832005-06-21 12:43:18 -0700138};
139#endif
140
141struct trie_stat {
142 unsigned int totdepth;
143 unsigned int maxdepth;
144 unsigned int tnodes;
145 unsigned int leaves;
146 unsigned int nullpointers;
Robert Olsson06ef9212006-03-20 21:35:01 -0800147 unsigned int nodesizes[MAX_STAT_DEPTH];
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700148};
Robert Olsson19baf832005-06-21 12:43:18 -0700149
150struct trie {
Olof Johansson91b9a272005-08-09 20:24:39 -0700151 struct node *trie;
Robert Olsson19baf832005-06-21 12:43:18 -0700152#ifdef CONFIG_IP_FIB_TRIE_STATS
153 struct trie_use_stats stats;
154#endif
Olof Johansson91b9a272005-08-09 20:24:39 -0700155 int size;
Robert Olsson19baf832005-06-21 12:43:18 -0700156 unsigned int revision;
157};
158
Robert Olsson19baf832005-06-21 12:43:18 -0700159static void put_child(struct trie *t, struct tnode *tn, int i, struct node *n);
160static void tnode_put_child_reorg(struct tnode *tn, int i, struct node *n, int wasfull);
Robert Olsson19baf832005-06-21 12:43:18 -0700161static struct node *resize(struct trie *t, struct tnode *tn);
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700162static struct tnode *inflate(struct trie *t, struct tnode *tn);
163static struct tnode *halve(struct trie *t, struct tnode *tn);
Robert Olsson19baf832005-06-21 12:43:18 -0700164static void tnode_free(struct tnode *tn);
Robert Olsson19baf832005-06-21 12:43:18 -0700165
Christoph Lametere18b8902006-12-06 20:33:20 -0800166static struct kmem_cache *fn_alias_kmem __read_mostly;
Robert Olsson19baf832005-06-21 12:43:18 -0700167static struct trie *trie_local = NULL, *trie_main = NULL;
168
Stephen Hemminger06801912007-08-10 15:22:13 -0700169static inline struct tnode *node_parent(struct node *node)
170{
171 struct tnode *ret;
172
173 ret = (struct tnode *)(node->parent & ~NODE_TYPE_MASK);
174 return rcu_dereference(ret);
175}
176
177static inline void node_set_parent(struct node *node, struct tnode *ptr)
178{
179 rcu_assign_pointer(node->parent,
180 (unsigned long)ptr | NODE_TYPE(node));
181}
Robert Olsson2373ce12005-08-25 13:01:29 -0700182
183/* rcu_read_lock needs to be hold by caller from readside */
184
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700185static inline struct node *tnode_get_child(struct tnode *tn, int i)
Robert Olsson19baf832005-06-21 12:43:18 -0700186{
Olof Johansson91b9a272005-08-09 20:24:39 -0700187 BUG_ON(i >= 1 << tn->bits);
Robert Olsson19baf832005-06-21 12:43:18 -0700188
Robert Olsson2373ce12005-08-25 13:01:29 -0700189 return rcu_dereference(tn->child[i]);
Robert Olsson19baf832005-06-21 12:43:18 -0700190}
191
Stephen Hemmignerbb435b82005-08-09 20:25:39 -0700192static inline int tnode_child_length(const struct tnode *tn)
Robert Olsson19baf832005-06-21 12:43:18 -0700193{
Olof Johansson91b9a272005-08-09 20:24:39 -0700194 return 1 << tn->bits;
Robert Olsson19baf832005-06-21 12:43:18 -0700195}
196
Stephen Hemmingerab66b4a2007-08-10 15:22:58 -0700197static inline t_key mask_pfx(t_key k, unsigned short l)
198{
199 return (l == 0) ? 0 : k >> (KEYLENGTH-l) << (KEYLENGTH-l);
200}
201
Robert Olsson19baf832005-06-21 12:43:18 -0700202static inline t_key tkey_extract_bits(t_key a, int offset, int bits)
203{
Olof Johansson91b9a272005-08-09 20:24:39 -0700204 if (offset < KEYLENGTH)
Robert Olsson19baf832005-06-21 12:43:18 -0700205 return ((t_key)(a << offset)) >> (KEYLENGTH - bits);
Olof Johansson91b9a272005-08-09 20:24:39 -0700206 else
Robert Olsson19baf832005-06-21 12:43:18 -0700207 return 0;
208}
209
210static inline int tkey_equals(t_key a, t_key b)
211{
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700212 return a == b;
Robert Olsson19baf832005-06-21 12:43:18 -0700213}
214
215static inline int tkey_sub_equals(t_key a, int offset, int bits, t_key b)
216{
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700217 if (bits == 0 || offset >= KEYLENGTH)
218 return 1;
Olof Johansson91b9a272005-08-09 20:24:39 -0700219 bits = bits > KEYLENGTH ? KEYLENGTH : bits;
220 return ((a ^ b) << offset) >> (KEYLENGTH - bits) == 0;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700221}
Robert Olsson19baf832005-06-21 12:43:18 -0700222
223static inline int tkey_mismatch(t_key a, int offset, t_key b)
224{
225 t_key diff = a ^ b;
226 int i = offset;
227
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700228 if (!diff)
229 return 0;
230 while ((diff << i) >> (KEYLENGTH-1) == 0)
Robert Olsson19baf832005-06-21 12:43:18 -0700231 i++;
232 return i;
233}
234
Robert Olsson19baf832005-06-21 12:43:18 -0700235/*
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900236 To understand this stuff, an understanding of keys and all their bits is
237 necessary. Every node in the trie has a key associated with it, but not
Robert Olsson19baf832005-06-21 12:43:18 -0700238 all of the bits in that key are significant.
239
240 Consider a node 'n' and its parent 'tp'.
241
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900242 If n is a leaf, every bit in its key is significant. Its presence is
243 necessitated by path compression, since during a tree traversal (when
244 searching for a leaf - unless we are doing an insertion) we will completely
245 ignore all skipped bits we encounter. Thus we need to verify, at the end of
246 a potentially successful search, that we have indeed been walking the
Robert Olsson19baf832005-06-21 12:43:18 -0700247 correct key path.
248
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900249 Note that we can never "miss" the correct key in the tree if present by
250 following the wrong path. Path compression ensures that segments of the key
251 that are the same for all keys with a given prefix are skipped, but the
252 skipped part *is* identical for each node in the subtrie below the skipped
253 bit! trie_insert() in this implementation takes care of that - note the
Robert Olsson19baf832005-06-21 12:43:18 -0700254 call to tkey_sub_equals() in trie_insert().
255
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900256 if n is an internal node - a 'tnode' here, the various parts of its key
Robert Olsson19baf832005-06-21 12:43:18 -0700257 have many different meanings.
258
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900259 Example:
Robert Olsson19baf832005-06-21 12:43:18 -0700260 _________________________________________________________________
261 | i | i | i | i | i | i | i | N | N | N | S | S | S | S | S | C |
262 -----------------------------------------------------------------
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900263 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
Robert Olsson19baf832005-06-21 12:43:18 -0700264
265 _________________________________________________________________
266 | C | C | C | u | u | u | u | u | u | u | u | u | u | u | u | u |
267 -----------------------------------------------------------------
268 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31
269
270 tp->pos = 7
271 tp->bits = 3
272 n->pos = 15
Olof Johansson91b9a272005-08-09 20:24:39 -0700273 n->bits = 4
Robert Olsson19baf832005-06-21 12:43:18 -0700274
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900275 First, let's just ignore the bits that come before the parent tp, that is
276 the bits from 0 to (tp->pos-1). They are *known* but at this point we do
Robert Olsson19baf832005-06-21 12:43:18 -0700277 not use them for anything.
278
279 The bits from (tp->pos) to (tp->pos + tp->bits - 1) - "N", above - are the
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900280 index into the parent's child array. That is, they will be used to find
Robert Olsson19baf832005-06-21 12:43:18 -0700281 'n' among tp's children.
282
283 The bits from (tp->pos + tp->bits) to (n->pos - 1) - "S" - are skipped bits
284 for the node n.
285
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900286 All the bits we have seen so far are significant to the node n. The rest
Robert Olsson19baf832005-06-21 12:43:18 -0700287 of the bits are really not needed or indeed known in n->key.
288
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900289 The bits from (n->pos) to (n->pos + n->bits - 1) - "C" - are the index into
Robert Olsson19baf832005-06-21 12:43:18 -0700290 n's child array, and will of course be different for each child.
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900291
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700292
Robert Olsson19baf832005-06-21 12:43:18 -0700293 The rest of the bits, from (n->pos + n->bits) onward, are completely unknown
294 at this point.
295
296*/
297
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700298static inline void check_tnode(const struct tnode *tn)
Robert Olsson19baf832005-06-21 12:43:18 -0700299{
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700300 WARN_ON(tn && tn->pos+tn->bits > 32);
Robert Olsson19baf832005-06-21 12:43:18 -0700301}
302
303static int halve_threshold = 25;
304static int inflate_threshold = 50;
Robert Olsson965ffea2007-03-19 16:29:58 -0700305static int halve_threshold_root = 8;
306static int inflate_threshold_root = 15;
Robert Olsson19baf832005-06-21 12:43:18 -0700307
Robert Olsson2373ce12005-08-25 13:01:29 -0700308
309static void __alias_free_mem(struct rcu_head *head)
310{
311 struct fib_alias *fa = container_of(head, struct fib_alias, rcu);
312 kmem_cache_free(fn_alias_kmem, fa);
313}
314
315static inline void alias_free_mem_rcu(struct fib_alias *fa)
316{
317 call_rcu(&fa->rcu, __alias_free_mem);
318}
319
320static void __leaf_free_rcu(struct rcu_head *head)
321{
322 kfree(container_of(head, struct leaf, rcu));
323}
324
Robert Olsson2373ce12005-08-25 13:01:29 -0700325static void __leaf_info_free_rcu(struct rcu_head *head)
326{
327 kfree(container_of(head, struct leaf_info, rcu));
328}
329
330static inline void free_leaf_info(struct leaf_info *leaf)
331{
332 call_rcu(&leaf->rcu, __leaf_info_free_rcu);
333}
334
335static struct tnode *tnode_alloc(unsigned int size)
336{
337 struct page *pages;
338
339 if (size <= PAGE_SIZE)
340 return kcalloc(size, 1, GFP_KERNEL);
341
342 pages = alloc_pages(GFP_KERNEL|__GFP_ZERO, get_order(size));
343 if (!pages)
344 return NULL;
345
346 return page_address(pages);
347}
348
349static void __tnode_free_rcu(struct rcu_head *head)
350{
351 struct tnode *tn = container_of(head, struct tnode, rcu);
352 unsigned int size = sizeof(struct tnode) +
353 (1 << tn->bits) * sizeof(struct node *);
354
355 if (size <= PAGE_SIZE)
356 kfree(tn);
357 else
358 free_pages((unsigned long)tn, get_order(size));
359}
360
361static inline void tnode_free(struct tnode *tn)
362{
Stephen Hemminger132adf52007-03-08 20:44:43 -0800363 if (IS_LEAF(tn)) {
Robert Olsson550e29b2006-04-04 12:53:35 -0700364 struct leaf *l = (struct leaf *) tn;
365 call_rcu_bh(&l->rcu, __leaf_free_rcu);
Stephen Hemminger132adf52007-03-08 20:44:43 -0800366 } else
Robert Olsson550e29b2006-04-04 12:53:35 -0700367 call_rcu(&tn->rcu, __tnode_free_rcu);
Robert Olsson2373ce12005-08-25 13:01:29 -0700368}
369
Robert Olsson19baf832005-06-21 12:43:18 -0700370static struct leaf *leaf_new(void)
371{
372 struct leaf *l = kmalloc(sizeof(struct leaf), GFP_KERNEL);
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700373 if (l) {
Robert Olsson2373ce12005-08-25 13:01:29 -0700374 l->parent = T_LEAF;
Robert Olsson19baf832005-06-21 12:43:18 -0700375 INIT_HLIST_HEAD(&l->list);
376 }
377 return l;
378}
379
380static struct leaf_info *leaf_info_new(int plen)
381{
382 struct leaf_info *li = kmalloc(sizeof(struct leaf_info), GFP_KERNEL);
Robert Olsson2373ce12005-08-25 13:01:29 -0700383 if (li) {
384 li->plen = plen;
385 INIT_LIST_HEAD(&li->falh);
Patrick McHardyf0e36f82005-07-05 14:44:55 -0700386 }
Robert Olsson2373ce12005-08-25 13:01:29 -0700387 return li;
Patrick McHardyf0e36f82005-07-05 14:44:55 -0700388}
389
Robert Olsson19baf832005-06-21 12:43:18 -0700390static struct tnode* tnode_new(t_key key, int pos, int bits)
391{
392 int nchildren = 1<<bits;
393 int sz = sizeof(struct tnode) + nchildren * sizeof(struct node *);
Patrick McHardyf0e36f82005-07-05 14:44:55 -0700394 struct tnode *tn = tnode_alloc(sz);
Robert Olsson19baf832005-06-21 12:43:18 -0700395
Olof Johansson91b9a272005-08-09 20:24:39 -0700396 if (tn) {
Robert Olsson19baf832005-06-21 12:43:18 -0700397 memset(tn, 0, sz);
Robert Olsson2373ce12005-08-25 13:01:29 -0700398 tn->parent = T_TNODE;
Robert Olsson19baf832005-06-21 12:43:18 -0700399 tn->pos = pos;
400 tn->bits = bits;
401 tn->key = key;
402 tn->full_children = 0;
403 tn->empty_children = 1<<bits;
404 }
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700405
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700406 pr_debug("AT %p s=%u %u\n", tn, (unsigned int) sizeof(struct tnode),
407 (unsigned int) (sizeof(struct node) * 1<<bits));
Robert Olsson19baf832005-06-21 12:43:18 -0700408 return tn;
409}
410
Robert Olsson19baf832005-06-21 12:43:18 -0700411/*
412 * Check whether a tnode 'n' is "full", i.e. it is an internal node
413 * and no bits are skipped. See discussion in dyntree paper p. 6
414 */
415
Stephen Hemmignerbb435b82005-08-09 20:25:39 -0700416static inline int tnode_full(const struct tnode *tn, const struct node *n)
Robert Olsson19baf832005-06-21 12:43:18 -0700417{
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700418 if (n == NULL || IS_LEAF(n))
Robert Olsson19baf832005-06-21 12:43:18 -0700419 return 0;
420
421 return ((struct tnode *) n)->pos == tn->pos + tn->bits;
422}
423
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700424static inline void put_child(struct trie *t, struct tnode *tn, int i, struct node *n)
Robert Olsson19baf832005-06-21 12:43:18 -0700425{
426 tnode_put_child_reorg(tn, i, n, -1);
427}
428
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700429 /*
Robert Olsson19baf832005-06-21 12:43:18 -0700430 * Add a child at position i overwriting the old value.
431 * Update the value of full_children and empty_children.
432 */
433
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700434static void tnode_put_child_reorg(struct tnode *tn, int i, struct node *n, int wasfull)
Robert Olsson19baf832005-06-21 12:43:18 -0700435{
Robert Olsson2373ce12005-08-25 13:01:29 -0700436 struct node *chi = tn->child[i];
Robert Olsson19baf832005-06-21 12:43:18 -0700437 int isfull;
438
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700439 BUG_ON(i >= 1<<tn->bits);
440
Robert Olsson19baf832005-06-21 12:43:18 -0700441
442 /* update emptyChildren */
443 if (n == NULL && chi != NULL)
444 tn->empty_children++;
445 else if (n != NULL && chi == NULL)
446 tn->empty_children--;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700447
Robert Olsson19baf832005-06-21 12:43:18 -0700448 /* update fullChildren */
Olof Johansson91b9a272005-08-09 20:24:39 -0700449 if (wasfull == -1)
Robert Olsson19baf832005-06-21 12:43:18 -0700450 wasfull = tnode_full(tn, chi);
451
452 isfull = tnode_full(tn, n);
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700453 if (wasfull && !isfull)
Robert Olsson19baf832005-06-21 12:43:18 -0700454 tn->full_children--;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700455 else if (!wasfull && isfull)
Robert Olsson19baf832005-06-21 12:43:18 -0700456 tn->full_children++;
Olof Johansson91b9a272005-08-09 20:24:39 -0700457
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700458 if (n)
Stephen Hemminger06801912007-08-10 15:22:13 -0700459 node_set_parent(n, tn);
Robert Olsson19baf832005-06-21 12:43:18 -0700460
Robert Olsson2373ce12005-08-25 13:01:29 -0700461 rcu_assign_pointer(tn->child[i], n);
Robert Olsson19baf832005-06-21 12:43:18 -0700462}
463
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700464static struct node *resize(struct trie *t, struct tnode *tn)
Robert Olsson19baf832005-06-21 12:43:18 -0700465{
466 int i;
Robert Olsson2f368952005-07-05 15:02:40 -0700467 int err = 0;
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700468 struct tnode *old_tn;
Robert Olssone6308be2005-10-04 13:01:58 -0700469 int inflate_threshold_use;
470 int halve_threshold_use;
Robert Olsson05eee482007-03-19 16:27:37 -0700471 int max_resize;
Robert Olsson19baf832005-06-21 12:43:18 -0700472
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900473 if (!tn)
Robert Olsson19baf832005-06-21 12:43:18 -0700474 return NULL;
475
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700476 pr_debug("In tnode_resize %p inflate_threshold=%d threshold=%d\n",
477 tn, inflate_threshold, halve_threshold);
Robert Olsson19baf832005-06-21 12:43:18 -0700478
479 /* No children */
480 if (tn->empty_children == tnode_child_length(tn)) {
481 tnode_free(tn);
482 return NULL;
483 }
484 /* One child */
485 if (tn->empty_children == tnode_child_length(tn) - 1)
486 for (i = 0; i < tnode_child_length(tn); i++) {
Olof Johansson91b9a272005-08-09 20:24:39 -0700487 struct node *n;
Robert Olsson19baf832005-06-21 12:43:18 -0700488
Olof Johansson91b9a272005-08-09 20:24:39 -0700489 n = tn->child[i];
Robert Olsson2373ce12005-08-25 13:01:29 -0700490 if (!n)
Olof Johansson91b9a272005-08-09 20:24:39 -0700491 continue;
Olof Johansson91b9a272005-08-09 20:24:39 -0700492
493 /* compress one level */
Stephen Hemminger06801912007-08-10 15:22:13 -0700494 node_set_parent(n, NULL);
Olof Johansson91b9a272005-08-09 20:24:39 -0700495 tnode_free(tn);
496 return n;
Robert Olsson19baf832005-06-21 12:43:18 -0700497 }
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700498 /*
Robert Olsson19baf832005-06-21 12:43:18 -0700499 * Double as long as the resulting node has a number of
500 * nonempty nodes that are above the threshold.
501 */
502
503 /*
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700504 * From "Implementing a dynamic compressed trie" by Stefan Nilsson of
505 * the Helsinki University of Technology and Matti Tikkanen of Nokia
Robert Olsson19baf832005-06-21 12:43:18 -0700506 * Telecommunications, page 6:
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700507 * "A node is doubled if the ratio of non-empty children to all
Robert Olsson19baf832005-06-21 12:43:18 -0700508 * children in the *doubled* node is at least 'high'."
509 *
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700510 * 'high' in this instance is the variable 'inflate_threshold'. It
511 * is expressed as a percentage, so we multiply it with
512 * tnode_child_length() and instead of multiplying by 2 (since the
513 * child array will be doubled by inflate()) and multiplying
514 * the left-hand side by 100 (to handle the percentage thing) we
Robert Olsson19baf832005-06-21 12:43:18 -0700515 * multiply the left-hand side by 50.
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700516 *
517 * The left-hand side may look a bit weird: tnode_child_length(tn)
518 * - tn->empty_children is of course the number of non-null children
519 * in the current node. tn->full_children is the number of "full"
Robert Olsson19baf832005-06-21 12:43:18 -0700520 * children, that is non-null tnodes with a skip value of 0.
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700521 * All of those will be doubled in the resulting inflated tnode, so
Robert Olsson19baf832005-06-21 12:43:18 -0700522 * we just count them one extra time here.
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700523 *
Robert Olsson19baf832005-06-21 12:43:18 -0700524 * A clearer way to write this would be:
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700525 *
Robert Olsson19baf832005-06-21 12:43:18 -0700526 * to_be_doubled = tn->full_children;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700527 * not_to_be_doubled = tnode_child_length(tn) - tn->empty_children -
Robert Olsson19baf832005-06-21 12:43:18 -0700528 * tn->full_children;
529 *
530 * new_child_length = tnode_child_length(tn) * 2;
531 *
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700532 * new_fill_factor = 100 * (not_to_be_doubled + 2*to_be_doubled) /
Robert Olsson19baf832005-06-21 12:43:18 -0700533 * new_child_length;
534 * if (new_fill_factor >= inflate_threshold)
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700535 *
536 * ...and so on, tho it would mess up the while () loop.
537 *
Robert Olsson19baf832005-06-21 12:43:18 -0700538 * anyway,
539 * 100 * (not_to_be_doubled + 2*to_be_doubled) / new_child_length >=
540 * inflate_threshold
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700541 *
Robert Olsson19baf832005-06-21 12:43:18 -0700542 * avoid a division:
543 * 100 * (not_to_be_doubled + 2*to_be_doubled) >=
544 * inflate_threshold * new_child_length
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700545 *
Robert Olsson19baf832005-06-21 12:43:18 -0700546 * expand not_to_be_doubled and to_be_doubled, and shorten:
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700547 * 100 * (tnode_child_length(tn) - tn->empty_children +
Olof Johansson91b9a272005-08-09 20:24:39 -0700548 * tn->full_children) >= inflate_threshold * new_child_length
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700549 *
Robert Olsson19baf832005-06-21 12:43:18 -0700550 * expand new_child_length:
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700551 * 100 * (tnode_child_length(tn) - tn->empty_children +
Olof Johansson91b9a272005-08-09 20:24:39 -0700552 * tn->full_children) >=
Robert Olsson19baf832005-06-21 12:43:18 -0700553 * inflate_threshold * tnode_child_length(tn) * 2
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700554 *
Robert Olsson19baf832005-06-21 12:43:18 -0700555 * shorten again:
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700556 * 50 * (tn->full_children + tnode_child_length(tn) -
Olof Johansson91b9a272005-08-09 20:24:39 -0700557 * tn->empty_children) >= inflate_threshold *
Robert Olsson19baf832005-06-21 12:43:18 -0700558 * tnode_child_length(tn)
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700559 *
Robert Olsson19baf832005-06-21 12:43:18 -0700560 */
561
562 check_tnode(tn);
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700563
Robert Olssone6308be2005-10-04 13:01:58 -0700564 /* Keep root node larger */
565
Stephen Hemminger132adf52007-03-08 20:44:43 -0800566 if (!tn->parent)
Robert Olssone6308be2005-10-04 13:01:58 -0700567 inflate_threshold_use = inflate_threshold_root;
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900568 else
Robert Olssone6308be2005-10-04 13:01:58 -0700569 inflate_threshold_use = inflate_threshold;
570
Robert Olsson2f368952005-07-05 15:02:40 -0700571 err = 0;
Robert Olsson05eee482007-03-19 16:27:37 -0700572 max_resize = 10;
573 while ((tn->full_children > 0 && max_resize-- &&
Robert Olsson19baf832005-06-21 12:43:18 -0700574 50 * (tn->full_children + tnode_child_length(tn) - tn->empty_children) >=
Robert Olssone6308be2005-10-04 13:01:58 -0700575 inflate_threshold_use * tnode_child_length(tn))) {
Robert Olsson19baf832005-06-21 12:43:18 -0700576
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700577 old_tn = tn;
578 tn = inflate(t, tn);
579 if (IS_ERR(tn)) {
580 tn = old_tn;
Robert Olsson2f368952005-07-05 15:02:40 -0700581#ifdef CONFIG_IP_FIB_TRIE_STATS
582 t->stats.resize_node_skipped++;
583#endif
584 break;
585 }
Robert Olsson19baf832005-06-21 12:43:18 -0700586 }
587
Robert Olsson05eee482007-03-19 16:27:37 -0700588 if (max_resize < 0) {
589 if (!tn->parent)
590 printk(KERN_WARNING "Fix inflate_threshold_root. Now=%d size=%d bits\n",
591 inflate_threshold_root, tn->bits);
592 else
593 printk(KERN_WARNING "Fix inflate_threshold. Now=%d size=%d bits\n",
594 inflate_threshold, tn->bits);
595 }
596
Robert Olsson19baf832005-06-21 12:43:18 -0700597 check_tnode(tn);
598
599 /*
600 * Halve as long as the number of empty children in this
601 * node is above threshold.
602 */
Robert Olsson2f368952005-07-05 15:02:40 -0700603
Robert Olssone6308be2005-10-04 13:01:58 -0700604
605 /* Keep root node larger */
606
Stephen Hemminger132adf52007-03-08 20:44:43 -0800607 if (!tn->parent)
Robert Olssone6308be2005-10-04 13:01:58 -0700608 halve_threshold_use = halve_threshold_root;
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900609 else
Robert Olssone6308be2005-10-04 13:01:58 -0700610 halve_threshold_use = halve_threshold;
611
Robert Olsson2f368952005-07-05 15:02:40 -0700612 err = 0;
Robert Olsson05eee482007-03-19 16:27:37 -0700613 max_resize = 10;
614 while (tn->bits > 1 && max_resize-- &&
Robert Olsson19baf832005-06-21 12:43:18 -0700615 100 * (tnode_child_length(tn) - tn->empty_children) <
Robert Olssone6308be2005-10-04 13:01:58 -0700616 halve_threshold_use * tnode_child_length(tn)) {
Robert Olsson19baf832005-06-21 12:43:18 -0700617
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700618 old_tn = tn;
619 tn = halve(t, tn);
620 if (IS_ERR(tn)) {
621 tn = old_tn;
Robert Olsson2f368952005-07-05 15:02:40 -0700622#ifdef CONFIG_IP_FIB_TRIE_STATS
623 t->stats.resize_node_skipped++;
624#endif
625 break;
626 }
627 }
628
Robert Olsson05eee482007-03-19 16:27:37 -0700629 if (max_resize < 0) {
630 if (!tn->parent)
631 printk(KERN_WARNING "Fix halve_threshold_root. Now=%d size=%d bits\n",
632 halve_threshold_root, tn->bits);
633 else
634 printk(KERN_WARNING "Fix halve_threshold. Now=%d size=%d bits\n",
635 halve_threshold, tn->bits);
636 }
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700637
Robert Olsson19baf832005-06-21 12:43:18 -0700638 /* Only one child remains */
Robert Olsson19baf832005-06-21 12:43:18 -0700639 if (tn->empty_children == tnode_child_length(tn) - 1)
640 for (i = 0; i < tnode_child_length(tn); i++) {
Olof Johansson91b9a272005-08-09 20:24:39 -0700641 struct node *n;
642
Olof Johansson91b9a272005-08-09 20:24:39 -0700643 n = tn->child[i];
Robert Olsson2373ce12005-08-25 13:01:29 -0700644 if (!n)
Olof Johansson91b9a272005-08-09 20:24:39 -0700645 continue;
Olof Johansson91b9a272005-08-09 20:24:39 -0700646
647 /* compress one level */
648
Stephen Hemminger06801912007-08-10 15:22:13 -0700649 node_set_parent(n, NULL);
Olof Johansson91b9a272005-08-09 20:24:39 -0700650 tnode_free(tn);
651 return n;
Robert Olsson19baf832005-06-21 12:43:18 -0700652 }
653
654 return (struct node *) tn;
655}
656
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700657static struct tnode *inflate(struct trie *t, struct tnode *tn)
Robert Olsson19baf832005-06-21 12:43:18 -0700658{
659 struct tnode *inode;
660 struct tnode *oldtnode = tn;
661 int olen = tnode_child_length(tn);
662 int i;
663
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700664 pr_debug("In inflate\n");
Robert Olsson19baf832005-06-21 12:43:18 -0700665
666 tn = tnode_new(oldtnode->key, oldtnode->pos, oldtnode->bits + 1);
667
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700668 if (!tn)
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700669 return ERR_PTR(-ENOMEM);
Robert Olsson2f368952005-07-05 15:02:40 -0700670
671 /*
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700672 * Preallocate and store tnodes before the actual work so we
673 * don't get into an inconsistent state if memory allocation
674 * fails. In case of failure we return the oldnode and inflate
Robert Olsson2f368952005-07-05 15:02:40 -0700675 * of tnode is ignored.
676 */
Olof Johansson91b9a272005-08-09 20:24:39 -0700677
678 for (i = 0; i < olen; i++) {
Robert Olsson2f368952005-07-05 15:02:40 -0700679 struct tnode *inode = (struct tnode *) tnode_get_child(oldtnode, i);
680
681 if (inode &&
682 IS_TNODE(inode) &&
683 inode->pos == oldtnode->pos + oldtnode->bits &&
684 inode->bits > 1) {
685 struct tnode *left, *right;
Stephen Hemmingerab66b4a2007-08-10 15:22:58 -0700686 t_key m = ~0U << (KEYLENGTH - 1) >> inode->pos;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700687
Robert Olsson2f368952005-07-05 15:02:40 -0700688 left = tnode_new(inode->key&(~m), inode->pos + 1,
689 inode->bits - 1);
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700690 if (!left)
691 goto nomem;
Olof Johansson91b9a272005-08-09 20:24:39 -0700692
Robert Olsson2f368952005-07-05 15:02:40 -0700693 right = tnode_new(inode->key|m, inode->pos + 1,
694 inode->bits - 1);
695
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900696 if (!right) {
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700697 tnode_free(left);
698 goto nomem;
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900699 }
Robert Olsson2f368952005-07-05 15:02:40 -0700700
701 put_child(t, tn, 2*i, (struct node *) left);
702 put_child(t, tn, 2*i+1, (struct node *) right);
703 }
704 }
705
Olof Johansson91b9a272005-08-09 20:24:39 -0700706 for (i = 0; i < olen; i++) {
Robert Olsson19baf832005-06-21 12:43:18 -0700707 struct node *node = tnode_get_child(oldtnode, i);
Olof Johansson91b9a272005-08-09 20:24:39 -0700708 struct tnode *left, *right;
709 int size, j;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700710
Robert Olsson19baf832005-06-21 12:43:18 -0700711 /* An empty child */
712 if (node == NULL)
713 continue;
714
715 /* A leaf or an internal node with skipped bits */
716
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700717 if (IS_LEAF(node) || ((struct tnode *) node)->pos >
Robert Olsson19baf832005-06-21 12:43:18 -0700718 tn->pos + tn->bits - 1) {
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700719 if (tkey_extract_bits(node->key, oldtnode->pos + oldtnode->bits,
Robert Olsson19baf832005-06-21 12:43:18 -0700720 1) == 0)
721 put_child(t, tn, 2*i, node);
722 else
723 put_child(t, tn, 2*i+1, node);
724 continue;
725 }
726
727 /* An internal node with two children */
728 inode = (struct tnode *) node;
729
730 if (inode->bits == 1) {
731 put_child(t, tn, 2*i, inode->child[0]);
732 put_child(t, tn, 2*i+1, inode->child[1]);
733
734 tnode_free(inode);
Olof Johansson91b9a272005-08-09 20:24:39 -0700735 continue;
Robert Olsson19baf832005-06-21 12:43:18 -0700736 }
737
Olof Johansson91b9a272005-08-09 20:24:39 -0700738 /* An internal node with more than two children */
Robert Olsson19baf832005-06-21 12:43:18 -0700739
Olof Johansson91b9a272005-08-09 20:24:39 -0700740 /* We will replace this node 'inode' with two new
741 * ones, 'left' and 'right', each with half of the
742 * original children. The two new nodes will have
743 * a position one bit further down the key and this
744 * means that the "significant" part of their keys
745 * (see the discussion near the top of this file)
746 * will differ by one bit, which will be "0" in
747 * left's key and "1" in right's key. Since we are
748 * moving the key position by one step, the bit that
749 * we are moving away from - the bit at position
750 * (inode->pos) - is the one that will differ between
751 * left and right. So... we synthesize that bit in the
752 * two new keys.
753 * The mask 'm' below will be a single "one" bit at
754 * the position (inode->pos)
755 */
Robert Olsson19baf832005-06-21 12:43:18 -0700756
Olof Johansson91b9a272005-08-09 20:24:39 -0700757 /* Use the old key, but set the new significant
758 * bit to zero.
759 */
Robert Olsson19baf832005-06-21 12:43:18 -0700760
Olof Johansson91b9a272005-08-09 20:24:39 -0700761 left = (struct tnode *) tnode_get_child(tn, 2*i);
762 put_child(t, tn, 2*i, NULL);
Robert Olsson19baf832005-06-21 12:43:18 -0700763
Olof Johansson91b9a272005-08-09 20:24:39 -0700764 BUG_ON(!left);
Robert Olsson2f368952005-07-05 15:02:40 -0700765
Olof Johansson91b9a272005-08-09 20:24:39 -0700766 right = (struct tnode *) tnode_get_child(tn, 2*i+1);
767 put_child(t, tn, 2*i+1, NULL);
Robert Olsson2f368952005-07-05 15:02:40 -0700768
Olof Johansson91b9a272005-08-09 20:24:39 -0700769 BUG_ON(!right);
Robert Olsson2f368952005-07-05 15:02:40 -0700770
Olof Johansson91b9a272005-08-09 20:24:39 -0700771 size = tnode_child_length(left);
772 for (j = 0; j < size; j++) {
773 put_child(t, left, j, inode->child[j]);
774 put_child(t, right, j, inode->child[j + size]);
Robert Olsson19baf832005-06-21 12:43:18 -0700775 }
Olof Johansson91b9a272005-08-09 20:24:39 -0700776 put_child(t, tn, 2*i, resize(t, left));
777 put_child(t, tn, 2*i+1, resize(t, right));
778
779 tnode_free(inode);
Robert Olsson19baf832005-06-21 12:43:18 -0700780 }
781 tnode_free(oldtnode);
782 return tn;
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700783nomem:
784 {
785 int size = tnode_child_length(tn);
786 int j;
787
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700788 for (j = 0; j < size; j++)
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700789 if (tn->child[j])
790 tnode_free((struct tnode *)tn->child[j]);
791
792 tnode_free(tn);
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700793
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700794 return ERR_PTR(-ENOMEM);
795 }
Robert Olsson19baf832005-06-21 12:43:18 -0700796}
797
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700798static struct tnode *halve(struct trie *t, struct tnode *tn)
Robert Olsson19baf832005-06-21 12:43:18 -0700799{
800 struct tnode *oldtnode = tn;
801 struct node *left, *right;
802 int i;
803 int olen = tnode_child_length(tn);
804
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700805 pr_debug("In halve\n");
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700806
807 tn = tnode_new(oldtnode->key, oldtnode->pos, oldtnode->bits - 1);
Robert Olsson19baf832005-06-21 12:43:18 -0700808
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700809 if (!tn)
810 return ERR_PTR(-ENOMEM);
Robert Olsson2f368952005-07-05 15:02:40 -0700811
812 /*
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700813 * Preallocate and store tnodes before the actual work so we
814 * don't get into an inconsistent state if memory allocation
815 * fails. In case of failure we return the oldnode and halve
Robert Olsson2f368952005-07-05 15:02:40 -0700816 * of tnode is ignored.
817 */
818
Olof Johansson91b9a272005-08-09 20:24:39 -0700819 for (i = 0; i < olen; i += 2) {
Robert Olsson2f368952005-07-05 15:02:40 -0700820 left = tnode_get_child(oldtnode, i);
821 right = tnode_get_child(oldtnode, i+1);
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700822
Robert Olsson2f368952005-07-05 15:02:40 -0700823 /* Two nonempty children */
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700824 if (left && right) {
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700825 struct tnode *newn;
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700826
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700827 newn = tnode_new(left->key, tn->pos + tn->bits, 1);
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700828
829 if (!newn)
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700830 goto nomem;
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700831
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700832 put_child(t, tn, i/2, (struct node *)newn);
Robert Olsson2f368952005-07-05 15:02:40 -0700833 }
Robert Olsson2f368952005-07-05 15:02:40 -0700834
Robert Olsson2f368952005-07-05 15:02:40 -0700835 }
Robert Olsson19baf832005-06-21 12:43:18 -0700836
Olof Johansson91b9a272005-08-09 20:24:39 -0700837 for (i = 0; i < olen; i += 2) {
838 struct tnode *newBinNode;
839
Robert Olsson19baf832005-06-21 12:43:18 -0700840 left = tnode_get_child(oldtnode, i);
841 right = tnode_get_child(oldtnode, i+1);
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700842
Robert Olsson19baf832005-06-21 12:43:18 -0700843 /* At least one of the children is empty */
844 if (left == NULL) {
845 if (right == NULL) /* Both are empty */
846 continue;
847 put_child(t, tn, i/2, right);
Olof Johansson91b9a272005-08-09 20:24:39 -0700848 continue;
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700849 }
Olof Johansson91b9a272005-08-09 20:24:39 -0700850
851 if (right == NULL) {
Robert Olsson19baf832005-06-21 12:43:18 -0700852 put_child(t, tn, i/2, left);
Olof Johansson91b9a272005-08-09 20:24:39 -0700853 continue;
854 }
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700855
Robert Olsson19baf832005-06-21 12:43:18 -0700856 /* Two nonempty children */
Olof Johansson91b9a272005-08-09 20:24:39 -0700857 newBinNode = (struct tnode *) tnode_get_child(tn, i/2);
858 put_child(t, tn, i/2, NULL);
Olof Johansson91b9a272005-08-09 20:24:39 -0700859 put_child(t, newBinNode, 0, left);
860 put_child(t, newBinNode, 1, right);
861 put_child(t, tn, i/2, resize(t, newBinNode));
Robert Olsson19baf832005-06-21 12:43:18 -0700862 }
863 tnode_free(oldtnode);
864 return tn;
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700865nomem:
866 {
867 int size = tnode_child_length(tn);
868 int j;
869
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700870 for (j = 0; j < size; j++)
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700871 if (tn->child[j])
872 tnode_free((struct tnode *)tn->child[j]);
873
874 tnode_free(tn);
Stephen Hemminger0c7770c2005-08-23 21:59:41 -0700875
Robert Olsson2f80b3c2005-08-09 20:25:06 -0700876 return ERR_PTR(-ENOMEM);
877 }
Robert Olsson19baf832005-06-21 12:43:18 -0700878}
879
Olof Johansson91b9a272005-08-09 20:24:39 -0700880static void trie_init(struct trie *t)
Robert Olsson19baf832005-06-21 12:43:18 -0700881{
Olof Johansson91b9a272005-08-09 20:24:39 -0700882 if (!t)
883 return;
884
885 t->size = 0;
Robert Olsson2373ce12005-08-25 13:01:29 -0700886 rcu_assign_pointer(t->trie, NULL);
Olof Johansson91b9a272005-08-09 20:24:39 -0700887 t->revision = 0;
Robert Olsson19baf832005-06-21 12:43:18 -0700888#ifdef CONFIG_IP_FIB_TRIE_STATS
Olof Johansson91b9a272005-08-09 20:24:39 -0700889 memset(&t->stats, 0, sizeof(struct trie_use_stats));
Robert Olsson19baf832005-06-21 12:43:18 -0700890#endif
Robert Olsson19baf832005-06-21 12:43:18 -0700891}
892
Robert Olsson772cb712005-09-19 15:31:18 -0700893/* readside must use rcu_read_lock currently dump routines
Robert Olsson2373ce12005-08-25 13:01:29 -0700894 via get_fa_head and dump */
895
Robert Olsson772cb712005-09-19 15:31:18 -0700896static struct leaf_info *find_leaf_info(struct leaf *l, int plen)
Robert Olsson19baf832005-06-21 12:43:18 -0700897{
Robert Olsson772cb712005-09-19 15:31:18 -0700898 struct hlist_head *head = &l->list;
Robert Olsson19baf832005-06-21 12:43:18 -0700899 struct hlist_node *node;
900 struct leaf_info *li;
901
Robert Olsson2373ce12005-08-25 13:01:29 -0700902 hlist_for_each_entry_rcu(li, node, head, hlist)
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700903 if (li->plen == plen)
Robert Olsson19baf832005-06-21 12:43:18 -0700904 return li;
Olof Johansson91b9a272005-08-09 20:24:39 -0700905
Robert Olsson19baf832005-06-21 12:43:18 -0700906 return NULL;
907}
908
909static inline struct list_head * get_fa_head(struct leaf *l, int plen)
910{
Robert Olsson772cb712005-09-19 15:31:18 -0700911 struct leaf_info *li = find_leaf_info(l, plen);
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700912
Olof Johansson91b9a272005-08-09 20:24:39 -0700913 if (!li)
914 return NULL;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700915
Olof Johansson91b9a272005-08-09 20:24:39 -0700916 return &li->falh;
Robert Olsson19baf832005-06-21 12:43:18 -0700917}
918
919static void insert_leaf_info(struct hlist_head *head, struct leaf_info *new)
920{
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900921 struct leaf_info *li = NULL, *last = NULL;
922 struct hlist_node *node;
Robert Olsson19baf832005-06-21 12:43:18 -0700923
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900924 if (hlist_empty(head)) {
925 hlist_add_head_rcu(&new->hlist, head);
926 } else {
927 hlist_for_each_entry(li, node, head, hlist) {
928 if (new->plen > li->plen)
929 break;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700930
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900931 last = li;
932 }
933 if (last)
934 hlist_add_after_rcu(&last->hlist, &new->hlist);
935 else
936 hlist_add_before_rcu(&new->hlist, &li->hlist);
937 }
Robert Olsson19baf832005-06-21 12:43:18 -0700938}
939
Robert Olsson2373ce12005-08-25 13:01:29 -0700940/* rcu_read_lock needs to be hold by caller from readside */
941
Robert Olsson19baf832005-06-21 12:43:18 -0700942static struct leaf *
943fib_find_node(struct trie *t, u32 key)
944{
945 int pos;
946 struct tnode *tn;
947 struct node *n;
948
949 pos = 0;
Robert Olsson2373ce12005-08-25 13:01:29 -0700950 n = rcu_dereference(t->trie);
Robert Olsson19baf832005-06-21 12:43:18 -0700951
952 while (n != NULL && NODE_TYPE(n) == T_TNODE) {
953 tn = (struct tnode *) n;
Olof Johansson91b9a272005-08-09 20:24:39 -0700954
Robert Olsson19baf832005-06-21 12:43:18 -0700955 check_tnode(tn);
Olof Johansson91b9a272005-08-09 20:24:39 -0700956
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700957 if (tkey_sub_equals(tn->key, pos, tn->pos-pos, key)) {
Olof Johansson91b9a272005-08-09 20:24:39 -0700958 pos = tn->pos + tn->bits;
Robert Olsson19baf832005-06-21 12:43:18 -0700959 n = tnode_get_child(tn, tkey_extract_bits(key, tn->pos, tn->bits));
Olof Johansson91b9a272005-08-09 20:24:39 -0700960 } else
Robert Olsson19baf832005-06-21 12:43:18 -0700961 break;
962 }
963 /* Case we have found a leaf. Compare prefixes */
964
Olof Johansson91b9a272005-08-09 20:24:39 -0700965 if (n != NULL && IS_LEAF(n) && tkey_equals(key, n->key))
966 return (struct leaf *)n;
967
Robert Olsson19baf832005-06-21 12:43:18 -0700968 return NULL;
969}
970
971static struct node *trie_rebalance(struct trie *t, struct tnode *tn)
972{
Robert Olsson19baf832005-06-21 12:43:18 -0700973 int wasfull;
Stephen Hemminger06801912007-08-10 15:22:13 -0700974 t_key cindex, key = tn->key;
975 struct tnode *tp;
Robert Olsson19baf832005-06-21 12:43:18 -0700976
Stephen Hemminger06801912007-08-10 15:22:13 -0700977 while (tn != NULL && (tp = node_parent((struct node *)tn)) != NULL) {
Robert Olsson19baf832005-06-21 12:43:18 -0700978 cindex = tkey_extract_bits(key, tp->pos, tp->bits);
979 wasfull = tnode_full(tp, tnode_get_child(tp, cindex));
980 tn = (struct tnode *) resize (t, (struct tnode *)tn);
981 tnode_put_child_reorg((struct tnode *)tp, cindex,(struct node*)tn, wasfull);
Olof Johansson91b9a272005-08-09 20:24:39 -0700982
Stephen Hemminger06801912007-08-10 15:22:13 -0700983 tp = node_parent((struct node *) tn);
984 if (!tp)
Robert Olsson19baf832005-06-21 12:43:18 -0700985 break;
Stephen Hemminger06801912007-08-10 15:22:13 -0700986 tn = tp;
Robert Olsson19baf832005-06-21 12:43:18 -0700987 }
Stephen Hemminger06801912007-08-10 15:22:13 -0700988
Robert Olsson19baf832005-06-21 12:43:18 -0700989 /* Handle last (top) tnode */
Stephen Hemmingerc877efb2005-07-19 14:01:51 -0700990 if (IS_TNODE(tn))
Robert Olsson19baf832005-06-21 12:43:18 -0700991 tn = (struct tnode*) resize(t, (struct tnode *)tn);
992
993 return (struct node*) tn;
994}
995
Robert Olsson2373ce12005-08-25 13:01:29 -0700996/* only used from updater-side */
997
Robert Olssonf835e472005-06-28 15:00:39 -0700998static struct list_head *
999fib_insert_node(struct trie *t, int *err, u32 key, int plen)
Robert Olsson19baf832005-06-21 12:43:18 -07001000{
1001 int pos, newpos;
1002 struct tnode *tp = NULL, *tn = NULL;
1003 struct node *n;
1004 struct leaf *l;
1005 int missbit;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001006 struct list_head *fa_head = NULL;
Robert Olsson19baf832005-06-21 12:43:18 -07001007 struct leaf_info *li;
1008 t_key cindex;
1009
1010 pos = 0;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001011 n = t->trie;
Robert Olsson19baf832005-06-21 12:43:18 -07001012
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001013 /* If we point to NULL, stop. Either the tree is empty and we should
1014 * just put a new leaf in if, or we have reached an empty child slot,
Robert Olsson19baf832005-06-21 12:43:18 -07001015 * and we should just put our new leaf in that.
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001016 * If we point to a T_TNODE, check if it matches our key. Note that
1017 * a T_TNODE might be skipping any number of bits - its 'pos' need
Robert Olsson19baf832005-06-21 12:43:18 -07001018 * not be the parent's 'pos'+'bits'!
1019 *
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001020 * If it does match the current key, get pos/bits from it, extract
Robert Olsson19baf832005-06-21 12:43:18 -07001021 * the index from our key, push the T_TNODE and walk the tree.
1022 *
1023 * If it doesn't, we have to replace it with a new T_TNODE.
1024 *
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001025 * If we point to a T_LEAF, it might or might not have the same key
1026 * as we do. If it does, just change the value, update the T_LEAF's
1027 * value, and return it.
Robert Olsson19baf832005-06-21 12:43:18 -07001028 * If it doesn't, we need to replace it with a T_TNODE.
1029 */
1030
1031 while (n != NULL && NODE_TYPE(n) == T_TNODE) {
1032 tn = (struct tnode *) n;
Olof Johansson91b9a272005-08-09 20:24:39 -07001033
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001034 check_tnode(tn);
Olof Johansson91b9a272005-08-09 20:24:39 -07001035
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001036 if (tkey_sub_equals(tn->key, pos, tn->pos-pos, key)) {
Robert Olsson19baf832005-06-21 12:43:18 -07001037 tp = tn;
Olof Johansson91b9a272005-08-09 20:24:39 -07001038 pos = tn->pos + tn->bits;
Robert Olsson19baf832005-06-21 12:43:18 -07001039 n = tnode_get_child(tn, tkey_extract_bits(key, tn->pos, tn->bits));
1040
Stephen Hemminger06801912007-08-10 15:22:13 -07001041 BUG_ON(n && node_parent(n) != tn);
Olof Johansson91b9a272005-08-09 20:24:39 -07001042 } else
Robert Olsson19baf832005-06-21 12:43:18 -07001043 break;
1044 }
1045
1046 /*
1047 * n ----> NULL, LEAF or TNODE
1048 *
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001049 * tp is n's (parent) ----> NULL or TNODE
Robert Olsson19baf832005-06-21 12:43:18 -07001050 */
1051
Olof Johansson91b9a272005-08-09 20:24:39 -07001052 BUG_ON(tp && IS_LEAF(tp));
Robert Olsson19baf832005-06-21 12:43:18 -07001053
1054 /* Case 1: n is a leaf. Compare prefixes */
1055
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001056 if (n != NULL && IS_LEAF(n) && tkey_equals(key, n->key)) {
Olof Johansson91b9a272005-08-09 20:24:39 -07001057 struct leaf *l = (struct leaf *) n;
1058
Robert Olsson19baf832005-06-21 12:43:18 -07001059 li = leaf_info_new(plen);
Olof Johansson91b9a272005-08-09 20:24:39 -07001060
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001061 if (!li) {
Robert Olssonf835e472005-06-28 15:00:39 -07001062 *err = -ENOMEM;
1063 goto err;
1064 }
Robert Olsson19baf832005-06-21 12:43:18 -07001065
1066 fa_head = &li->falh;
1067 insert_leaf_info(&l->list, li);
1068 goto done;
1069 }
1070 t->size++;
1071 l = leaf_new();
1072
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001073 if (!l) {
Robert Olssonf835e472005-06-28 15:00:39 -07001074 *err = -ENOMEM;
1075 goto err;
1076 }
Robert Olsson19baf832005-06-21 12:43:18 -07001077
1078 l->key = key;
1079 li = leaf_info_new(plen);
1080
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001081 if (!li) {
Robert Olssonf835e472005-06-28 15:00:39 -07001082 tnode_free((struct tnode *) l);
1083 *err = -ENOMEM;
1084 goto err;
1085 }
Robert Olsson19baf832005-06-21 12:43:18 -07001086
1087 fa_head = &li->falh;
1088 insert_leaf_info(&l->list, li);
1089
Robert Olsson19baf832005-06-21 12:43:18 -07001090 if (t->trie && n == NULL) {
Olof Johansson91b9a272005-08-09 20:24:39 -07001091 /* Case 2: n is NULL, and will just insert a new leaf */
Robert Olsson19baf832005-06-21 12:43:18 -07001092
Stephen Hemminger06801912007-08-10 15:22:13 -07001093 node_set_parent((struct node *)l, tp);
Robert Olsson19baf832005-06-21 12:43:18 -07001094
Olof Johansson91b9a272005-08-09 20:24:39 -07001095 cindex = tkey_extract_bits(key, tp->pos, tp->bits);
1096 put_child(t, (struct tnode *)tp, cindex, (struct node *)l);
1097 } else {
1098 /* Case 3: n is a LEAF or a TNODE and the key doesn't match. */
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001099 /*
1100 * Add a new tnode here
Robert Olsson19baf832005-06-21 12:43:18 -07001101 * first tnode need some special handling
1102 */
1103
1104 if (tp)
Olof Johansson91b9a272005-08-09 20:24:39 -07001105 pos = tp->pos+tp->bits;
Robert Olsson19baf832005-06-21 12:43:18 -07001106 else
Olof Johansson91b9a272005-08-09 20:24:39 -07001107 pos = 0;
1108
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001109 if (n) {
Robert Olsson19baf832005-06-21 12:43:18 -07001110 newpos = tkey_mismatch(key, pos, n->key);
1111 tn = tnode_new(n->key, newpos, 1);
Olof Johansson91b9a272005-08-09 20:24:39 -07001112 } else {
Robert Olsson19baf832005-06-21 12:43:18 -07001113 newpos = 0;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001114 tn = tnode_new(key, newpos, 1); /* First tnode */
Robert Olsson19baf832005-06-21 12:43:18 -07001115 }
Robert Olsson19baf832005-06-21 12:43:18 -07001116
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001117 if (!tn) {
Robert Olssonf835e472005-06-28 15:00:39 -07001118 free_leaf_info(li);
1119 tnode_free((struct tnode *) l);
1120 *err = -ENOMEM;
1121 goto err;
Olof Johansson91b9a272005-08-09 20:24:39 -07001122 }
1123
Stephen Hemminger06801912007-08-10 15:22:13 -07001124 node_set_parent((struct node *)tn, tp);
Robert Olsson19baf832005-06-21 12:43:18 -07001125
Olof Johansson91b9a272005-08-09 20:24:39 -07001126 missbit = tkey_extract_bits(key, newpos, 1);
Robert Olsson19baf832005-06-21 12:43:18 -07001127 put_child(t, tn, missbit, (struct node *)l);
1128 put_child(t, tn, 1-missbit, n);
1129
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001130 if (tp) {
Robert Olsson19baf832005-06-21 12:43:18 -07001131 cindex = tkey_extract_bits(key, tp->pos, tp->bits);
1132 put_child(t, (struct tnode *)tp, cindex, (struct node *)tn);
Olof Johansson91b9a272005-08-09 20:24:39 -07001133 } else {
Robert Olsson2373ce12005-08-25 13:01:29 -07001134 rcu_assign_pointer(t->trie, (struct node *)tn); /* First tnode */
Robert Olsson19baf832005-06-21 12:43:18 -07001135 tp = tn;
1136 }
1137 }
Olof Johansson91b9a272005-08-09 20:24:39 -07001138
1139 if (tp && tp->pos + tp->bits > 32)
Stephen Hemminger78c66712005-09-21 00:15:39 -07001140 printk(KERN_WARNING "fib_trie tp=%p pos=%d, bits=%d, key=%0x plen=%d\n",
Robert Olsson19baf832005-06-21 12:43:18 -07001141 tp, tp->pos, tp->bits, key, plen);
Olof Johansson91b9a272005-08-09 20:24:39 -07001142
Robert Olsson19baf832005-06-21 12:43:18 -07001143 /* Rebalance the trie */
Robert Olsson2373ce12005-08-25 13:01:29 -07001144
1145 rcu_assign_pointer(t->trie, trie_rebalance(t, tp));
Robert Olssonf835e472005-06-28 15:00:39 -07001146done:
1147 t->revision++;
Olof Johansson91b9a272005-08-09 20:24:39 -07001148err:
Robert Olsson19baf832005-06-21 12:43:18 -07001149 return fa_head;
1150}
1151
Robert Olssond562f1f2007-03-26 14:22:22 -07001152/*
1153 * Caller must hold RTNL.
1154 */
Thomas Graf4e902c52006-08-17 18:14:52 -07001155static int fn_trie_insert(struct fib_table *tb, struct fib_config *cfg)
Robert Olsson19baf832005-06-21 12:43:18 -07001156{
1157 struct trie *t = (struct trie *) tb->tb_data;
1158 struct fib_alias *fa, *new_fa;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001159 struct list_head *fa_head = NULL;
Robert Olsson19baf832005-06-21 12:43:18 -07001160 struct fib_info *fi;
Thomas Graf4e902c52006-08-17 18:14:52 -07001161 int plen = cfg->fc_dst_len;
1162 u8 tos = cfg->fc_tos;
Robert Olsson19baf832005-06-21 12:43:18 -07001163 u32 key, mask;
1164 int err;
1165 struct leaf *l;
1166
1167 if (plen > 32)
1168 return -EINVAL;
1169
Thomas Graf4e902c52006-08-17 18:14:52 -07001170 key = ntohl(cfg->fc_dst);
Robert Olsson19baf832005-06-21 12:43:18 -07001171
Patrick McHardy2dfe55b2006-08-10 23:08:33 -07001172 pr_debug("Insert table=%u %08x/%d\n", tb->tb_id, key, plen);
Robert Olsson19baf832005-06-21 12:43:18 -07001173
Olof Johansson91b9a272005-08-09 20:24:39 -07001174 mask = ntohl(inet_make_mask(plen));
Robert Olsson19baf832005-06-21 12:43:18 -07001175
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001176 if (key & ~mask)
Robert Olsson19baf832005-06-21 12:43:18 -07001177 return -EINVAL;
1178
1179 key = key & mask;
1180
Thomas Graf4e902c52006-08-17 18:14:52 -07001181 fi = fib_create_info(cfg);
1182 if (IS_ERR(fi)) {
1183 err = PTR_ERR(fi);
Robert Olsson19baf832005-06-21 12:43:18 -07001184 goto err;
Thomas Graf4e902c52006-08-17 18:14:52 -07001185 }
Robert Olsson19baf832005-06-21 12:43:18 -07001186
1187 l = fib_find_node(t, key);
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001188 fa = NULL;
Robert Olsson19baf832005-06-21 12:43:18 -07001189
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001190 if (l) {
Robert Olsson19baf832005-06-21 12:43:18 -07001191 fa_head = get_fa_head(l, plen);
1192 fa = fib_find_alias(fa_head, tos, fi->fib_priority);
1193 }
1194
1195 /* Now fa, if non-NULL, points to the first fib alias
1196 * with the same keys [prefix,tos,priority], if such key already
1197 * exists or to the node before which we will insert new one.
1198 *
1199 * If fa is NULL, we will need to allocate a new one and
1200 * insert to the head of f.
1201 *
1202 * If f is NULL, no fib node matched the destination key
1203 * and we need to allocate a new one of those as well.
1204 */
1205
Olof Johansson91b9a272005-08-09 20:24:39 -07001206 if (fa && fa->fa_info->fib_priority == fi->fib_priority) {
Robert Olsson19baf832005-06-21 12:43:18 -07001207 struct fib_alias *fa_orig;
1208
1209 err = -EEXIST;
Thomas Graf4e902c52006-08-17 18:14:52 -07001210 if (cfg->fc_nlflags & NLM_F_EXCL)
Robert Olsson19baf832005-06-21 12:43:18 -07001211 goto out;
1212
Thomas Graf4e902c52006-08-17 18:14:52 -07001213 if (cfg->fc_nlflags & NLM_F_REPLACE) {
Robert Olsson19baf832005-06-21 12:43:18 -07001214 struct fib_info *fi_drop;
1215 u8 state;
1216
Joonwoo Park67250332008-01-18 03:45:18 -08001217 if (fi->fib_treeref > 1)
1218 goto out;
1219
Robert Olsson2373ce12005-08-25 13:01:29 -07001220 err = -ENOBUFS;
Christoph Lametere94b1762006-12-06 20:33:17 -08001221 new_fa = kmem_cache_alloc(fn_alias_kmem, GFP_KERNEL);
Robert Olsson2373ce12005-08-25 13:01:29 -07001222 if (new_fa == NULL)
1223 goto out;
Robert Olsson19baf832005-06-21 12:43:18 -07001224
1225 fi_drop = fa->fa_info;
Robert Olsson2373ce12005-08-25 13:01:29 -07001226 new_fa->fa_tos = fa->fa_tos;
1227 new_fa->fa_info = fi;
Thomas Graf4e902c52006-08-17 18:14:52 -07001228 new_fa->fa_type = cfg->fc_type;
1229 new_fa->fa_scope = cfg->fc_scope;
Robert Olsson19baf832005-06-21 12:43:18 -07001230 state = fa->fa_state;
Robert Olsson2373ce12005-08-25 13:01:29 -07001231 new_fa->fa_state &= ~FA_S_ACCESSED;
Robert Olsson19baf832005-06-21 12:43:18 -07001232
Robert Olsson2373ce12005-08-25 13:01:29 -07001233 list_replace_rcu(&fa->fa_list, &new_fa->fa_list);
1234 alias_free_mem_rcu(fa);
Robert Olsson19baf832005-06-21 12:43:18 -07001235
1236 fib_release_info(fi_drop);
1237 if (state & FA_S_ACCESSED)
Olof Johansson91b9a272005-08-09 20:24:39 -07001238 rt_cache_flush(-1);
Milan Kocianb8f55832007-05-23 14:55:06 -07001239 rtmsg_fib(RTM_NEWROUTE, htonl(key), new_fa, plen,
1240 tb->tb_id, &cfg->fc_nlinfo, NLM_F_REPLACE);
Robert Olsson19baf832005-06-21 12:43:18 -07001241
Olof Johansson91b9a272005-08-09 20:24:39 -07001242 goto succeeded;
Robert Olsson19baf832005-06-21 12:43:18 -07001243 }
1244 /* Error if we find a perfect match which
1245 * uses the same scope, type, and nexthop
1246 * information.
1247 */
1248 fa_orig = fa;
1249 list_for_each_entry(fa, fa_orig->fa_list.prev, fa_list) {
1250 if (fa->fa_tos != tos)
1251 break;
1252 if (fa->fa_info->fib_priority != fi->fib_priority)
1253 break;
Thomas Graf4e902c52006-08-17 18:14:52 -07001254 if (fa->fa_type == cfg->fc_type &&
1255 fa->fa_scope == cfg->fc_scope &&
Robert Olsson19baf832005-06-21 12:43:18 -07001256 fa->fa_info == fi) {
1257 goto out;
1258 }
1259 }
Thomas Graf4e902c52006-08-17 18:14:52 -07001260 if (!(cfg->fc_nlflags & NLM_F_APPEND))
Robert Olsson19baf832005-06-21 12:43:18 -07001261 fa = fa_orig;
1262 }
1263 err = -ENOENT;
Thomas Graf4e902c52006-08-17 18:14:52 -07001264 if (!(cfg->fc_nlflags & NLM_F_CREATE))
Robert Olsson19baf832005-06-21 12:43:18 -07001265 goto out;
1266
1267 err = -ENOBUFS;
Christoph Lametere94b1762006-12-06 20:33:17 -08001268 new_fa = kmem_cache_alloc(fn_alias_kmem, GFP_KERNEL);
Robert Olsson19baf832005-06-21 12:43:18 -07001269 if (new_fa == NULL)
1270 goto out;
1271
1272 new_fa->fa_info = fi;
1273 new_fa->fa_tos = tos;
Thomas Graf4e902c52006-08-17 18:14:52 -07001274 new_fa->fa_type = cfg->fc_type;
1275 new_fa->fa_scope = cfg->fc_scope;
Robert Olsson19baf832005-06-21 12:43:18 -07001276 new_fa->fa_state = 0;
Robert Olsson19baf832005-06-21 12:43:18 -07001277 /*
1278 * Insert new entry to the list.
1279 */
1280
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001281 if (!fa_head) {
Robert Olssonf835e472005-06-28 15:00:39 -07001282 err = 0;
Herbert Xub47b2ec2006-07-12 13:29:56 -07001283 fa_head = fib_insert_node(t, &err, key, plen);
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001284 if (err)
Robert Olssonf835e472005-06-28 15:00:39 -07001285 goto out_free_new_fa;
1286 }
Robert Olsson19baf832005-06-21 12:43:18 -07001287
Robert Olsson2373ce12005-08-25 13:01:29 -07001288 list_add_tail_rcu(&new_fa->fa_list,
1289 (fa ? &fa->fa_list : fa_head));
Robert Olsson19baf832005-06-21 12:43:18 -07001290
1291 rt_cache_flush(-1);
Thomas Graf4e902c52006-08-17 18:14:52 -07001292 rtmsg_fib(RTM_NEWROUTE, htonl(key), new_fa, plen, tb->tb_id,
Milan Kocianb8f55832007-05-23 14:55:06 -07001293 &cfg->fc_nlinfo, 0);
Robert Olsson19baf832005-06-21 12:43:18 -07001294succeeded:
1295 return 0;
Robert Olssonf835e472005-06-28 15:00:39 -07001296
1297out_free_new_fa:
1298 kmem_cache_free(fn_alias_kmem, new_fa);
Robert Olsson19baf832005-06-21 12:43:18 -07001299out:
1300 fib_release_info(fi);
Olof Johansson91b9a272005-08-09 20:24:39 -07001301err:
Robert Olsson19baf832005-06-21 12:43:18 -07001302 return err;
1303}
1304
Robert Olsson2373ce12005-08-25 13:01:29 -07001305
Robert Olsson772cb712005-09-19 15:31:18 -07001306/* should be called with rcu_read_lock */
Stephen Hemminger0c7770c2005-08-23 21:59:41 -07001307static inline int check_leaf(struct trie *t, struct leaf *l,
1308 t_key key, int *plen, const struct flowi *flp,
Patrick McHardy06c74272005-08-23 22:06:09 -07001309 struct fib_result *res)
Robert Olsson19baf832005-06-21 12:43:18 -07001310{
Patrick McHardy06c74272005-08-23 22:06:09 -07001311 int err, i;
Al Viro888454c2006-09-19 13:42:46 -07001312 __be32 mask;
Robert Olsson19baf832005-06-21 12:43:18 -07001313 struct leaf_info *li;
1314 struct hlist_head *hhead = &l->list;
1315 struct hlist_node *node;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001316
Robert Olsson2373ce12005-08-25 13:01:29 -07001317 hlist_for_each_entry_rcu(li, node, hhead, hlist) {
Robert Olsson19baf832005-06-21 12:43:18 -07001318 i = li->plen;
Al Viro888454c2006-09-19 13:42:46 -07001319 mask = inet_make_mask(i);
1320 if (l->key != (key & ntohl(mask)))
Robert Olsson19baf832005-06-21 12:43:18 -07001321 continue;
1322
Al Viro888454c2006-09-19 13:42:46 -07001323 if ((err = fib_semantic_match(&li->falh, flp, res, htonl(l->key), mask, i)) <= 0) {
Robert Olsson19baf832005-06-21 12:43:18 -07001324 *plen = i;
1325#ifdef CONFIG_IP_FIB_TRIE_STATS
1326 t->stats.semantic_match_passed++;
1327#endif
Patrick McHardy06c74272005-08-23 22:06:09 -07001328 return err;
Robert Olsson19baf832005-06-21 12:43:18 -07001329 }
1330#ifdef CONFIG_IP_FIB_TRIE_STATS
1331 t->stats.semantic_match_miss++;
1332#endif
1333 }
Patrick McHardy06c74272005-08-23 22:06:09 -07001334 return 1;
Robert Olsson19baf832005-06-21 12:43:18 -07001335}
1336
1337static int
1338fn_trie_lookup(struct fib_table *tb, const struct flowi *flp, struct fib_result *res)
1339{
1340 struct trie *t = (struct trie *) tb->tb_data;
1341 int plen, ret = 0;
1342 struct node *n;
1343 struct tnode *pn;
1344 int pos, bits;
Olof Johansson91b9a272005-08-09 20:24:39 -07001345 t_key key = ntohl(flp->fl4_dst);
Robert Olsson19baf832005-06-21 12:43:18 -07001346 int chopped_off;
1347 t_key cindex = 0;
1348 int current_prefix_length = KEYLENGTH;
Olof Johansson91b9a272005-08-09 20:24:39 -07001349 struct tnode *cn;
1350 t_key node_prefix, key_prefix, pref_mismatch;
1351 int mp;
1352
Robert Olsson2373ce12005-08-25 13:01:29 -07001353 rcu_read_lock();
Robert Olsson19baf832005-06-21 12:43:18 -07001354
Robert Olsson2373ce12005-08-25 13:01:29 -07001355 n = rcu_dereference(t->trie);
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001356 if (!n)
Robert Olsson19baf832005-06-21 12:43:18 -07001357 goto failed;
1358
1359#ifdef CONFIG_IP_FIB_TRIE_STATS
1360 t->stats.gets++;
1361#endif
1362
1363 /* Just a leaf? */
1364 if (IS_LEAF(n)) {
Patrick McHardy06c74272005-08-23 22:06:09 -07001365 if ((ret = check_leaf(t, (struct leaf *)n, key, &plen, flp, res)) <= 0)
Robert Olsson19baf832005-06-21 12:43:18 -07001366 goto found;
1367 goto failed;
1368 }
1369 pn = (struct tnode *) n;
1370 chopped_off = 0;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001371
Olof Johansson91b9a272005-08-09 20:24:39 -07001372 while (pn) {
Robert Olsson19baf832005-06-21 12:43:18 -07001373 pos = pn->pos;
1374 bits = pn->bits;
1375
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001376 if (!chopped_off)
Stephen Hemmingerab66b4a2007-08-10 15:22:58 -07001377 cindex = tkey_extract_bits(mask_pfx(key, current_prefix_length),
1378 pos, bits);
Robert Olsson19baf832005-06-21 12:43:18 -07001379
1380 n = tnode_get_child(pn, cindex);
1381
1382 if (n == NULL) {
1383#ifdef CONFIG_IP_FIB_TRIE_STATS
1384 t->stats.null_node_hit++;
1385#endif
1386 goto backtrace;
1387 }
1388
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001389 if (IS_LEAF(n)) {
Patrick McHardy06c74272005-08-23 22:06:09 -07001390 if ((ret = check_leaf(t, (struct leaf *)n, key, &plen, flp, res)) <= 0)
Robert Olsson19baf832005-06-21 12:43:18 -07001391 goto found;
Olof Johansson91b9a272005-08-09 20:24:39 -07001392 else
1393 goto backtrace;
1394 }
1395
1396#define HL_OPTIMIZE
1397#ifdef HL_OPTIMIZE
1398 cn = (struct tnode *)n;
1399
1400 /*
1401 * It's a tnode, and we can do some extra checks here if we
1402 * like, to avoid descending into a dead-end branch.
1403 * This tnode is in the parent's child array at index
1404 * key[p_pos..p_pos+p_bits] but potentially with some bits
1405 * chopped off, so in reality the index may be just a
1406 * subprefix, padded with zero at the end.
1407 * We can also take a look at any skipped bits in this
1408 * tnode - everything up to p_pos is supposed to be ok,
1409 * and the non-chopped bits of the index (se previous
1410 * paragraph) are also guaranteed ok, but the rest is
1411 * considered unknown.
1412 *
1413 * The skipped bits are key[pos+bits..cn->pos].
1414 */
1415
1416 /* If current_prefix_length < pos+bits, we are already doing
1417 * actual prefix matching, which means everything from
1418 * pos+(bits-chopped_off) onward must be zero along some
1419 * branch of this subtree - otherwise there is *no* valid
1420 * prefix present. Here we can only check the skipped
1421 * bits. Remember, since we have already indexed into the
1422 * parent's child array, we know that the bits we chopped of
1423 * *are* zero.
1424 */
1425
1426 /* NOTA BENE: CHECKING ONLY SKIPPED BITS FOR THE NEW NODE HERE */
1427
1428 if (current_prefix_length < pos+bits) {
1429 if (tkey_extract_bits(cn->key, current_prefix_length,
1430 cn->pos - current_prefix_length) != 0 ||
1431 !(cn->child[0]))
1432 goto backtrace;
1433 }
1434
1435 /*
1436 * If chopped_off=0, the index is fully validated and we
1437 * only need to look at the skipped bits for this, the new,
1438 * tnode. What we actually want to do is to find out if
1439 * these skipped bits match our key perfectly, or if we will
1440 * have to count on finding a matching prefix further down,
1441 * because if we do, we would like to have some way of
1442 * verifying the existence of such a prefix at this point.
1443 */
1444
1445 /* The only thing we can do at this point is to verify that
1446 * any such matching prefix can indeed be a prefix to our
1447 * key, and if the bits in the node we are inspecting that
1448 * do not match our key are not ZERO, this cannot be true.
1449 * Thus, find out where there is a mismatch (before cn->pos)
1450 * and verify that all the mismatching bits are zero in the
1451 * new tnode's key.
1452 */
1453
1454 /* Note: We aren't very concerned about the piece of the key
1455 * that precede pn->pos+pn->bits, since these have already been
1456 * checked. The bits after cn->pos aren't checked since these are
1457 * by definition "unknown" at this point. Thus, what we want to
1458 * see is if we are about to enter the "prefix matching" state,
1459 * and in that case verify that the skipped bits that will prevail
1460 * throughout this subtree are zero, as they have to be if we are
1461 * to find a matching prefix.
1462 */
1463
Stephen Hemmingerab66b4a2007-08-10 15:22:58 -07001464 node_prefix = mask_pfx(cn->key, cn->pos);
1465 key_prefix = mask_pfx(key, cn->pos);
Olof Johansson91b9a272005-08-09 20:24:39 -07001466 pref_mismatch = key_prefix^node_prefix;
1467 mp = 0;
1468
1469 /* In short: If skipped bits in this node do not match the search
1470 * key, enter the "prefix matching" state.directly.
1471 */
1472 if (pref_mismatch) {
1473 while (!(pref_mismatch & (1<<(KEYLENGTH-1)))) {
1474 mp++;
1475 pref_mismatch = pref_mismatch <<1;
1476 }
1477 key_prefix = tkey_extract_bits(cn->key, mp, cn->pos-mp);
1478
1479 if (key_prefix != 0)
1480 goto backtrace;
1481
1482 if (current_prefix_length >= cn->pos)
1483 current_prefix_length = mp;
1484 }
1485#endif
1486 pn = (struct tnode *)n; /* Descend */
1487 chopped_off = 0;
1488 continue;
1489
Robert Olsson19baf832005-06-21 12:43:18 -07001490backtrace:
1491 chopped_off++;
1492
1493 /* As zero don't change the child key (cindex) */
Olof Johansson91b9a272005-08-09 20:24:39 -07001494 while ((chopped_off <= pn->bits) && !(cindex & (1<<(chopped_off-1))))
Robert Olsson19baf832005-06-21 12:43:18 -07001495 chopped_off++;
Robert Olsson19baf832005-06-21 12:43:18 -07001496
1497 /* Decrease current_... with bits chopped off */
1498 if (current_prefix_length > pn->pos + pn->bits - chopped_off)
1499 current_prefix_length = pn->pos + pn->bits - chopped_off;
Olof Johansson91b9a272005-08-09 20:24:39 -07001500
Robert Olsson19baf832005-06-21 12:43:18 -07001501 /*
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001502 * Either we do the actual chop off according or if we have
Robert Olsson19baf832005-06-21 12:43:18 -07001503 * chopped off all bits in this tnode walk up to our parent.
1504 */
1505
Olof Johansson91b9a272005-08-09 20:24:39 -07001506 if (chopped_off <= pn->bits) {
Robert Olsson19baf832005-06-21 12:43:18 -07001507 cindex &= ~(1 << (chopped_off-1));
Olof Johansson91b9a272005-08-09 20:24:39 -07001508 } else {
Stephen Hemminger06801912007-08-10 15:22:13 -07001509 struct tnode *parent = node_parent((struct node *) pn);
1510 if (!parent)
Robert Olsson19baf832005-06-21 12:43:18 -07001511 goto failed;
Olof Johansson91b9a272005-08-09 20:24:39 -07001512
Robert Olsson19baf832005-06-21 12:43:18 -07001513 /* Get Child's index */
Stephen Hemminger06801912007-08-10 15:22:13 -07001514 cindex = tkey_extract_bits(pn->key, parent->pos, parent->bits);
1515 pn = parent;
Robert Olsson19baf832005-06-21 12:43:18 -07001516 chopped_off = 0;
1517
1518#ifdef CONFIG_IP_FIB_TRIE_STATS
1519 t->stats.backtrack++;
1520#endif
1521 goto backtrace;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001522 }
Robert Olsson19baf832005-06-21 12:43:18 -07001523 }
1524failed:
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001525 ret = 1;
Robert Olsson19baf832005-06-21 12:43:18 -07001526found:
Robert Olsson2373ce12005-08-25 13:01:29 -07001527 rcu_read_unlock();
Robert Olsson19baf832005-06-21 12:43:18 -07001528 return ret;
1529}
1530
Robert Olsson2373ce12005-08-25 13:01:29 -07001531/* only called from updater side */
Robert Olsson19baf832005-06-21 12:43:18 -07001532static int trie_leaf_remove(struct trie *t, t_key key)
1533{
1534 t_key cindex;
1535 struct tnode *tp = NULL;
1536 struct node *n = t->trie;
1537 struct leaf *l;
1538
Stephen Hemminger0c7770c2005-08-23 21:59:41 -07001539 pr_debug("entering trie_leaf_remove(%p)\n", n);
Robert Olsson19baf832005-06-21 12:43:18 -07001540
1541 /* Note that in the case skipped bits, those bits are *not* checked!
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001542 * When we finish this, we will have NULL or a T_LEAF, and the
Robert Olsson19baf832005-06-21 12:43:18 -07001543 * T_LEAF may or may not match our key.
1544 */
1545
Olof Johansson91b9a272005-08-09 20:24:39 -07001546 while (n != NULL && IS_TNODE(n)) {
Robert Olsson19baf832005-06-21 12:43:18 -07001547 struct tnode *tn = (struct tnode *) n;
1548 check_tnode(tn);
1549 n = tnode_get_child(tn ,tkey_extract_bits(key, tn->pos, tn->bits));
1550
Stephen Hemminger06801912007-08-10 15:22:13 -07001551 BUG_ON(n && node_parent(n) != tn);
Olof Johansson91b9a272005-08-09 20:24:39 -07001552 }
Robert Olsson19baf832005-06-21 12:43:18 -07001553 l = (struct leaf *) n;
1554
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001555 if (!n || !tkey_equals(l->key, key))
Robert Olsson19baf832005-06-21 12:43:18 -07001556 return 0;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001557
1558 /*
1559 * Key found.
1560 * Remove the leaf and rebalance the tree
Robert Olsson19baf832005-06-21 12:43:18 -07001561 */
1562
1563 t->revision++;
1564 t->size--;
1565
Stephen Hemminger06801912007-08-10 15:22:13 -07001566 tp = node_parent(n);
Robert Olsson19baf832005-06-21 12:43:18 -07001567 tnode_free((struct tnode *) n);
1568
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001569 if (tp) {
Robert Olsson19baf832005-06-21 12:43:18 -07001570 cindex = tkey_extract_bits(key, tp->pos, tp->bits);
1571 put_child(t, (struct tnode *)tp, cindex, NULL);
Robert Olsson2373ce12005-08-25 13:01:29 -07001572 rcu_assign_pointer(t->trie, trie_rebalance(t, tp));
Olof Johansson91b9a272005-08-09 20:24:39 -07001573 } else
Robert Olsson2373ce12005-08-25 13:01:29 -07001574 rcu_assign_pointer(t->trie, NULL);
Robert Olsson19baf832005-06-21 12:43:18 -07001575
1576 return 1;
1577}
1578
Robert Olssond562f1f2007-03-26 14:22:22 -07001579/*
1580 * Caller must hold RTNL.
1581 */
Thomas Graf4e902c52006-08-17 18:14:52 -07001582static int fn_trie_delete(struct fib_table *tb, struct fib_config *cfg)
Robert Olsson19baf832005-06-21 12:43:18 -07001583{
1584 struct trie *t = (struct trie *) tb->tb_data;
1585 u32 key, mask;
Thomas Graf4e902c52006-08-17 18:14:52 -07001586 int plen = cfg->fc_dst_len;
1587 u8 tos = cfg->fc_tos;
Robert Olsson19baf832005-06-21 12:43:18 -07001588 struct fib_alias *fa, *fa_to_delete;
1589 struct list_head *fa_head;
1590 struct leaf *l;
Olof Johansson91b9a272005-08-09 20:24:39 -07001591 struct leaf_info *li;
1592
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001593 if (plen > 32)
Robert Olsson19baf832005-06-21 12:43:18 -07001594 return -EINVAL;
1595
Thomas Graf4e902c52006-08-17 18:14:52 -07001596 key = ntohl(cfg->fc_dst);
Olof Johansson91b9a272005-08-09 20:24:39 -07001597 mask = ntohl(inet_make_mask(plen));
Robert Olsson19baf832005-06-21 12:43:18 -07001598
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001599 if (key & ~mask)
Robert Olsson19baf832005-06-21 12:43:18 -07001600 return -EINVAL;
1601
1602 key = key & mask;
1603 l = fib_find_node(t, key);
1604
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001605 if (!l)
Robert Olsson19baf832005-06-21 12:43:18 -07001606 return -ESRCH;
1607
1608 fa_head = get_fa_head(l, plen);
1609 fa = fib_find_alias(fa_head, tos, 0);
1610
1611 if (!fa)
1612 return -ESRCH;
1613
Stephen Hemminger0c7770c2005-08-23 21:59:41 -07001614 pr_debug("Deleting %08x/%d tos=%d t=%p\n", key, plen, tos, t);
Robert Olsson19baf832005-06-21 12:43:18 -07001615
1616 fa_to_delete = NULL;
1617 fa_head = fa->fa_list.prev;
Robert Olsson2373ce12005-08-25 13:01:29 -07001618
Robert Olsson19baf832005-06-21 12:43:18 -07001619 list_for_each_entry(fa, fa_head, fa_list) {
1620 struct fib_info *fi = fa->fa_info;
1621
1622 if (fa->fa_tos != tos)
1623 break;
1624
Thomas Graf4e902c52006-08-17 18:14:52 -07001625 if ((!cfg->fc_type || fa->fa_type == cfg->fc_type) &&
1626 (cfg->fc_scope == RT_SCOPE_NOWHERE ||
1627 fa->fa_scope == cfg->fc_scope) &&
1628 (!cfg->fc_protocol ||
1629 fi->fib_protocol == cfg->fc_protocol) &&
1630 fib_nh_match(cfg, fi) == 0) {
Robert Olsson19baf832005-06-21 12:43:18 -07001631 fa_to_delete = fa;
1632 break;
1633 }
1634 }
1635
Olof Johansson91b9a272005-08-09 20:24:39 -07001636 if (!fa_to_delete)
1637 return -ESRCH;
Robert Olsson19baf832005-06-21 12:43:18 -07001638
Olof Johansson91b9a272005-08-09 20:24:39 -07001639 fa = fa_to_delete;
Thomas Graf4e902c52006-08-17 18:14:52 -07001640 rtmsg_fib(RTM_DELROUTE, htonl(key), fa, plen, tb->tb_id,
Milan Kocianb8f55832007-05-23 14:55:06 -07001641 &cfg->fc_nlinfo, 0);
Robert Olsson19baf832005-06-21 12:43:18 -07001642
Olof Johansson91b9a272005-08-09 20:24:39 -07001643 l = fib_find_node(t, key);
Robert Olsson772cb712005-09-19 15:31:18 -07001644 li = find_leaf_info(l, plen);
Robert Olsson19baf832005-06-21 12:43:18 -07001645
Robert Olsson2373ce12005-08-25 13:01:29 -07001646 list_del_rcu(&fa->fa_list);
Robert Olsson19baf832005-06-21 12:43:18 -07001647
Olof Johansson91b9a272005-08-09 20:24:39 -07001648 if (list_empty(fa_head)) {
Robert Olsson2373ce12005-08-25 13:01:29 -07001649 hlist_del_rcu(&li->hlist);
Olof Johansson91b9a272005-08-09 20:24:39 -07001650 free_leaf_info(li);
Robert Olsson2373ce12005-08-25 13:01:29 -07001651 }
Olof Johansson91b9a272005-08-09 20:24:39 -07001652
1653 if (hlist_empty(&l->list))
1654 trie_leaf_remove(t, key);
1655
1656 if (fa->fa_state & FA_S_ACCESSED)
1657 rt_cache_flush(-1);
1658
Robert Olsson2373ce12005-08-25 13:01:29 -07001659 fib_release_info(fa->fa_info);
1660 alias_free_mem_rcu(fa);
Olof Johansson91b9a272005-08-09 20:24:39 -07001661 return 0;
Robert Olsson19baf832005-06-21 12:43:18 -07001662}
1663
1664static int trie_flush_list(struct trie *t, struct list_head *head)
1665{
1666 struct fib_alias *fa, *fa_node;
1667 int found = 0;
1668
1669 list_for_each_entry_safe(fa, fa_node, head, fa_list) {
1670 struct fib_info *fi = fa->fa_info;
Robert Olsson19baf832005-06-21 12:43:18 -07001671
Robert Olsson2373ce12005-08-25 13:01:29 -07001672 if (fi && (fi->fib_flags & RTNH_F_DEAD)) {
1673 list_del_rcu(&fa->fa_list);
1674 fib_release_info(fa->fa_info);
1675 alias_free_mem_rcu(fa);
Robert Olsson19baf832005-06-21 12:43:18 -07001676 found++;
1677 }
1678 }
1679 return found;
1680}
1681
1682static int trie_flush_leaf(struct trie *t, struct leaf *l)
1683{
1684 int found = 0;
1685 struct hlist_head *lih = &l->list;
1686 struct hlist_node *node, *tmp;
1687 struct leaf_info *li = NULL;
1688
1689 hlist_for_each_entry_safe(li, node, tmp, lih, hlist) {
Robert Olsson19baf832005-06-21 12:43:18 -07001690 found += trie_flush_list(t, &li->falh);
1691
1692 if (list_empty(&li->falh)) {
Robert Olsson2373ce12005-08-25 13:01:29 -07001693 hlist_del_rcu(&li->hlist);
Robert Olsson19baf832005-06-21 12:43:18 -07001694 free_leaf_info(li);
1695 }
1696 }
1697 return found;
1698}
1699
Robert Olsson2373ce12005-08-25 13:01:29 -07001700/* rcu_read_lock needs to be hold by caller from readside */
1701
Robert Olsson19baf832005-06-21 12:43:18 -07001702static struct leaf *nextleaf(struct trie *t, struct leaf *thisleaf)
1703{
1704 struct node *c = (struct node *) thisleaf;
1705 struct tnode *p;
1706 int idx;
Robert Olsson2373ce12005-08-25 13:01:29 -07001707 struct node *trie = rcu_dereference(t->trie);
Robert Olsson19baf832005-06-21 12:43:18 -07001708
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001709 if (c == NULL) {
Robert Olsson2373ce12005-08-25 13:01:29 -07001710 if (trie == NULL)
Robert Olsson19baf832005-06-21 12:43:18 -07001711 return NULL;
1712
Robert Olsson2373ce12005-08-25 13:01:29 -07001713 if (IS_LEAF(trie)) /* trie w. just a leaf */
1714 return (struct leaf *) trie;
Robert Olsson19baf832005-06-21 12:43:18 -07001715
Robert Olsson2373ce12005-08-25 13:01:29 -07001716 p = (struct tnode*) trie; /* Start */
Olof Johansson91b9a272005-08-09 20:24:39 -07001717 } else
Stephen Hemminger06801912007-08-10 15:22:13 -07001718 p = node_parent(c);
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001719
Robert Olsson19baf832005-06-21 12:43:18 -07001720 while (p) {
1721 int pos, last;
1722
1723 /* Find the next child of the parent */
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001724 if (c)
1725 pos = 1 + tkey_extract_bits(c->key, p->pos, p->bits);
1726 else
Robert Olsson19baf832005-06-21 12:43:18 -07001727 pos = 0;
1728
1729 last = 1 << p->bits;
Olof Johansson91b9a272005-08-09 20:24:39 -07001730 for (idx = pos; idx < last ; idx++) {
Robert Olsson2373ce12005-08-25 13:01:29 -07001731 c = rcu_dereference(p->child[idx]);
1732
1733 if (!c)
Olof Johansson91b9a272005-08-09 20:24:39 -07001734 continue;
Robert Olsson19baf832005-06-21 12:43:18 -07001735
Olof Johansson91b9a272005-08-09 20:24:39 -07001736 /* Decend if tnode */
Robert Olsson2373ce12005-08-25 13:01:29 -07001737 while (IS_TNODE(c)) {
1738 p = (struct tnode *) c;
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001739 idx = 0;
Robert Olsson19baf832005-06-21 12:43:18 -07001740
Olof Johansson91b9a272005-08-09 20:24:39 -07001741 /* Rightmost non-NULL branch */
1742 if (p && IS_TNODE(p))
Robert Olsson2373ce12005-08-25 13:01:29 -07001743 while (!(c = rcu_dereference(p->child[idx]))
1744 && idx < (1<<p->bits)) idx++;
Robert Olsson19baf832005-06-21 12:43:18 -07001745
Olof Johansson91b9a272005-08-09 20:24:39 -07001746 /* Done with this tnode? */
Robert Olsson2373ce12005-08-25 13:01:29 -07001747 if (idx >= (1 << p->bits) || !c)
Olof Johansson91b9a272005-08-09 20:24:39 -07001748 goto up;
Robert Olsson19baf832005-06-21 12:43:18 -07001749 }
Robert Olsson2373ce12005-08-25 13:01:29 -07001750 return (struct leaf *) c;
Robert Olsson19baf832005-06-21 12:43:18 -07001751 }
1752up:
1753 /* No more children go up one step */
Olof Johansson91b9a272005-08-09 20:24:39 -07001754 c = (struct node *) p;
Stephen Hemminger06801912007-08-10 15:22:13 -07001755 p = node_parent(c);
Robert Olsson19baf832005-06-21 12:43:18 -07001756 }
1757 return NULL; /* Ready. Root of trie */
1758}
1759
Robert Olssond562f1f2007-03-26 14:22:22 -07001760/*
1761 * Caller must hold RTNL.
1762 */
Robert Olsson19baf832005-06-21 12:43:18 -07001763static int fn_trie_flush(struct fib_table *tb)
1764{
1765 struct trie *t = (struct trie *) tb->tb_data;
1766 struct leaf *ll = NULL, *l = NULL;
1767 int found = 0, h;
1768
1769 t->revision++;
1770
Olof Johansson91b9a272005-08-09 20:24:39 -07001771 for (h = 0; (l = nextleaf(t, l)) != NULL; h++) {
Robert Olsson19baf832005-06-21 12:43:18 -07001772 found += trie_flush_leaf(t, l);
1773
1774 if (ll && hlist_empty(&ll->list))
1775 trie_leaf_remove(t, ll->key);
1776 ll = l;
1777 }
1778
1779 if (ll && hlist_empty(&ll->list))
1780 trie_leaf_remove(t, ll->key);
1781
Stephen Hemminger0c7770c2005-08-23 21:59:41 -07001782 pr_debug("trie_flush found=%d\n", found);
Robert Olsson19baf832005-06-21 12:43:18 -07001783 return found;
1784}
1785
Olof Johansson91b9a272005-08-09 20:24:39 -07001786static int trie_last_dflt = -1;
Robert Olsson19baf832005-06-21 12:43:18 -07001787
1788static void
1789fn_trie_select_default(struct fib_table *tb, const struct flowi *flp, struct fib_result *res)
1790{
1791 struct trie *t = (struct trie *) tb->tb_data;
1792 int order, last_idx;
1793 struct fib_info *fi = NULL;
1794 struct fib_info *last_resort;
1795 struct fib_alias *fa = NULL;
1796 struct list_head *fa_head;
1797 struct leaf *l;
1798
1799 last_idx = -1;
1800 last_resort = NULL;
1801 order = -1;
1802
Robert Olsson2373ce12005-08-25 13:01:29 -07001803 rcu_read_lock();
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001804
Robert Olsson19baf832005-06-21 12:43:18 -07001805 l = fib_find_node(t, 0);
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001806 if (!l)
Robert Olsson19baf832005-06-21 12:43:18 -07001807 goto out;
1808
1809 fa_head = get_fa_head(l, 0);
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001810 if (!fa_head)
Robert Olsson19baf832005-06-21 12:43:18 -07001811 goto out;
1812
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001813 if (list_empty(fa_head))
Robert Olsson19baf832005-06-21 12:43:18 -07001814 goto out;
1815
Robert Olsson2373ce12005-08-25 13:01:29 -07001816 list_for_each_entry_rcu(fa, fa_head, fa_list) {
Robert Olsson19baf832005-06-21 12:43:18 -07001817 struct fib_info *next_fi = fa->fa_info;
Olof Johansson91b9a272005-08-09 20:24:39 -07001818
Robert Olsson19baf832005-06-21 12:43:18 -07001819 if (fa->fa_scope != res->scope ||
1820 fa->fa_type != RTN_UNICAST)
1821 continue;
Olof Johansson91b9a272005-08-09 20:24:39 -07001822
Robert Olsson19baf832005-06-21 12:43:18 -07001823 if (next_fi->fib_priority > res->fi->fib_priority)
1824 break;
1825 if (!next_fi->fib_nh[0].nh_gw ||
1826 next_fi->fib_nh[0].nh_scope != RT_SCOPE_LINK)
1827 continue;
1828 fa->fa_state |= FA_S_ACCESSED;
Olof Johansson91b9a272005-08-09 20:24:39 -07001829
Robert Olsson19baf832005-06-21 12:43:18 -07001830 if (fi == NULL) {
1831 if (next_fi != res->fi)
1832 break;
1833 } else if (!fib_detect_death(fi, order, &last_resort,
1834 &last_idx, &trie_last_dflt)) {
1835 if (res->fi)
1836 fib_info_put(res->fi);
1837 res->fi = fi;
1838 atomic_inc(&fi->fib_clntref);
1839 trie_last_dflt = order;
1840 goto out;
1841 }
1842 fi = next_fi;
1843 order++;
1844 }
1845 if (order <= 0 || fi == NULL) {
1846 trie_last_dflt = -1;
1847 goto out;
1848 }
1849
1850 if (!fib_detect_death(fi, order, &last_resort, &last_idx, &trie_last_dflt)) {
1851 if (res->fi)
1852 fib_info_put(res->fi);
1853 res->fi = fi;
1854 atomic_inc(&fi->fib_clntref);
1855 trie_last_dflt = order;
1856 goto out;
1857 }
1858 if (last_idx >= 0) {
1859 if (res->fi)
1860 fib_info_put(res->fi);
1861 res->fi = last_resort;
1862 if (last_resort)
1863 atomic_inc(&last_resort->fib_clntref);
1864 }
1865 trie_last_dflt = last_idx;
1866 out:;
Robert Olsson2373ce12005-08-25 13:01:29 -07001867 rcu_read_unlock();
Robert Olsson19baf832005-06-21 12:43:18 -07001868}
1869
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001870static int fn_trie_dump_fa(t_key key, int plen, struct list_head *fah, struct fib_table *tb,
Robert Olsson19baf832005-06-21 12:43:18 -07001871 struct sk_buff *skb, struct netlink_callback *cb)
1872{
1873 int i, s_i;
1874 struct fib_alias *fa;
1875
Al Viro32ab5f82006-09-26 22:21:45 -07001876 __be32 xkey = htonl(key);
Robert Olsson19baf832005-06-21 12:43:18 -07001877
Patrick McHardy1af5a8c2006-08-10 23:10:46 -07001878 s_i = cb->args[4];
Robert Olsson19baf832005-06-21 12:43:18 -07001879 i = 0;
1880
Robert Olsson2373ce12005-08-25 13:01:29 -07001881 /* rcu_read_lock is hold by caller */
1882
1883 list_for_each_entry_rcu(fa, fah, fa_list) {
Robert Olsson19baf832005-06-21 12:43:18 -07001884 if (i < s_i) {
1885 i++;
1886 continue;
1887 }
Stephen Hemminger78c66712005-09-21 00:15:39 -07001888 BUG_ON(!fa->fa_info);
Robert Olsson19baf832005-06-21 12:43:18 -07001889
1890 if (fib_dump_info(skb, NETLINK_CB(cb->skb).pid,
1891 cb->nlh->nlmsg_seq,
1892 RTM_NEWROUTE,
1893 tb->tb_id,
1894 fa->fa_type,
1895 fa->fa_scope,
Thomas Grafbe403ea2006-08-17 18:15:17 -07001896 xkey,
Robert Olsson19baf832005-06-21 12:43:18 -07001897 plen,
1898 fa->fa_tos,
David S. Miller90f66912005-06-21 14:43:28 -07001899 fa->fa_info, 0) < 0) {
Patrick McHardy1af5a8c2006-08-10 23:10:46 -07001900 cb->args[4] = i;
Robert Olsson19baf832005-06-21 12:43:18 -07001901 return -1;
Olof Johansson91b9a272005-08-09 20:24:39 -07001902 }
Robert Olsson19baf832005-06-21 12:43:18 -07001903 i++;
1904 }
Patrick McHardy1af5a8c2006-08-10 23:10:46 -07001905 cb->args[4] = i;
Robert Olsson19baf832005-06-21 12:43:18 -07001906 return skb->len;
1907}
1908
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001909static int fn_trie_dump_plen(struct trie *t, int plen, struct fib_table *tb, struct sk_buff *skb,
Robert Olsson19baf832005-06-21 12:43:18 -07001910 struct netlink_callback *cb)
1911{
1912 int h, s_h;
1913 struct list_head *fa_head;
1914 struct leaf *l = NULL;
Robert Olsson19baf832005-06-21 12:43:18 -07001915
Patrick McHardy1af5a8c2006-08-10 23:10:46 -07001916 s_h = cb->args[3];
Robert Olsson19baf832005-06-21 12:43:18 -07001917
Olof Johansson91b9a272005-08-09 20:24:39 -07001918 for (h = 0; (l = nextleaf(t, l)) != NULL; h++) {
Robert Olsson19baf832005-06-21 12:43:18 -07001919 if (h < s_h)
1920 continue;
1921 if (h > s_h)
Patrick McHardy1af5a8c2006-08-10 23:10:46 -07001922 memset(&cb->args[4], 0,
1923 sizeof(cb->args) - 4*sizeof(cb->args[0]));
Robert Olsson19baf832005-06-21 12:43:18 -07001924
1925 fa_head = get_fa_head(l, plen);
Olof Johansson91b9a272005-08-09 20:24:39 -07001926
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001927 if (!fa_head)
Robert Olsson19baf832005-06-21 12:43:18 -07001928 continue;
1929
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07001930 if (list_empty(fa_head))
Robert Olsson19baf832005-06-21 12:43:18 -07001931 continue;
1932
1933 if (fn_trie_dump_fa(l->key, plen, fa_head, tb, skb, cb)<0) {
Patrick McHardy1af5a8c2006-08-10 23:10:46 -07001934 cb->args[3] = h;
Robert Olsson19baf832005-06-21 12:43:18 -07001935 return -1;
1936 }
1937 }
Patrick McHardy1af5a8c2006-08-10 23:10:46 -07001938 cb->args[3] = h;
Robert Olsson19baf832005-06-21 12:43:18 -07001939 return skb->len;
1940}
1941
1942static int fn_trie_dump(struct fib_table *tb, struct sk_buff *skb, struct netlink_callback *cb)
1943{
1944 int m, s_m;
1945 struct trie *t = (struct trie *) tb->tb_data;
1946
Patrick McHardy1af5a8c2006-08-10 23:10:46 -07001947 s_m = cb->args[2];
Robert Olsson19baf832005-06-21 12:43:18 -07001948
Robert Olsson2373ce12005-08-25 13:01:29 -07001949 rcu_read_lock();
Olof Johansson91b9a272005-08-09 20:24:39 -07001950 for (m = 0; m <= 32; m++) {
Robert Olsson19baf832005-06-21 12:43:18 -07001951 if (m < s_m)
1952 continue;
1953 if (m > s_m)
Patrick McHardy1af5a8c2006-08-10 23:10:46 -07001954 memset(&cb->args[3], 0,
1955 sizeof(cb->args) - 3*sizeof(cb->args[0]));
Robert Olsson19baf832005-06-21 12:43:18 -07001956
1957 if (fn_trie_dump_plen(t, 32-m, tb, skb, cb)<0) {
Patrick McHardy1af5a8c2006-08-10 23:10:46 -07001958 cb->args[2] = m;
Robert Olsson19baf832005-06-21 12:43:18 -07001959 goto out;
1960 }
1961 }
Robert Olsson2373ce12005-08-25 13:01:29 -07001962 rcu_read_unlock();
Patrick McHardy1af5a8c2006-08-10 23:10:46 -07001963 cb->args[2] = m;
Robert Olsson19baf832005-06-21 12:43:18 -07001964 return skb->len;
Olof Johansson91b9a272005-08-09 20:24:39 -07001965out:
Robert Olsson2373ce12005-08-25 13:01:29 -07001966 rcu_read_unlock();
Robert Olsson19baf832005-06-21 12:43:18 -07001967 return -1;
1968}
1969
1970/* Fix more generic FIB names for init later */
1971
1972#ifdef CONFIG_IP_MULTIPLE_TABLES
Patrick McHardy2dfe55b2006-08-10 23:08:33 -07001973struct fib_table * fib_hash_init(u32 id)
Robert Olsson19baf832005-06-21 12:43:18 -07001974#else
Patrick McHardy2dfe55b2006-08-10 23:08:33 -07001975struct fib_table * __init fib_hash_init(u32 id)
Robert Olsson19baf832005-06-21 12:43:18 -07001976#endif
1977{
1978 struct fib_table *tb;
1979 struct trie *t;
1980
1981 if (fn_alias_kmem == NULL)
1982 fn_alias_kmem = kmem_cache_create("ip_fib_alias",
1983 sizeof(struct fib_alias),
1984 0, SLAB_HWCACHE_ALIGN,
Paul Mundt20c2df82007-07-20 10:11:58 +09001985 NULL);
Robert Olsson19baf832005-06-21 12:43:18 -07001986
1987 tb = kmalloc(sizeof(struct fib_table) + sizeof(struct trie),
1988 GFP_KERNEL);
1989 if (tb == NULL)
1990 return NULL;
1991
1992 tb->tb_id = id;
1993 tb->tb_lookup = fn_trie_lookup;
1994 tb->tb_insert = fn_trie_insert;
1995 tb->tb_delete = fn_trie_delete;
1996 tb->tb_flush = fn_trie_flush;
1997 tb->tb_select_default = fn_trie_select_default;
1998 tb->tb_dump = fn_trie_dump;
1999 memset(tb->tb_data, 0, sizeof(struct trie));
2000
2001 t = (struct trie *) tb->tb_data;
2002
2003 trie_init(t);
2004
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07002005 if (id == RT_TABLE_LOCAL)
Olof Johansson91b9a272005-08-09 20:24:39 -07002006 trie_local = t;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07002007 else if (id == RT_TABLE_MAIN)
Olof Johansson91b9a272005-08-09 20:24:39 -07002008 trie_main = t;
Robert Olsson19baf832005-06-21 12:43:18 -07002009
2010 if (id == RT_TABLE_LOCAL)
Stephen Hemminger78c66712005-09-21 00:15:39 -07002011 printk(KERN_INFO "IPv4 FIB: Using LC-trie version %s\n", VERSION);
Robert Olsson19baf832005-06-21 12:43:18 -07002012
2013 return tb;
2014}
2015
Robert Olsson19baf832005-06-21 12:43:18 -07002016#ifdef CONFIG_PROC_FS
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002017/* Depth first Trie walk iterator */
2018struct fib_trie_iter {
2019 struct tnode *tnode;
2020 struct trie *trie;
2021 unsigned index;
2022 unsigned depth;
2023};
Robert Olsson19baf832005-06-21 12:43:18 -07002024
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002025static struct node *fib_trie_get_next(struct fib_trie_iter *iter)
Robert Olsson19baf832005-06-21 12:43:18 -07002026{
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002027 struct tnode *tn = iter->tnode;
2028 unsigned cindex = iter->index;
2029 struct tnode *p;
2030
Eric W. Biederman6640e692007-01-24 14:42:04 -08002031 /* A single entry routing table */
2032 if (!tn)
2033 return NULL;
2034
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002035 pr_debug("get_next iter={node=%p index=%d depth=%d}\n",
2036 iter->tnode, iter->index, iter->depth);
2037rescan:
2038 while (cindex < (1<<tn->bits)) {
2039 struct node *n = tnode_get_child(tn, cindex);
2040
2041 if (n) {
2042 if (IS_LEAF(n)) {
2043 iter->tnode = tn;
2044 iter->index = cindex + 1;
2045 } else {
2046 /* push down one level */
2047 iter->tnode = (struct tnode *) n;
2048 iter->index = 0;
2049 ++iter->depth;
2050 }
2051 return n;
2052 }
2053
2054 ++cindex;
2055 }
2056
2057 /* Current node exhausted, pop back up */
Stephen Hemminger06801912007-08-10 15:22:13 -07002058 p = node_parent((struct node *)tn);
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002059 if (p) {
2060 cindex = tkey_extract_bits(tn->key, p->pos, p->bits)+1;
2061 tn = p;
2062 --iter->depth;
2063 goto rescan;
2064 }
2065
2066 /* got root? */
Robert Olsson19baf832005-06-21 12:43:18 -07002067 return NULL;
2068}
2069
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002070static struct node *fib_trie_get_first(struct fib_trie_iter *iter,
2071 struct trie *t)
Robert Olsson19baf832005-06-21 12:43:18 -07002072{
Robert Olsson5ddf0eb2006-03-20 21:34:12 -08002073 struct node *n ;
2074
Stephen Hemminger132adf52007-03-08 20:44:43 -08002075 if (!t)
Robert Olsson5ddf0eb2006-03-20 21:34:12 -08002076 return NULL;
2077
2078 n = rcu_dereference(t->trie);
2079
Stephen Hemminger132adf52007-03-08 20:44:43 -08002080 if (!iter)
Robert Olsson5ddf0eb2006-03-20 21:34:12 -08002081 return NULL;
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002082
Eric W. Biederman6640e692007-01-24 14:42:04 -08002083 if (n) {
2084 if (IS_TNODE(n)) {
2085 iter->tnode = (struct tnode *) n;
2086 iter->trie = t;
2087 iter->index = 0;
2088 iter->depth = 1;
2089 } else {
2090 iter->tnode = NULL;
2091 iter->trie = t;
2092 iter->index = 0;
2093 iter->depth = 0;
2094 }
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002095 return n;
2096 }
Robert Olsson19baf832005-06-21 12:43:18 -07002097 return NULL;
2098}
2099
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002100static void trie_collect_stats(struct trie *t, struct trie_stat *s)
Robert Olsson19baf832005-06-21 12:43:18 -07002101{
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002102 struct node *n;
2103 struct fib_trie_iter iter;
Robert Olsson19baf832005-06-21 12:43:18 -07002104
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002105 memset(s, 0, sizeof(*s));
Robert Olsson19baf832005-06-21 12:43:18 -07002106
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002107 rcu_read_lock();
2108 for (n = fib_trie_get_first(&iter, t); n;
2109 n = fib_trie_get_next(&iter)) {
2110 if (IS_LEAF(n)) {
2111 s->leaves++;
2112 s->totdepth += iter.depth;
2113 if (iter.depth > s->maxdepth)
2114 s->maxdepth = iter.depth;
2115 } else {
2116 const struct tnode *tn = (const struct tnode *) n;
2117 int i;
Robert Olsson19baf832005-06-21 12:43:18 -07002118
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002119 s->tnodes++;
Stephen Hemminger132adf52007-03-08 20:44:43 -08002120 if (tn->bits < MAX_STAT_DEPTH)
Robert Olsson06ef9212006-03-20 21:35:01 -08002121 s->nodesizes[tn->bits]++;
2122
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002123 for (i = 0; i < (1<<tn->bits); i++)
2124 if (!tn->child[i])
2125 s->nullpointers++;
2126 }
2127 }
2128 rcu_read_unlock();
Robert Olsson19baf832005-06-21 12:43:18 -07002129}
2130
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07002131/*
Robert Olsson19baf832005-06-21 12:43:18 -07002132 * This outputs /proc/net/fib_triestats
Robert Olsson19baf832005-06-21 12:43:18 -07002133 */
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002134static void trie_show_stats(struct seq_file *seq, struct trie_stat *stat)
Robert Olsson19baf832005-06-21 12:43:18 -07002135{
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002136 unsigned i, max, pointers, bytes, avdepth;
Robert Olsson19baf832005-06-21 12:43:18 -07002137
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002138 if (stat->leaves)
2139 avdepth = stat->totdepth*100 / stat->leaves;
2140 else
2141 avdepth = 0;
Robert Olsson19baf832005-06-21 12:43:18 -07002142
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002143 seq_printf(seq, "\tAver depth: %d.%02d\n", avdepth / 100, avdepth % 100 );
2144 seq_printf(seq, "\tMax depth: %u\n", stat->maxdepth);
Robert Olsson19baf832005-06-21 12:43:18 -07002145
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002146 seq_printf(seq, "\tLeaves: %u\n", stat->leaves);
Olof Johansson91b9a272005-08-09 20:24:39 -07002147
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002148 bytes = sizeof(struct leaf) * stat->leaves;
2149 seq_printf(seq, "\tInternal nodes: %d\n\t", stat->tnodes);
2150 bytes += sizeof(struct tnode) * stat->tnodes;
Robert Olsson19baf832005-06-21 12:43:18 -07002151
Robert Olsson06ef9212006-03-20 21:35:01 -08002152 max = MAX_STAT_DEPTH;
2153 while (max > 0 && stat->nodesizes[max-1] == 0)
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002154 max--;
Robert Olsson19baf832005-06-21 12:43:18 -07002155
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002156 pointers = 0;
2157 for (i = 1; i <= max; i++)
2158 if (stat->nodesizes[i] != 0) {
2159 seq_printf(seq, " %d: %d", i, stat->nodesizes[i]);
2160 pointers += (1<<i) * stat->nodesizes[i];
2161 }
2162 seq_putc(seq, '\n');
2163 seq_printf(seq, "\tPointers: %d\n", pointers);
Robert Olsson19baf832005-06-21 12:43:18 -07002164
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002165 bytes += sizeof(struct node *) * pointers;
2166 seq_printf(seq, "Null ptrs: %d\n", stat->nullpointers);
2167 seq_printf(seq, "Total size: %d kB\n", (bytes + 1023) / 1024);
Robert Olsson19baf832005-06-21 12:43:18 -07002168
2169#ifdef CONFIG_IP_FIB_TRIE_STATS
2170 seq_printf(seq, "Counters:\n---------\n");
2171 seq_printf(seq,"gets = %d\n", t->stats.gets);
2172 seq_printf(seq,"backtracks = %d\n", t->stats.backtrack);
2173 seq_printf(seq,"semantic match passed = %d\n", t->stats.semantic_match_passed);
2174 seq_printf(seq,"semantic match miss = %d\n", t->stats.semantic_match_miss);
2175 seq_printf(seq,"null node hit= %d\n", t->stats.null_node_hit);
Robert Olsson2f368952005-07-05 15:02:40 -07002176 seq_printf(seq,"skipped node resize = %d\n", t->stats.resize_node_skipped);
Robert Olsson19baf832005-06-21 12:43:18 -07002177#ifdef CLEAR_STATS
2178 memset(&(t->stats), 0, sizeof(t->stats));
2179#endif
2180#endif /* CONFIG_IP_FIB_TRIE_STATS */
2181}
2182
2183static int fib_triestat_seq_show(struct seq_file *seq, void *v)
2184{
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002185 struct trie_stat *stat;
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07002186
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002187 stat = kmalloc(sizeof(*stat), GFP_KERNEL);
2188 if (!stat)
2189 return -ENOMEM;
Robert Olsson19baf832005-06-21 12:43:18 -07002190
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002191 seq_printf(seq, "Basic info: size of leaf: %Zd bytes, size of tnode: %Zd bytes.\n",
2192 sizeof(struct leaf), sizeof(struct tnode));
Olof Johansson91b9a272005-08-09 20:24:39 -07002193
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002194 if (trie_local) {
2195 seq_printf(seq, "Local:\n");
2196 trie_collect_stats(trie_local, stat);
2197 trie_show_stats(seq, stat);
Robert Olsson19baf832005-06-21 12:43:18 -07002198 }
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002199
2200 if (trie_main) {
2201 seq_printf(seq, "Main:\n");
2202 trie_collect_stats(trie_main, stat);
2203 trie_show_stats(seq, stat);
2204 }
2205 kfree(stat);
2206
Robert Olsson19baf832005-06-21 12:43:18 -07002207 return 0;
2208}
2209
Robert Olsson19baf832005-06-21 12:43:18 -07002210static int fib_triestat_seq_open(struct inode *inode, struct file *file)
2211{
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002212 return single_open(file, fib_triestat_seq_show, NULL);
Robert Olsson19baf832005-06-21 12:43:18 -07002213}
2214
Arjan van de Ven9a321442007-02-12 00:55:35 -08002215static const struct file_operations fib_triestat_fops = {
Stephen Hemmingerc877efb2005-07-19 14:01:51 -07002216 .owner = THIS_MODULE,
2217 .open = fib_triestat_seq_open,
2218 .read = seq_read,
2219 .llseek = seq_lseek,
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002220 .release = single_release,
Robert Olsson19baf832005-06-21 12:43:18 -07002221};
2222
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002223static struct node *fib_trie_get_idx(struct fib_trie_iter *iter,
2224 loff_t pos)
Robert Olsson19baf832005-06-21 12:43:18 -07002225{
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002226 loff_t idx = 0;
2227 struct node *n;
Robert Olsson19baf832005-06-21 12:43:18 -07002228
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002229 for (n = fib_trie_get_first(iter, trie_local);
2230 n; ++idx, n = fib_trie_get_next(iter)) {
2231 if (pos == idx)
2232 return n;
2233 }
Robert Olsson19baf832005-06-21 12:43:18 -07002234
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002235 for (n = fib_trie_get_first(iter, trie_main);
2236 n; ++idx, n = fib_trie_get_next(iter)) {
2237 if (pos == idx)
2238 return n;
2239 }
Robert Olsson19baf832005-06-21 12:43:18 -07002240 return NULL;
2241}
2242
2243static void *fib_trie_seq_start(struct seq_file *seq, loff_t *pos)
2244{
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002245 rcu_read_lock();
2246 if (*pos == 0)
Olof Johansson91b9a272005-08-09 20:24:39 -07002247 return SEQ_START_TOKEN;
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002248 return fib_trie_get_idx(seq->private, *pos - 1);
Robert Olsson19baf832005-06-21 12:43:18 -07002249}
2250
2251static void *fib_trie_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2252{
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002253 struct fib_trie_iter *iter = seq->private;
2254 void *l = v;
2255
Robert Olsson19baf832005-06-21 12:43:18 -07002256 ++*pos;
Olof Johansson91b9a272005-08-09 20:24:39 -07002257 if (v == SEQ_START_TOKEN)
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002258 return fib_trie_get_idx(iter, 0);
Olof Johansson91b9a272005-08-09 20:24:39 -07002259
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002260 v = fib_trie_get_next(iter);
2261 BUG_ON(v == l);
2262 if (v)
2263 return v;
2264
2265 /* continue scan in next trie */
2266 if (iter->trie == trie_local)
2267 return fib_trie_get_first(iter, trie_main);
2268
2269 return NULL;
Robert Olsson19baf832005-06-21 12:43:18 -07002270}
2271
2272static void fib_trie_seq_stop(struct seq_file *seq, void *v)
2273{
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002274 rcu_read_unlock();
Robert Olsson19baf832005-06-21 12:43:18 -07002275}
2276
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002277static void seq_indent(struct seq_file *seq, int n)
2278{
2279 while (n-- > 0) seq_puts(seq, " ");
2280}
Robert Olsson19baf832005-06-21 12:43:18 -07002281
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002282static inline const char *rtn_scope(enum rt_scope_t s)
2283{
2284 static char buf[32];
2285
Stephen Hemminger132adf52007-03-08 20:44:43 -08002286 switch (s) {
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002287 case RT_SCOPE_UNIVERSE: return "universe";
2288 case RT_SCOPE_SITE: return "site";
2289 case RT_SCOPE_LINK: return "link";
2290 case RT_SCOPE_HOST: return "host";
2291 case RT_SCOPE_NOWHERE: return "nowhere";
2292 default:
2293 snprintf(buf, sizeof(buf), "scope=%d", s);
2294 return buf;
2295 }
2296}
2297
2298static const char *rtn_type_names[__RTN_MAX] = {
2299 [RTN_UNSPEC] = "UNSPEC",
2300 [RTN_UNICAST] = "UNICAST",
2301 [RTN_LOCAL] = "LOCAL",
2302 [RTN_BROADCAST] = "BROADCAST",
2303 [RTN_ANYCAST] = "ANYCAST",
2304 [RTN_MULTICAST] = "MULTICAST",
2305 [RTN_BLACKHOLE] = "BLACKHOLE",
2306 [RTN_UNREACHABLE] = "UNREACHABLE",
2307 [RTN_PROHIBIT] = "PROHIBIT",
2308 [RTN_THROW] = "THROW",
2309 [RTN_NAT] = "NAT",
2310 [RTN_XRESOLVE] = "XRESOLVE",
2311};
2312
2313static inline const char *rtn_type(unsigned t)
2314{
2315 static char buf[32];
2316
2317 if (t < __RTN_MAX && rtn_type_names[t])
2318 return rtn_type_names[t];
2319 snprintf(buf, sizeof(buf), "type %d", t);
2320 return buf;
2321}
2322
2323/* Pretty print the trie */
Robert Olsson19baf832005-06-21 12:43:18 -07002324static int fib_trie_seq_show(struct seq_file *seq, void *v)
2325{
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002326 const struct fib_trie_iter *iter = seq->private;
2327 struct node *n = v;
Robert Olsson19baf832005-06-21 12:43:18 -07002328
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002329 if (v == SEQ_START_TOKEN)
2330 return 0;
Robert Olsson19baf832005-06-21 12:43:18 -07002331
Stephen Hemminger06801912007-08-10 15:22:13 -07002332 if (!node_parent(n)) {
Robert Olsson095b8502007-01-26 19:06:01 -08002333 if (iter->trie == trie_local)
2334 seq_puts(seq, "<local>:\n");
2335 else
2336 seq_puts(seq, "<main>:\n");
2337 }
2338
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002339 if (IS_TNODE(n)) {
2340 struct tnode *tn = (struct tnode *) n;
Stephen Hemmingerab66b4a2007-08-10 15:22:58 -07002341 __be32 prf = htonl(mask_pfx(tn->key, tn->pos));
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002342
Robert Olsson1d25cd62005-09-19 15:29:52 -07002343 seq_indent(seq, iter->depth-1);
2344 seq_printf(seq, " +-- %d.%d.%d.%d/%d %d %d %d\n",
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09002345 NIPQUAD(prf), tn->pos, tn->bits, tn->full_children,
Robert Olsson1d25cd62005-09-19 15:29:52 -07002346 tn->empty_children);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09002347
Olof Johansson91b9a272005-08-09 20:24:39 -07002348 } else {
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002349 struct leaf *l = (struct leaf *) n;
2350 int i;
Al Viro32ab5f82006-09-26 22:21:45 -07002351 __be32 val = htonl(l->key);
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002352
2353 seq_indent(seq, iter->depth);
2354 seq_printf(seq, " |-- %d.%d.%d.%d\n", NIPQUAD(val));
2355 for (i = 32; i >= 0; i--) {
Robert Olsson772cb712005-09-19 15:31:18 -07002356 struct leaf_info *li = find_leaf_info(l, i);
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002357 if (li) {
2358 struct fib_alias *fa;
2359 list_for_each_entry_rcu(fa, &li->falh, fa_list) {
2360 seq_indent(seq, iter->depth+1);
2361 seq_printf(seq, " /%d %s %s", i,
2362 rtn_scope(fa->fa_scope),
2363 rtn_type(fa->fa_type));
2364 if (fa->fa_tos)
2365 seq_printf(seq, "tos =%d\n",
2366 fa->fa_tos);
2367 seq_putc(seq, '\n');
2368 }
2369 }
2370 }
Robert Olsson19baf832005-06-21 12:43:18 -07002371 }
2372
2373 return 0;
2374}
2375
Stephen Hemmingerf6908082007-03-12 14:34:29 -07002376static const struct seq_operations fib_trie_seq_ops = {
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002377 .start = fib_trie_seq_start,
2378 .next = fib_trie_seq_next,
2379 .stop = fib_trie_seq_stop,
2380 .show = fib_trie_seq_show,
Robert Olsson19baf832005-06-21 12:43:18 -07002381};
2382
2383static int fib_trie_seq_open(struct inode *inode, struct file *file)
2384{
Pavel Emelyanovcf7732e2007-10-10 02:29:29 -07002385 return seq_open_private(file, &fib_trie_seq_ops,
2386 sizeof(struct fib_trie_iter));
Robert Olsson19baf832005-06-21 12:43:18 -07002387}
2388
Arjan van de Ven9a321442007-02-12 00:55:35 -08002389static const struct file_operations fib_trie_fops = {
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002390 .owner = THIS_MODULE,
2391 .open = fib_trie_seq_open,
2392 .read = seq_read,
2393 .llseek = seq_lseek,
2394 .release = seq_release_private,
2395};
2396
Al Viro32ab5f82006-09-26 22:21:45 -07002397static unsigned fib_flag_trans(int type, __be32 mask, const struct fib_info *fi)
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002398{
2399 static unsigned type2flags[RTN_MAX + 1] = {
2400 [7] = RTF_REJECT, [8] = RTF_REJECT,
2401 };
2402 unsigned flags = type2flags[type];
2403
2404 if (fi && fi->fib_nh->nh_gw)
2405 flags |= RTF_GATEWAY;
Al Viro32ab5f82006-09-26 22:21:45 -07002406 if (mask == htonl(0xFFFFFFFF))
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002407 flags |= RTF_HOST;
2408 flags |= RTF_UP;
2409 return flags;
2410}
2411
2412/*
2413 * This outputs /proc/net/route.
2414 * The format of the file is not supposed to be changed
2415 * and needs to be same as fib_hash output to avoid breaking
2416 * legacy utilities
2417 */
2418static int fib_route_seq_show(struct seq_file *seq, void *v)
2419{
Patrick McHardyc9e53cb2005-11-20 21:09:00 -08002420 const struct fib_trie_iter *iter = seq->private;
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002421 struct leaf *l = v;
2422 int i;
2423 char bf[128];
2424
2425 if (v == SEQ_START_TOKEN) {
2426 seq_printf(seq, "%-127s\n", "Iface\tDestination\tGateway "
2427 "\tFlags\tRefCnt\tUse\tMetric\tMask\t\tMTU"
2428 "\tWindow\tIRTT");
2429 return 0;
2430 }
2431
Patrick McHardyc9e53cb2005-11-20 21:09:00 -08002432 if (iter->trie == trie_local)
2433 return 0;
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002434 if (IS_TNODE(l))
2435 return 0;
2436
2437 for (i=32; i>=0; i--) {
Robert Olsson772cb712005-09-19 15:31:18 -07002438 struct leaf_info *li = find_leaf_info(l, i);
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002439 struct fib_alias *fa;
Al Viro32ab5f82006-09-26 22:21:45 -07002440 __be32 mask, prefix;
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002441
2442 if (!li)
2443 continue;
2444
2445 mask = inet_make_mask(li->plen);
2446 prefix = htonl(l->key);
2447
2448 list_for_each_entry_rcu(fa, &li->falh, fa_list) {
Herbert Xu1371e372005-10-15 09:42:39 +10002449 const struct fib_info *fi = fa->fa_info;
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002450 unsigned flags = fib_flag_trans(fa->fa_type, mask, fi);
2451
2452 if (fa->fa_type == RTN_BROADCAST
2453 || fa->fa_type == RTN_MULTICAST)
2454 continue;
2455
2456 if (fi)
2457 snprintf(bf, sizeof(bf),
2458 "%s\t%08X\t%08X\t%04X\t%d\t%u\t%d\t%08X\t%d\t%u\t%u",
2459 fi->fib_dev ? fi->fib_dev->name : "*",
2460 prefix,
2461 fi->fib_nh->nh_gw, flags, 0, 0,
2462 fi->fib_priority,
2463 mask,
2464 (fi->fib_advmss ? fi->fib_advmss + 40 : 0),
2465 fi->fib_window,
2466 fi->fib_rtt >> 3);
2467 else
2468 snprintf(bf, sizeof(bf),
2469 "*\t%08X\t%08X\t%04X\t%d\t%u\t%d\t%08X\t%d\t%u\t%u",
2470 prefix, 0, flags, 0, 0, 0,
2471 mask, 0, 0, 0);
2472
2473 seq_printf(seq, "%-127s\n", bf);
2474 }
2475 }
2476
2477 return 0;
2478}
2479
Stephen Hemmingerf6908082007-03-12 14:34:29 -07002480static const struct seq_operations fib_route_seq_ops = {
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002481 .start = fib_trie_seq_start,
2482 .next = fib_trie_seq_next,
2483 .stop = fib_trie_seq_stop,
2484 .show = fib_route_seq_show,
2485};
2486
2487static int fib_route_seq_open(struct inode *inode, struct file *file)
2488{
Pavel Emelyanovcf7732e2007-10-10 02:29:29 -07002489 return seq_open_private(file, &fib_route_seq_ops,
2490 sizeof(struct fib_trie_iter));
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002491}
2492
Arjan van de Ven9a321442007-02-12 00:55:35 -08002493static const struct file_operations fib_route_fops = {
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002494 .owner = THIS_MODULE,
2495 .open = fib_route_seq_open,
2496 .read = seq_read,
2497 .llseek = seq_lseek,
2498 .release = seq_release_private,
Robert Olsson19baf832005-06-21 12:43:18 -07002499};
2500
2501int __init fib_proc_init(void)
2502{
Eric W. Biederman457c4cb2007-09-12 12:01:34 +02002503 if (!proc_net_fops_create(&init_net, "fib_trie", S_IRUGO, &fib_trie_fops))
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002504 goto out1;
2505
Eric W. Biederman457c4cb2007-09-12 12:01:34 +02002506 if (!proc_net_fops_create(&init_net, "fib_triestat", S_IRUGO, &fib_triestat_fops))
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002507 goto out2;
2508
Eric W. Biederman457c4cb2007-09-12 12:01:34 +02002509 if (!proc_net_fops_create(&init_net, "route", S_IRUGO, &fib_route_fops))
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002510 goto out3;
2511
Robert Olsson19baf832005-06-21 12:43:18 -07002512 return 0;
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002513
2514out3:
Eric W. Biederman457c4cb2007-09-12 12:01:34 +02002515 proc_net_remove(&init_net, "fib_triestat");
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002516out2:
Eric W. Biederman457c4cb2007-09-12 12:01:34 +02002517 proc_net_remove(&init_net, "fib_trie");
Stephen Hemmingercb7b5932005-09-09 13:35:42 -07002518out1:
2519 return -ENOMEM;
Robert Olsson19baf832005-06-21 12:43:18 -07002520}
2521
2522void __init fib_proc_exit(void)
2523{
Eric W. Biederman457c4cb2007-09-12 12:01:34 +02002524 proc_net_remove(&init_net, "fib_trie");
2525 proc_net_remove(&init_net, "fib_triestat");
2526 proc_net_remove(&init_net, "route");
Robert Olsson19baf832005-06-21 12:43:18 -07002527}
2528
2529#endif /* CONFIG_PROC_FS */