blob: 5e0196084f1e8ad4c22c54165915309f7b330bc5 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * INET An implementation of the TCP/IP protocol suite for the LINUX
3 * operating system. INET is implemented using the BSD Socket
4 * interface as the means of communication with the user level.
5 *
6 * Definitions for the Forwarding Information Base.
7 *
8 * Authors: A.N.Kuznetsov, <kuznet@ms2.inr.ac.ru>
9 *
10 * This program is free software; you can redistribute it and/or
11 * modify it under the terms of the GNU General Public License
12 * as published by the Free Software Foundation; either version
13 * 2 of the License, or (at your option) any later version.
14 */
15
16#ifndef _NET_IP_FIB_H
17#define _NET_IP_FIB_H
18
Linus Torvalds1da177e2005-04-16 15:20:36 -070019#include <net/flow.h>
20#include <linux/seq_file.h>
David S. Miller4895c772012-07-17 04:19:00 -070021#include <linux/rcupdate.h>
Thomas Grafe1ef4bf2006-08-04 03:39:22 -070022#include <net/fib_rules.h>
David S. Miller8e773272012-06-11 00:01:52 -070023#include <net/inetpeer.h>
Eric Dumazetd26b3a72012-07-31 05:45:30 +000024#include <linux/percpu.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070025
Thomas Graf4e902c52006-08-17 18:14:52 -070026struct fib_config {
Thomas Graf4e902c52006-08-17 18:14:52 -070027 u8 fc_dst_len;
Thomas Graf4e902c52006-08-17 18:14:52 -070028 u8 fc_tos;
29 u8 fc_protocol;
30 u8 fc_scope;
31 u8 fc_type;
Thomas Grafb52f0702006-10-18 20:26:36 -070032 /* 3 bytes unused */
Thomas Graf4e902c52006-08-17 18:14:52 -070033 u32 fc_table;
Al Viro6d85c102006-09-26 22:15:46 -070034 __be32 fc_dst;
Al Viro6d85c102006-09-26 22:15:46 -070035 __be32 fc_gw;
Thomas Graf4e902c52006-08-17 18:14:52 -070036 int fc_oif;
37 u32 fc_flags;
38 u32 fc_priority;
Al Viro6d85c102006-09-26 22:15:46 -070039 __be32 fc_prefsrc;
Thomas Graf4e902c52006-08-17 18:14:52 -070040 struct nlattr *fc_mx;
41 struct rtnexthop *fc_mp;
42 int fc_mx_len;
43 int fc_mp_len;
44 u32 fc_flow;
Thomas Graf4e902c52006-08-17 18:14:52 -070045 u32 fc_nlflags;
46 struct nl_info fc_nlinfo;
Roopa Prabhu571e7222015-07-21 10:43:47 +020047 struct nlattr *fc_encap;
48 u16 fc_encap_type;
49};
Linus Torvalds1da177e2005-04-16 15:20:36 -070050
51struct fib_info;
David S. Millerf2bb4be2012-07-17 12:20:47 -070052struct rtable;
Linus Torvalds1da177e2005-04-16 15:20:36 -070053
David S. Miller4895c772012-07-17 04:19:00 -070054struct fib_nh_exception {
55 struct fib_nh_exception __rcu *fnhe_next;
Timo Teräs5aad1de2013-05-27 20:46:33 +000056 int fnhe_genid;
David S. Miller4895c772012-07-17 04:19:00 -070057 __be32 fnhe_daddr;
58 u32 fnhe_pmtu;
Julian Anastasovaee06da2012-07-18 10:15:35 +000059 __be32 fnhe_gw;
David S. Miller4895c772012-07-17 04:19:00 -070060 unsigned long fnhe_expires;
Timo Teräs2ffae992013-06-27 10:27:05 +030061 struct rtable __rcu *fnhe_rth_input;
62 struct rtable __rcu *fnhe_rth_output;
David S. Miller4895c772012-07-17 04:19:00 -070063 unsigned long fnhe_stamp;
64};
65
66struct fnhe_hash_bucket {
67 struct fib_nh_exception __rcu *chain;
68};
69
/*
 * FNHE_HASH_SIZE is 2^FNHE_HASH_SHIFT (2048).
 * NOTE(review): presumably the number of fnhe_hash_bucket entries behind
 * fib_nh::nh_exceptions; FNHE_RECLAIM_DEPTH is consumed outside this
 * header - confirm both against the users in route.c.
 */
#define FNHE_HASH_SHIFT		11
#define FNHE_HASH_SIZE		(1 << FNHE_HASH_SHIFT)
#define FNHE_RECLAIM_DEPTH	5
73
Linus Torvalds1da177e2005-04-16 15:20:36 -070074struct fib_nh {
75 struct net_device *nh_dev;
76 struct hlist_node nh_hash;
77 struct fib_info *nh_parent;
Eric Dumazet95c96172012-04-15 05:58:06 +000078 unsigned int nh_flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -070079 unsigned char nh_scope;
80#ifdef CONFIG_IP_ROUTE_MULTIPATH
81 int nh_weight;
82 int nh_power;
83#endif
Patrick McHardyc7066f72011-01-14 13:36:42 +010084#ifdef CONFIG_IP_ROUTE_CLASSID
Linus Torvalds1da177e2005-04-16 15:20:36 -070085 __u32 nh_tclassid;
86#endif
87 int nh_oif;
Al Viroed49e3c2006-09-26 22:13:54 -070088 __be32 nh_gw;
David S. Miller1fc050a2011-03-07 20:54:48 -080089 __be32 nh_saddr;
David S. Miller436c3b62011-03-24 17:42:21 -070090 int nh_saddr_genid;
Eric Dumazetd26b3a72012-07-31 05:45:30 +000091 struct rtable __rcu * __percpu *nh_pcpu_rth_output;
Eric Dumazet54764bb2012-07-31 01:08:23 +000092 struct rtable __rcu *nh_rth_input;
Eric Dumazetcaa41522014-09-03 22:21:56 -070093 struct fnhe_hash_bucket __rcu *nh_exceptions;
Roopa Prabhu571e7222015-07-21 10:43:47 +020094 struct lwtunnel_state *nh_lwtstate;
Linus Torvalds1da177e2005-04-16 15:20:36 -070095};
96
97/*
98 * This structure contains data shared by many of routes.
99 */
100
101struct fib_info {
102 struct hlist_node fib_hash;
103 struct hlist_node fib_lhash;
Denis V. Lunev7462bd742008-01-31 18:49:32 -0800104 struct net *fib_net;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700105 int fib_treeref;
106 atomic_t fib_clntref;
Eric Dumazet95c96172012-04-15 05:58:06 +0000107 unsigned int fib_flags;
David S. Miller37e826c2011-03-24 18:06:47 -0700108 unsigned char fib_dead;
109 unsigned char fib_protocol;
110 unsigned char fib_scope;
Eric Dumazetf4ef85b2012-10-04 01:25:26 +0000111 unsigned char fib_type;
Al Virob83738a2006-09-26 22:14:15 -0700112 __be32 fib_prefsrc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700113 u32 fib_priority;
David S. Miller9c150e82011-01-28 14:01:25 -0800114 u32 *fib_metrics;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700115#define fib_mtu fib_metrics[RTAX_MTU-1]
116#define fib_window fib_metrics[RTAX_WINDOW-1]
117#define fib_rtt fib_metrics[RTAX_RTT-1]
118#define fib_advmss fib_metrics[RTAX_ADVMSS-1]
119 int fib_nhs;
120#ifdef CONFIG_IP_ROUTE_MULTIPATH
121 int fib_power;
122#endif
Eric Dumazetebc0ffa2010-10-05 10:41:36 +0000123 struct rcu_head rcu;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700124 struct fib_nh fib_nh[0];
125#define fib_dev fib_nh[0].nh_dev
126};
127
128
129#ifdef CONFIG_IP_MULTIPLE_TABLES
130struct fib_rule;
131#endif
132
David S. Miller5b470442011-01-31 16:10:03 -0800133struct fib_table;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700134struct fib_result {
135 unsigned char prefixlen;
136 unsigned char nh_sel;
137 unsigned char type;
138 unsigned char scope;
David S. Miller85b91b02012-07-13 08:21:29 -0700139 u32 tclassid;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700140 struct fib_info *fi;
David S. Miller5b470442011-01-31 16:10:03 -0800141 struct fib_table *table;
Alexander Duyck56315f92015-02-25 15:31:31 -0800142 struct hlist_head *fa_head;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700143};
144
Robert Olsson246955f2005-06-20 13:36:39 -0700145struct fib_result_nl {
Al Viro80e856e2006-09-26 22:19:36 -0700146 __be32 fl_addr; /* To be looked up*/
Thomas Graf5f3008932006-11-09 15:21:41 -0800147 u32 fl_mark;
Robert Olsson246955f2005-06-20 13:36:39 -0700148 unsigned char fl_tos;
149 unsigned char fl_scope;
150 unsigned char tb_id_in;
151
152 unsigned char tb_id; /* Results */
153 unsigned char prefixlen;
154 unsigned char nh_sel;
155 unsigned char type;
156 unsigned char scope;
157 int err;
158};
Linus Torvalds1da177e2005-04-16 15:20:36 -0700159
/*
 * FIB_RES_NH(res) - the struct fib_nh selected by lookup result @res
 * (a struct fib_result lvalue, not a pointer).
 *
 * With multipath routing the nexthop is picked by res.nh_sel; without it
 * the macro always yields fib_nh[0] and ignores nh_sel.
 */
#if defined(CONFIG_IP_ROUTE_MULTIPATH)
#define FIB_RES_NH(res)		((res).fi->fib_nh[(res).nh_sel])
#else
#define FIB_RES_NH(res)		((res).fi->fib_nh[0])
#endif /* CONFIG_IP_ROUTE_MULTIPATH */
165
/*
 * Size of the per-namespace fib_table_hash[] array.  Without multiple
 * table support only two slots are needed (see TABLE_LOCAL_INDEX and
 * TABLE_MAIN_INDEX).
 */
#if defined(CONFIG_IP_MULTIPLE_TABLES)
#define FIB_TABLE_HASHSZ	256
#else
#define FIB_TABLE_HASHSZ	2
#endif
171
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700172__be32 fib_info_update_nh_saddr(struct net *net, struct fib_nh *nh);
David S. Miller436c3b62011-03-24 17:42:21 -0700173
174#define FIB_RES_SADDR(net, res) \
175 ((FIB_RES_NH(res).nh_saddr_genid == \
176 atomic_read(&(net)->ipv4.dev_addr_genid)) ? \
177 FIB_RES_NH(res).nh_saddr : \
178 fib_info_update_nh_saddr((net), &FIB_RES_NH(res)))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179#define FIB_RES_GW(res) (FIB_RES_NH(res).nh_gw)
180#define FIB_RES_DEV(res) (FIB_RES_NH(res).nh_dev)
181#define FIB_RES_OIF(res) (FIB_RES_NH(res).nh_oif)
182
David S. Miller436c3b62011-03-24 17:42:21 -0700183#define FIB_RES_PREFSRC(net, res) ((res).fi->fib_prefsrc ? : \
184 FIB_RES_SADDR(net, res))
David S. Miller1fc050a2011-03-07 20:54:48 -0800185
Linus Torvalds1da177e2005-04-16 15:20:36 -0700186struct fib_table {
David S. Miller8e773272012-06-11 00:01:52 -0700187 struct hlist_node tb_hlist;
188 u32 tb_id;
189 int tb_default;
190 int tb_num_default;
Alexander Duycka7e53532015-03-04 15:02:44 -0800191 struct rcu_head rcu;
Alexander Duyck0ddcf432015-03-06 13:47:00 -0800192 unsigned long *tb_data;
193 unsigned long __data[0];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700194};
195
/* Per-table operations; the definitions live outside this header. */
int fib_table_lookup(struct fib_table *tb, const struct flowi4 *flp,
		     struct fib_result *res, int fib_flags);
int fib_table_insert(struct fib_table *tb, struct fib_config *cfg);
int fib_table_delete(struct fib_table *tb, struct fib_config *cfg);
int fib_table_dump(struct fib_table *table, struct sk_buff *skb,
		   struct netlink_callback *cb);
int fib_table_flush(struct fib_table *table);
struct fib_table *fib_trie_unmerge(struct fib_table *main_tb);
void fib_table_flush_external(struct fib_table *table);
void fib_free_table(struct fib_table *tb);
Pavel Emelyanov4aa2c462010-10-28 02:00:43 +0000206
Linus Torvalds1da177e2005-04-16 15:20:36 -0700207#ifndef CONFIG_IP_MULTIPLE_TABLES
208
/* Slots of the local and main tables inside fib_table_hash[]. */
#define TABLE_LOCAL_INDEX	(RT_TABLE_LOCAL & (FIB_TABLE_HASHSZ - 1))
#define TABLE_MAIN_INDEX	(RT_TABLE_MAIN & (FIB_TABLE_HASHSZ - 1))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700211
Denis V. Lunev8ad49422008-01-10 03:24:11 -0800212static inline struct fib_table *fib_get_table(struct net *net, u32 id)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700213{
Alexander Duycka7e53532015-03-04 15:02:44 -0800214 struct hlist_node *tb_hlist;
Denis V. Lunev93456b62008-01-10 03:23:38 -0800215 struct hlist_head *ptr;
216
217 ptr = id == RT_TABLE_LOCAL ?
Denis V. Luneve4aef8a2008-01-10 03:28:24 -0800218 &net->ipv4.fib_table_hash[TABLE_LOCAL_INDEX] :
219 &net->ipv4.fib_table_hash[TABLE_MAIN_INDEX];
Alexander Duycka7e53532015-03-04 15:02:44 -0800220
221 tb_hlist = rcu_dereference_rtnl(hlist_first_rcu(ptr));
222
223 return hlist_entry(tb_hlist, struct fib_table, tb_hlist);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700224}
225
Denis V. Lunev8ad49422008-01-10 03:24:11 -0800226static inline struct fib_table *fib_new_table(struct net *net, u32 id)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227{
Denis V. Lunev8ad49422008-01-10 03:24:11 -0800228 return fib_get_table(net, id);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229}
230
David S. Miller22bd5b92011-03-11 19:54:08 -0500231static inline int fib_lookup(struct net *net, const struct flowi4 *flp,
Andy Gospodarek0eeb0752015-06-23 13:45:37 -0400232 struct fib_result *res, unsigned int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700233{
Alexander Duycka7e53532015-03-04 15:02:44 -0800234 struct fib_table *tb;
Alexander Duyck0ddcf432015-03-06 13:47:00 -0800235 int err = -ENETUNREACH;
Denis V. Lunev93456b62008-01-10 03:23:38 -0800236
Alexander Duyck345e9b52014-12-31 10:56:24 -0800237 rcu_read_lock();
Denis V. Lunev93456b62008-01-10 03:23:38 -0800238
Alexander Duyck0ddcf432015-03-06 13:47:00 -0800239 tb = fib_get_table(net, RT_TABLE_MAIN);
Andy Gospodarek0eeb0752015-06-23 13:45:37 -0400240 if (tb && !fib_table_lookup(tb, flp, res, flags | FIB_LOOKUP_NOREF))
Alexander Duyck0ddcf432015-03-06 13:47:00 -0800241 err = 0;
Alexander Duyck345e9b52014-12-31 10:56:24 -0800242
243 rcu_read_unlock();
244
245 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246}
247
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248#else /* CONFIG_IP_MULTIPLE_TABLES */
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700249int __net_init fib4_rules_init(struct net *net);
250void __net_exit fib4_rules_exit(struct net *net);
Pavel Emelyanovc3e9a352007-11-06 23:34:04 -0800251
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700252struct fib_table *fib_new_table(struct net *net, u32 id);
253struct fib_table *fib_get_table(struct net *net, u32 id);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254
Andy Gospodarek0eeb0752015-06-23 13:45:37 -0400255int __fib_lookup(struct net *net, struct flowi4 *flp,
256 struct fib_result *res, unsigned int flags);
David S. Millerf4530fa2012-07-05 22:13:13 -0700257
258static inline int fib_lookup(struct net *net, struct flowi4 *flp,
Andy Gospodarek0eeb0752015-06-23 13:45:37 -0400259 struct fib_result *res, unsigned int flags)
David S. Millerf4530fa2012-07-05 22:13:13 -0700260{
Alexander Duycka7e53532015-03-04 15:02:44 -0800261 struct fib_table *tb;
262 int err;
Alexander Duyck345e9b52014-12-31 10:56:24 -0800263
Andy Gospodarek0eeb0752015-06-23 13:45:37 -0400264 flags |= FIB_LOOKUP_NOREF;
Alexander Duycka7e53532015-03-04 15:02:44 -0800265 if (net->ipv4.fib_has_custom_rules)
Andy Gospodarek0eeb0752015-06-23 13:45:37 -0400266 return __fib_lookup(net, flp, res, flags);
Alexander Duyck345e9b52014-12-31 10:56:24 -0800267
Alexander Duycka7e53532015-03-04 15:02:44 -0800268 rcu_read_lock();
Alexander Duyck345e9b52014-12-31 10:56:24 -0800269
Alexander Duycka7e53532015-03-04 15:02:44 -0800270 res->tclassid = 0;
Alexander Duyck345e9b52014-12-31 10:56:24 -0800271
Alexander Duycka7e53532015-03-04 15:02:44 -0800272 for (err = 0; !err; err = -ENETUNREACH) {
Alexander Duycka7e53532015-03-04 15:02:44 -0800273 tb = rcu_dereference_rtnl(net->ipv4.fib_main);
Andy Gospodarek0eeb0752015-06-23 13:45:37 -0400274 if (tb && !fib_table_lookup(tb, flp, res, flags))
Alexander Duycka7e53532015-03-04 15:02:44 -0800275 break;
276
277 tb = rcu_dereference_rtnl(net->ipv4.fib_default);
Andy Gospodarek0eeb0752015-06-23 13:45:37 -0400278 if (tb && !fib_table_lookup(tb, flp, res, flags))
Alexander Duycka7e53532015-03-04 15:02:44 -0800279 break;
David S. Millerf4530fa2012-07-05 22:13:13 -0700280 }
Alexander Duycka7e53532015-03-04 15:02:44 -0800281
282 rcu_read_unlock();
283
284 return err;
David S. Millerf4530fa2012-07-05 22:13:13 -0700285}
286
Linus Torvalds1da177e2005-04-16 15:20:36 -0700287#endif /* CONFIG_IP_MULTIPLE_TABLES */
288
289/* Exported by fib_frontend.c */
Patrick McHardyef7c79e2007-06-05 12:38:30 -0700290extern const struct nla_policy rtm_ipv4_policy[];
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700291void ip_fib_init(void);
292__be32 fib_compute_spec_dst(struct sk_buff *skb);
293int fib_validate_source(struct sk_buff *skb, __be32 src, __be32 dst,
294 u8 tos, int oif, struct net_device *dev,
295 struct in_device *idev, u32 *itag);
296void fib_select_default(struct fib_result *res);
/*
 * fib_num_tclassid_users - read the namespace's tclassid user counter
 * @net: network namespace
 *
 * Returns net->ipv4.fib_num_tclassid_users when CONFIG_IP_ROUTE_CLASSID
 * is enabled and 0 otherwise.
 */
static inline int fib_num_tclassid_users(struct net *net)
{
#ifdef CONFIG_IP_ROUTE_CLASSID
	return net->ipv4.fib_num_tclassid_users;
#else
	return 0;
#endif
}
Alexander Duyck0ddcf432015-03-06 13:47:00 -0800308int fib_unmerge(struct net *net);
Scott Feldman104616e2015-03-05 21:21:16 -0800309void fib_flush_external(struct net *net);
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -0200310
Linus Torvalds1da177e2005-04-16 15:20:36 -0700311/* Exported by fib_semantics.c */
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700312int ip_fib_check_default(__be32 gw, struct net_device *dev);
Andy Gospodarek8a3d0312015-06-23 13:45:36 -0400313int fib_sync_down_dev(struct net_device *dev, unsigned long event);
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700314int fib_sync_down_addr(struct net *net, __be32 local);
Andy Gospodarek8a3d0312015-06-23 13:45:36 -0400315int fib_sync_up(struct net_device *dev, unsigned int nh_flags);
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700316void fib_select_multipath(struct fib_result *res);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700317
David S. Miller5348ba82011-02-01 15:30:56 -0800318/* Exported by fib_trie.c */
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700319void fib_trie_init(void);
Alexander Duyck0ddcf432015-03-06 13:47:00 -0800320struct fib_table *fib_trie_table(u32 id, struct fib_table *alias);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700321
David S. Millerb6bf3ca2011-02-16 22:04:57 -0800322static inline void fib_combine_itag(u32 *itag, const struct fib_result *res)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323{
Patrick McHardyc7066f72011-01-14 13:36:42 +0100324#ifdef CONFIG_IP_ROUTE_CLASSID
Linus Torvalds1da177e2005-04-16 15:20:36 -0700325#ifdef CONFIG_IP_MULTIPLE_TABLES
326 u32 rtag;
327#endif
328 *itag = FIB_RES_NH(*res).nh_tclassid<<16;
329#ifdef CONFIG_IP_MULTIPLE_TABLES
David S. Miller85b91b02012-07-13 08:21:29 -0700330 rtag = res->tclassid;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700331 if (*itag == 0)
332 *itag = (rtag<<16);
333 *itag |= (rtag>>16);
334#endif
335#endif
336}
337
Joe Perches5c3a0fd2013-09-21 10:22:42 -0700338void free_fib_info(struct fib_info *fi);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339
340static inline void fib_info_put(struct fib_info *fi)
341{
342 if (atomic_dec_and_test(&fi->fib_clntref))
343 free_fib_info(fi);
344}
345
/*
 * /proc hooks.  Without CONFIG_PROC_FS they collapse to stubs:
 * fib_proc_init() reports success (0) and fib_proc_exit() does nothing.
 */
#ifdef CONFIG_PROC_FS
int __net_init fib_proc_init(struct net *net);
void __net_exit fib_proc_exit(struct net *net);
#else /* !CONFIG_PROC_FS */
static inline int fib_proc_init(struct net *net)
{
	return 0;
}

static inline void fib_proc_exit(struct net *net)
{
}
#endif /* CONFIG_PROC_FS */
358
#endif /* _NET_IP_FIB_H */