blob: 720d90653a8e1dabfc041269449c065dcd83de17 [file] [log] [blame]
/*
 * net/dst.h	Protocol independent destination cache definitions.
 *
 * Authors:	Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 *
 */
7
8#ifndef _NET_DST_H
9#define _NET_DST_H
10
Alexey Dobriyan86393e52009-08-29 01:34:49 +000011#include <net/dst_ops.h>
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020012#include <linux/netdevice.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070013#include <linux/rtnetlink.h>
14#include <linux/rcupdate.h>
15#include <linux/jiffies.h>
16#include <net/neighbour.h>
17#include <asm/processor.h>
18
/*
 * 0 - no debugging messages
 * 1 - rare events and bugs (default)
 * 2 - trace mode.
 */
/* Routing cache debug verbosity; this header selects level 0. */
#define RT_CACHE_DEBUG		0

/*
 * DST_GC_* timing constants, expressed in jiffies via HZ.
 * NOTE(review): presumably the minimum, increment and maximum of the
 * garbage collector's interval; their users are not visible in this header.
 */
#define DST_GC_MIN	(HZ / 10)
#define DST_GC_INC	(HZ / 2)
#define DST_GC_MAX	(120 * HZ)
29
/* Each dst_entry has a reference count and sits in some parent list(s).
 * When it is removed from the parent list, it is "freed" (dst_free).
 * After this it enters the dead state (dst->obsolete > 0) and, if its
 * refcnt is zero, it can be destroyed immediately; otherwise it is added
 * to the gc list and the garbage collector periodically checks the refcnt.
 */
36
37struct sk_buff;
38
39struct dst_entry
40{
Eric Dumazet1e19e022007-02-09 16:26:55 -080041 struct rcu_head rcu_head;
Linus Torvalds1da177e2005-04-16 15:20:36 -070042 struct dst_entry *child;
43 struct net_device *dev;
Herbert Xuc4d54112005-04-19 20:46:37 -070044 short error;
45 short obsolete;
Linus Torvalds1da177e2005-04-16 15:20:36 -070046 int flags;
47#define DST_HOST 1
48#define DST_NOXFRM 2
49#define DST_NOPOLICY 4
50#define DST_NOHASH 8
Linus Torvalds1da177e2005-04-16 15:20:36 -070051 unsigned long expires;
52
53 unsigned short header_len; /* more space at head required */
54 unsigned short trailer_len; /* space to reserve at tail */
55
Eric Dumazet69a73822008-01-22 06:18:34 -080056 unsigned int rate_tokens;
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070057 unsigned long rate_last; /* rate limiting for ICMP */
Eric Dumazet69a73822008-01-22 06:18:34 -080058
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070059 struct dst_entry *path;
Linus Torvalds1da177e2005-04-16 15:20:36 -070060
Linus Torvalds1da177e2005-04-16 15:20:36 -070061 struct neighbour *neighbour;
62 struct hh_cache *hh;
Alexey Dobriyandef8b4f2008-10-28 13:24:06 -070063#ifdef CONFIG_XFRM
Linus Torvalds1da177e2005-04-16 15:20:36 -070064 struct xfrm_state *xfrm;
Eric Dumazet5635c102008-11-16 19:46:36 -080065#else
66 void *__pad1;
Alexey Dobriyandef8b4f2008-10-28 13:24:06 -070067#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070068 int (*input)(struct sk_buff*);
69 int (*output)(struct sk_buff*);
70
Linus Torvalds1da177e2005-04-16 15:20:36 -070071 struct dst_ops *ops;
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070072
73 u32 metrics[RTAX_MAX];
74
75#ifdef CONFIG_NET_CLS_ROUTE
76 __u32 tclassid;
Eric Dumazet5635c102008-11-16 19:46:36 -080077#else
78 __u32 __pad2;
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070079#endif
80
Eric Dumazet5635c102008-11-16 19:46:36 -080081
82 /*
83 * Align __refcnt to a 64 bytes alignment
84 * (L1_CACHE_SIZE would be too much)
85 */
86#ifdef CONFIG_64BIT
87 long __pad_to_align_refcnt[2];
88#else
89 long __pad_to_align_refcnt[1];
90#endif
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070091 /*
92 * __refcnt wants to be on a different cache line from
93 * input/output/ops or performance tanks badly
94 */
Eric Dumazet1e19e022007-02-09 16:26:55 -080095 atomic_t __refcnt; /* client references */
96 int __use;
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070097 unsigned long lastuse;
Eric Dumazet1e19e022007-02-09 16:26:55 -080098 union {
99 struct dst_entry *next;
100 struct rtable *rt_next;
101 struct rt6_info *rt6_next;
102 struct dn_route *dn_next;
103 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700104};
105
Linus Torvalds1da177e2005-04-16 15:20:36 -0700106#ifdef __KERNEL__
107
108static inline u32
109dst_metric(const struct dst_entry *dst, int metric)
110{
111 return dst->metrics[metric-1];
112}
113
114static inline u32 dst_mtu(const struct dst_entry *dst)
115{
116 u32 mtu = dst_metric(dst, RTAX_MTU);
117 /*
118 * Alexey put it here, so ask him about it :)
119 */
120 barrier();
121 return mtu;
122}
123
Stephen Hemmingerc1e20f72008-07-18 23:02:15 -0700124/* RTT metrics are stored in milliseconds for user ABI, but used as jiffies */
125static inline unsigned long dst_metric_rtt(const struct dst_entry *dst, int metric)
126{
127 return msecs_to_jiffies(dst_metric(dst, metric));
128}
129
130static inline void set_dst_metric_rtt(struct dst_entry *dst, int metric,
131 unsigned long rtt)
132{
133 dst->metrics[metric-1] = jiffies_to_msecs(rtt);
134}
135
Linus Torvalds1da177e2005-04-16 15:20:36 -0700136static inline u32
137dst_allfrag(const struct dst_entry *dst)
138{
139 int ret = dst_metric(dst, RTAX_FEATURES) & RTAX_FEATURE_ALLFRAG;
140 /* Yes, _exactly_. This is paranoia. */
141 barrier();
142 return ret;
143}
144
145static inline int
146dst_metric_locked(struct dst_entry *dst, int metric)
147{
148 return dst_metric(dst, RTAX_LOCK) & (1<<metric);
149}
150
151static inline void dst_hold(struct dst_entry * dst)
152{
Eric Dumazet5635c102008-11-16 19:46:36 -0800153 /*
154 * If your kernel compilation stops here, please check
155 * __pad_to_align_refcnt declaration in struct dst_entry
156 */
157 BUILD_BUG_ON(offsetof(struct dst_entry, __refcnt) & 63);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700158 atomic_inc(&dst->__refcnt);
159}
160
Pavel Emelyanov03f49f32007-11-10 21:28:34 -0800161static inline void dst_use(struct dst_entry *dst, unsigned long time)
162{
163 dst_hold(dst);
164 dst->__use++;
165 dst->lastuse = time;
166}
167
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168static inline
169struct dst_entry * dst_clone(struct dst_entry * dst)
170{
171 if (dst)
172 atomic_inc(&dst->__refcnt);
173 return dst;
174}
175
Ilpo Järvinen8d330862008-03-27 17:53:31 -0700176extern void dst_release(struct dst_entry *dst);
Eric Dumazetadf30902009-06-02 05:19:30 +0000177static inline void skb_dst_drop(struct sk_buff *skb)
178{
179 if (skb->_skb_dst)
180 dst_release(skb_dst(skb));
181 skb->_skb_dst = 0UL;
182}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700183
/* Children define the path of the packet through the
 * Linux networking stack. Thus, destinations are stackable.
 */
187
188static inline struct dst_entry *dst_pop(struct dst_entry *dst)
189{
190 struct dst_entry *child = dst_clone(dst->child);
191
192 dst_release(dst);
193 return child;
194}
195
/* Declared here, defined outside this header. */
extern int dst_discard(struct sk_buff *skb);
extern void *dst_alloc(struct dst_ops *ops);
extern void __dst_free(struct dst_entry *dst);
/* dst_free() hands a non-NULL return value of dst_destroy() to __dst_free(). */
extern struct dst_entry *dst_destroy(struct dst_entry *dst);
200
201static inline void dst_free(struct dst_entry * dst)
202{
203 if (dst->obsolete > 1)
204 return;
205 if (!atomic_read(&dst->__refcnt)) {
206 dst = dst_destroy(dst);
207 if (!dst)
208 return;
209 }
210 __dst_free(dst);
211}
212
213static inline void dst_rcu_free(struct rcu_head *head)
214{
215 struct dst_entry *dst = container_of(head, struct dst_entry, rcu_head);
216 dst_free(dst);
217}
218
219static inline void dst_confirm(struct dst_entry *dst)
220{
221 if (dst)
222 neigh_confirm(dst->neighbour);
223}
224
Krishna Kumarea94ff32009-10-19 23:46:45 +0000225static inline void dst_negative_advice(struct dst_entry **dst_p,
226 struct sock *sk)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227{
228 struct dst_entry * dst = *dst_p;
Krishna Kumarea94ff32009-10-19 23:46:45 +0000229 if (dst && dst->ops->negative_advice) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700230 *dst_p = dst->ops->negative_advice(dst);
Krishna Kumarea94ff32009-10-19 23:46:45 +0000231
232 if (dst != *dst_p) {
233 extern void sk_reset_txq(struct sock *sk);
234
235 sk_reset_txq(sk);
236 }
237 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700238}
239
240static inline void dst_link_failure(struct sk_buff *skb)
241{
Eric Dumazetadf30902009-06-02 05:19:30 +0000242 struct dst_entry *dst = skb_dst(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700243 if (dst && dst->ops && dst->ops->link_failure)
244 dst->ops->link_failure(skb);
245}
246
247static inline void dst_set_expires(struct dst_entry *dst, int timeout)
248{
249 unsigned long expires = jiffies + timeout;
250
251 if (expires == 0)
252 expires = 1;
253
254 if (dst->expires == 0 || time_before(expires, dst->expires))
255 dst->expires = expires;
256}
257
258/* Output packet to network from transport. */
259static inline int dst_output(struct sk_buff *skb)
260{
Eric Dumazetadf30902009-06-02 05:19:30 +0000261 return skb_dst(skb)->output(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262}
263
264/* Input packet from network to transport. */
265static inline int dst_input(struct sk_buff *skb)
266{
Eric Dumazetadf30902009-06-02 05:19:30 +0000267 return skb_dst(skb)->input(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268}
269
270static inline struct dst_entry *dst_check(struct dst_entry *dst, u32 cookie)
271{
272 if (dst->obsolete)
273 dst = dst->ops->check(dst, cookie);
274 return dst;
275}
276
277extern void dst_init(void);
278
/* Bit flags accepted in the "flags" argument of xfrm_lookup(). */
enum {
	XFRM_LOOKUP_WAIT = 0x1,	/* bit 0 */
	XFRM_LOOKUP_ICMP = 0x2,	/* bit 1 */
};
284
struct flowi;

#ifdef CONFIG_XFRM
/* With XFRM configured, both lookups are defined outside this header. */
extern int xfrm_lookup(struct net *net, struct dst_entry **dst_p,
		       struct flowi *fl, struct sock *sk, int flags);
extern int __xfrm_lookup(struct net *net, struct dst_entry **dst_p,
			 struct flowi *fl, struct sock *sk, int flags);
#else
/*
 * Without XFRM, both lookups are stubs that leave *dst_p untouched and
 * return 0.
 */
static inline int xfrm_lookup(struct net *net, struct dst_entry **dst_p,
			      struct flowi *fl, struct sock *sk, int flags)
{
	return 0;
}

static inline int __xfrm_lookup(struct net *net, struct dst_entry **dst_p,
				struct flowi *fl, struct sock *sk, int flags)
{
	return 0;
}
#endif
303#endif
304
305#endif /* _NET_DST_H */