/*
 * net/dst.h	Protocol independent destination cache definitions.
 *
 * Authors:	Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 *
 */
7
8#ifndef _NET_DST_H
9#define _NET_DST_H
10
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020011#include <linux/netdevice.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#include <linux/rtnetlink.h>
13#include <linux/rcupdate.h>
14#include <linux/jiffies.h>
15#include <net/neighbour.h>
16#include <asm/processor.h>
17
/*
 * RT_CACHE_DEBUG levels:
 *   0 - no debugging messages
 *   1 - rare events and bugs (default)
 *   2 - trace mode.
 *
 * Note: the value selected below is 0.
 */
#define RT_CACHE_DEBUG		0

/* DST_GC_* timing constants, expressed as fractions/multiples of HZ. */
#define DST_GC_MIN	(HZ / 10)
#define DST_GC_INC	(HZ / 2)
#define DST_GC_MAX	(120 * HZ)
28
/* Each dst_entry has a reference count and sits in some parent list(s).
 * When it is removed from its parent list, it is "freed" (dst_free).
 * After this it enters the dead state (dst->obsolete > 0) and, if its
 * refcnt is zero, it can be destroyed immediately; otherwise it is added
 * to the gc list and the garbage collector periodically checks the refcnt.
 */
35
36struct sk_buff;
37
38struct dst_entry
39{
Eric Dumazet1e19e022007-02-09 16:26:55 -080040 struct rcu_head rcu_head;
Linus Torvalds1da177e2005-04-16 15:20:36 -070041 struct dst_entry *child;
42 struct net_device *dev;
Herbert Xuc4d54112005-04-19 20:46:37 -070043 short error;
44 short obsolete;
Linus Torvalds1da177e2005-04-16 15:20:36 -070045 int flags;
46#define DST_HOST 1
47#define DST_NOXFRM 2
48#define DST_NOPOLICY 4
49#define DST_NOHASH 8
Linus Torvalds1da177e2005-04-16 15:20:36 -070050 unsigned long expires;
51
52 unsigned short header_len; /* more space at head required */
53 unsigned short trailer_len; /* space to reserve at tail */
54
Eric Dumazet69a73822008-01-22 06:18:34 -080055 unsigned int rate_tokens;
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070056 unsigned long rate_last; /* rate limiting for ICMP */
Eric Dumazet69a73822008-01-22 06:18:34 -080057
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070058 struct dst_entry *path;
Linus Torvalds1da177e2005-04-16 15:20:36 -070059
Linus Torvalds1da177e2005-04-16 15:20:36 -070060 struct neighbour *neighbour;
61 struct hh_cache *hh;
Alexey Dobriyandef8b4f2008-10-28 13:24:06 -070062#ifdef CONFIG_XFRM
Linus Torvalds1da177e2005-04-16 15:20:36 -070063 struct xfrm_state *xfrm;
Eric Dumazet5635c102008-11-16 19:46:36 -080064#else
65 void *__pad1;
Alexey Dobriyandef8b4f2008-10-28 13:24:06 -070066#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070067 int (*input)(struct sk_buff*);
68 int (*output)(struct sk_buff*);
69
Linus Torvalds1da177e2005-04-16 15:20:36 -070070 struct dst_ops *ops;
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070071
72 u32 metrics[RTAX_MAX];
73
74#ifdef CONFIG_NET_CLS_ROUTE
75 __u32 tclassid;
Eric Dumazet5635c102008-11-16 19:46:36 -080076#else
77 __u32 __pad2;
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070078#endif
79
Eric Dumazet5635c102008-11-16 19:46:36 -080080
81 /*
82 * Align __refcnt to a 64 bytes alignment
83 * (L1_CACHE_SIZE would be too much)
84 */
85#ifdef CONFIG_64BIT
86 long __pad_to_align_refcnt[2];
87#else
88 long __pad_to_align_refcnt[1];
89#endif
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070090 /*
91 * __refcnt wants to be on a different cache line from
92 * input/output/ops or performance tanks badly
93 */
Eric Dumazet1e19e022007-02-09 16:26:55 -080094 atomic_t __refcnt; /* client references */
95 int __use;
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070096 unsigned long lastuse;
Eric Dumazet1e19e022007-02-09 16:26:55 -080097 union {
98 struct dst_entry *next;
99 struct rtable *rt_next;
100 struct rt6_info *rt6_next;
101 struct dn_route *dn_next;
102 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700103};
104
105
106struct dst_ops
107{
108 unsigned short family;
Al Virod77072e2006-09-28 14:20:34 -0700109 __be16 protocol;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700110 unsigned gc_thresh;
111
Daniel Lezcano569d3642008-01-18 03:56:57 -0800112 int (*gc)(struct dst_ops *ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700113 struct dst_entry * (*check)(struct dst_entry *, __u32 cookie);
114 void (*destroy)(struct dst_entry *);
115 void (*ifdown)(struct dst_entry *,
116 struct net_device *dev, int how);
117 struct dst_entry * (*negative_advice)(struct dst_entry *);
118 void (*link_failure)(struct sk_buff *);
119 void (*update_pmtu)(struct dst_entry *dst, u32 mtu);
Herbert Xu862b82c2007-11-13 21:43:11 -0800120 int (*local_out)(struct sk_buff *skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700121
122 atomic_t entries;
Christoph Lametere18b8902006-12-06 20:33:20 -0800123 struct kmem_cache *kmem_cachep;
Daniel Lezcanod4fa26f2008-01-18 03:58:07 -0800124 struct net *dst_net;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700125};
126
127#ifdef __KERNEL__
128
129static inline u32
130dst_metric(const struct dst_entry *dst, int metric)
131{
132 return dst->metrics[metric-1];
133}
134
135static inline u32 dst_mtu(const struct dst_entry *dst)
136{
137 u32 mtu = dst_metric(dst, RTAX_MTU);
138 /*
139 * Alexey put it here, so ask him about it :)
140 */
141 barrier();
142 return mtu;
143}
144
Stephen Hemmingerc1e20f72008-07-18 23:02:15 -0700145/* RTT metrics are stored in milliseconds for user ABI, but used as jiffies */
146static inline unsigned long dst_metric_rtt(const struct dst_entry *dst, int metric)
147{
148 return msecs_to_jiffies(dst_metric(dst, metric));
149}
150
151static inline void set_dst_metric_rtt(struct dst_entry *dst, int metric,
152 unsigned long rtt)
153{
154 dst->metrics[metric-1] = jiffies_to_msecs(rtt);
155}
156
Linus Torvalds1da177e2005-04-16 15:20:36 -0700157static inline u32
158dst_allfrag(const struct dst_entry *dst)
159{
160 int ret = dst_metric(dst, RTAX_FEATURES) & RTAX_FEATURE_ALLFRAG;
161 /* Yes, _exactly_. This is paranoia. */
162 barrier();
163 return ret;
164}
165
166static inline int
167dst_metric_locked(struct dst_entry *dst, int metric)
168{
169 return dst_metric(dst, RTAX_LOCK) & (1<<metric);
170}
171
172static inline void dst_hold(struct dst_entry * dst)
173{
Eric Dumazet5635c102008-11-16 19:46:36 -0800174 /*
175 * If your kernel compilation stops here, please check
176 * __pad_to_align_refcnt declaration in struct dst_entry
177 */
178 BUILD_BUG_ON(offsetof(struct dst_entry, __refcnt) & 63);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179 atomic_inc(&dst->__refcnt);
180}
181
Pavel Emelyanov03f49f32007-11-10 21:28:34 -0800182static inline void dst_use(struct dst_entry *dst, unsigned long time)
183{
184 dst_hold(dst);
185 dst->__use++;
186 dst->lastuse = time;
187}
188
Linus Torvalds1da177e2005-04-16 15:20:36 -0700189static inline
190struct dst_entry * dst_clone(struct dst_entry * dst)
191{
192 if (dst)
193 atomic_inc(&dst->__refcnt);
194 return dst;
195}
196
Ilpo Järvinen8d330862008-03-27 17:53:31 -0700197extern void dst_release(struct dst_entry *dst);
Eric Dumazetadf30902009-06-02 05:19:30 +0000198static inline void skb_dst_drop(struct sk_buff *skb)
199{
200 if (skb->_skb_dst)
201 dst_release(skb_dst(skb));
202 skb->_skb_dst = 0UL;
203}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700204
205/* Children define the path of the packet through the
206 * Linux networking. Thus, destinations are stackable.
207 */
208
209static inline struct dst_entry *dst_pop(struct dst_entry *dst)
210{
211 struct dst_entry *child = dst_clone(dst->child);
212
213 dst_release(dst);
214 return child;
215}
216
/*
 * Core dst routines implemented outside this header.  As used by
 * dst_free(): dst_destroy() returns a dst pointer that, when non-NULL,
 * is subsequently passed to __dst_free().
 */
extern int dst_discard(struct sk_buff *skb);
extern void *dst_alloc(struct dst_ops *ops);
extern void __dst_free(struct dst_entry *dst);
extern struct dst_entry *dst_destroy(struct dst_entry *dst);
221
222static inline void dst_free(struct dst_entry * dst)
223{
224 if (dst->obsolete > 1)
225 return;
226 if (!atomic_read(&dst->__refcnt)) {
227 dst = dst_destroy(dst);
228 if (!dst)
229 return;
230 }
231 __dst_free(dst);
232}
233
234static inline void dst_rcu_free(struct rcu_head *head)
235{
236 struct dst_entry *dst = container_of(head, struct dst_entry, rcu_head);
237 dst_free(dst);
238}
239
240static inline void dst_confirm(struct dst_entry *dst)
241{
242 if (dst)
243 neigh_confirm(dst->neighbour);
244}
245
246static inline void dst_negative_advice(struct dst_entry **dst_p)
247{
248 struct dst_entry * dst = *dst_p;
249 if (dst && dst->ops->negative_advice)
250 *dst_p = dst->ops->negative_advice(dst);
251}
252
253static inline void dst_link_failure(struct sk_buff *skb)
254{
Eric Dumazetadf30902009-06-02 05:19:30 +0000255 struct dst_entry *dst = skb_dst(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700256 if (dst && dst->ops && dst->ops->link_failure)
257 dst->ops->link_failure(skb);
258}
259
260static inline void dst_set_expires(struct dst_entry *dst, int timeout)
261{
262 unsigned long expires = jiffies + timeout;
263
264 if (expires == 0)
265 expires = 1;
266
267 if (dst->expires == 0 || time_before(expires, dst->expires))
268 dst->expires = expires;
269}
270
271/* Output packet to network from transport. */
272static inline int dst_output(struct sk_buff *skb)
273{
Eric Dumazetadf30902009-06-02 05:19:30 +0000274 return skb_dst(skb)->output(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700275}
276
277/* Input packet from network to transport. */
278static inline int dst_input(struct sk_buff *skb)
279{
Eric Dumazetadf30902009-06-02 05:19:30 +0000280 return skb_dst(skb)->input(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700281}
282
283static inline struct dst_entry *dst_check(struct dst_entry *dst, u32 cookie)
284{
285 if (dst->obsolete)
286 dst = dst->ops->check(dst, cookie);
287 return dst;
288}
289
/* dst subsystem initialisation entry point; defined outside this header. */
extern void dst_init(void);
291
/* Bit flags accepted by the flags argument of xfrm_lookup(). */
enum {
	XFRM_LOOKUP_WAIT = 0x1,	/* bit 0 */
	XFRM_LOOKUP_ICMP = 0x2,	/* bit 1 */
};
297
struct flowi;
#ifdef CONFIG_XFRM
/* Real implementations live outside this header. */
extern int xfrm_lookup(struct net *net, struct dst_entry **dst_p,
		       struct flowi *fl, struct sock *sk, int flags);
extern int __xfrm_lookup(struct net *net, struct dst_entry **dst_p,
			 struct flowi *fl, struct sock *sk, int flags);
#else
/*
 * Without CONFIG_XFRM both lookups are no-op stubs: they leave *dst_p
 * untouched and return 0.
 */
static inline int xfrm_lookup(struct net *net, struct dst_entry **dst_p,
			      struct flowi *fl, struct sock *sk, int flags)
{
	return 0;
}

static inline int __xfrm_lookup(struct net *net, struct dst_entry **dst_p,
				struct flowi *fl, struct sock *sk, int flags)
{
	return 0;
}
#endif
316#endif
317
318#endif /* _NET_DST_H */