blob: 5a900ddcf10dbbf4a0021ebc3023c41f028575f6 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * net/dst.h Protocol independent destination cache definitions.
3 *
4 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
5 *
6 */
7
8#ifndef _NET_DST_H
9#define _NET_DST_H
10
Alexey Dobriyan86393e52009-08-29 01:34:49 +000011#include <net/dst_ops.h>
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020012#include <linux/netdevice.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070013#include <linux/rtnetlink.h>
14#include <linux/rcupdate.h>
15#include <linux/jiffies.h>
16#include <net/neighbour.h>
17#include <asm/processor.h>
18
/*
 * Route cache debug verbosity:
 *   0 - silent, no debugging messages (the level selected below)
 *   1 - rare events and bugs
 *   2 - trace mode
 */
#define RT_CACHE_DEBUG		0
25
/*
 * Intervals expressed as multiples/fractions of HZ (ticks per second):
 * a tenth of a second, half a second, and two minutes respectively.
 * NOTE(review): presumably the minimum, increment and maximum of the dst
 * garbage-collection timer - confirm against the users of these macros.
 */
#define DST_GC_MIN	(HZ / 10)
#define DST_GC_INC	(HZ / 2)
#define DST_GC_MAX	(120 * HZ)
29
/* Each dst_entry has a reference count and sits in one or more parent lists.
 * When it is removed from its parent list, it is "freed" (dst_free).
 * After this it enters the dead state (dst->obsolete > 0); if its refcnt
 * is zero it can be destroyed immediately, otherwise it is added
 * to the gc list and the garbage collector periodically checks the refcnt.
 */
36
37struct sk_buff;
38
39struct dst_entry
40{
Eric Dumazet1e19e022007-02-09 16:26:55 -080041 struct rcu_head rcu_head;
Linus Torvalds1da177e2005-04-16 15:20:36 -070042 struct dst_entry *child;
43 struct net_device *dev;
Herbert Xuc4d54112005-04-19 20:46:37 -070044 short error;
45 short obsolete;
Linus Torvalds1da177e2005-04-16 15:20:36 -070046 int flags;
47#define DST_HOST 1
48#define DST_NOXFRM 2
49#define DST_NOPOLICY 4
50#define DST_NOHASH 8
Linus Torvalds1da177e2005-04-16 15:20:36 -070051 unsigned long expires;
52
53 unsigned short header_len; /* more space at head required */
54 unsigned short trailer_len; /* space to reserve at tail */
55
Eric Dumazet69a73822008-01-22 06:18:34 -080056 unsigned int rate_tokens;
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070057 unsigned long rate_last; /* rate limiting for ICMP */
Eric Dumazet69a73822008-01-22 06:18:34 -080058
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070059 struct dst_entry *path;
Linus Torvalds1da177e2005-04-16 15:20:36 -070060
Linus Torvalds1da177e2005-04-16 15:20:36 -070061 struct neighbour *neighbour;
62 struct hh_cache *hh;
Alexey Dobriyandef8b4f2008-10-28 13:24:06 -070063#ifdef CONFIG_XFRM
Linus Torvalds1da177e2005-04-16 15:20:36 -070064 struct xfrm_state *xfrm;
Eric Dumazet5635c102008-11-16 19:46:36 -080065#else
66 void *__pad1;
Alexey Dobriyandef8b4f2008-10-28 13:24:06 -070067#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070068 int (*input)(struct sk_buff*);
69 int (*output)(struct sk_buff*);
70
Linus Torvalds1da177e2005-04-16 15:20:36 -070071 struct dst_ops *ops;
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070072
73 u32 metrics[RTAX_MAX];
74
75#ifdef CONFIG_NET_CLS_ROUTE
76 __u32 tclassid;
Eric Dumazet5635c102008-11-16 19:46:36 -080077#else
78 __u32 __pad2;
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070079#endif
80
Eric Dumazet5635c102008-11-16 19:46:36 -080081
82 /*
83 * Align __refcnt to a 64 bytes alignment
84 * (L1_CACHE_SIZE would be too much)
85 */
86#ifdef CONFIG_64BIT
87 long __pad_to_align_refcnt[2];
88#else
89 long __pad_to_align_refcnt[1];
90#endif
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070091 /*
92 * __refcnt wants to be on a different cache line from
93 * input/output/ops or performance tanks badly
94 */
Eric Dumazet1e19e022007-02-09 16:26:55 -080095 atomic_t __refcnt; /* client references */
96 int __use;
Zhang Yanminf1dd9c32008-03-12 22:52:37 -070097 unsigned long lastuse;
Eric Dumazet1e19e022007-02-09 16:26:55 -080098 union {
99 struct dst_entry *next;
100 struct rtable *rt_next;
101 struct rt6_info *rt6_next;
102 struct dn_route *dn_next;
103 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700104};
105
Linus Torvalds1da177e2005-04-16 15:20:36 -0700106#ifdef __KERNEL__
107
108static inline u32
109dst_metric(const struct dst_entry *dst, int metric)
110{
111 return dst->metrics[metric-1];
112}
113
114static inline u32 dst_mtu(const struct dst_entry *dst)
115{
116 u32 mtu = dst_metric(dst, RTAX_MTU);
117 /*
118 * Alexey put it here, so ask him about it :)
119 */
120 barrier();
121 return mtu;
122}
123
Stephen Hemmingerc1e20f72008-07-18 23:02:15 -0700124/* RTT metrics are stored in milliseconds for user ABI, but used as jiffies */
125static inline unsigned long dst_metric_rtt(const struct dst_entry *dst, int metric)
126{
127 return msecs_to_jiffies(dst_metric(dst, metric));
128}
129
130static inline void set_dst_metric_rtt(struct dst_entry *dst, int metric,
131 unsigned long rtt)
132{
133 dst->metrics[metric-1] = jiffies_to_msecs(rtt);
134}
135
Linus Torvalds1da177e2005-04-16 15:20:36 -0700136static inline u32
137dst_allfrag(const struct dst_entry *dst)
138{
139 int ret = dst_metric(dst, RTAX_FEATURES) & RTAX_FEATURE_ALLFRAG;
140 /* Yes, _exactly_. This is paranoia. */
141 barrier();
142 return ret;
143}
144
145static inline int
146dst_metric_locked(struct dst_entry *dst, int metric)
147{
148 return dst_metric(dst, RTAX_LOCK) & (1<<metric);
149}
150
151static inline void dst_hold(struct dst_entry * dst)
152{
Eric Dumazet5635c102008-11-16 19:46:36 -0800153 /*
154 * If your kernel compilation stops here, please check
155 * __pad_to_align_refcnt declaration in struct dst_entry
156 */
157 BUILD_BUG_ON(offsetof(struct dst_entry, __refcnt) & 63);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700158 atomic_inc(&dst->__refcnt);
159}
160
Pavel Emelyanov03f49f32007-11-10 21:28:34 -0800161static inline void dst_use(struct dst_entry *dst, unsigned long time)
162{
163 dst_hold(dst);
164 dst->__use++;
165 dst->lastuse = time;
166}
167
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168static inline
169struct dst_entry * dst_clone(struct dst_entry * dst)
170{
171 if (dst)
172 atomic_inc(&dst->__refcnt);
173 return dst;
174}
175
/*
 * Implemented outside this header.
 * NOTE(review): presumably drops one reference on @dst - confirm against
 * the definition.
 */
extern void dst_release(struct dst_entry *dst);
Eric Dumazetadf30902009-06-02 05:19:30 +0000177static inline void skb_dst_drop(struct sk_buff *skb)
178{
179 if (skb->_skb_dst)
180 dst_release(skb_dst(skb));
181 skb->_skb_dst = 0UL;
182}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700183
184/* Children define the path of the packet through the
185 * Linux networking. Thus, destinations are stackable.
186 */
187
188static inline struct dst_entry *dst_pop(struct dst_entry *dst)
189{
190 struct dst_entry *child = dst_clone(dst->child);
191
192 dst_release(dst);
193 return child;
194}
195
/*
 * Implemented outside this header; only the signatures are visible here.
 * dst_free() below relies on dst_destroy() possibly returning NULL and on
 * __dst_free() accepting the (possibly different) entry it returns.
 */
extern int dst_discard(struct sk_buff *skb);
extern void *dst_alloc(struct dst_ops *ops);
extern void __dst_free(struct dst_entry *dst);
extern struct dst_entry *dst_destroy(struct dst_entry *dst);
200
201static inline void dst_free(struct dst_entry * dst)
202{
203 if (dst->obsolete > 1)
204 return;
205 if (!atomic_read(&dst->__refcnt)) {
206 dst = dst_destroy(dst);
207 if (!dst)
208 return;
209 }
210 __dst_free(dst);
211}
212
213static inline void dst_rcu_free(struct rcu_head *head)
214{
215 struct dst_entry *dst = container_of(head, struct dst_entry, rcu_head);
216 dst_free(dst);
217}
218
219static inline void dst_confirm(struct dst_entry *dst)
220{
221 if (dst)
222 neigh_confirm(dst->neighbour);
223}
224
225static inline void dst_negative_advice(struct dst_entry **dst_p)
226{
227 struct dst_entry * dst = *dst_p;
228 if (dst && dst->ops->negative_advice)
229 *dst_p = dst->ops->negative_advice(dst);
230}
231
232static inline void dst_link_failure(struct sk_buff *skb)
233{
Eric Dumazetadf30902009-06-02 05:19:30 +0000234 struct dst_entry *dst = skb_dst(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700235 if (dst && dst->ops && dst->ops->link_failure)
236 dst->ops->link_failure(skb);
237}
238
239static inline void dst_set_expires(struct dst_entry *dst, int timeout)
240{
241 unsigned long expires = jiffies + timeout;
242
243 if (expires == 0)
244 expires = 1;
245
246 if (dst->expires == 0 || time_before(expires, dst->expires))
247 dst->expires = expires;
248}
249
250/* Output packet to network from transport. */
251static inline int dst_output(struct sk_buff *skb)
252{
Eric Dumazetadf30902009-06-02 05:19:30 +0000253 return skb_dst(skb)->output(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254}
255
256/* Input packet from network to transport. */
257static inline int dst_input(struct sk_buff *skb)
258{
Eric Dumazetadf30902009-06-02 05:19:30 +0000259 return skb_dst(skb)->input(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700260}
261
262static inline struct dst_entry *dst_check(struct dst_entry *dst, u32 cookie)
263{
264 if (dst->obsolete)
265 dst = dst->ops->check(dst, cookie);
266 return dst;
267}
268
/* Implemented outside this header; takes no arguments, returns nothing. */
extern void dst_init(void);
270
/* Bit flags for the 'flags' argument of xfrm_lookup(). */
enum {
	XFRM_LOOKUP_WAIT	= 0x1,
	XFRM_LOOKUP_ICMP	= 0x2,
};
276
struct flowi;

/*
 * xfrm_lookup() / __xfrm_lookup()
 *
 * With CONFIG_XFRM the implementations live outside this header and are
 * only declared here. Without it, both become inline stubs that ignore
 * every argument, leave *dst_p untouched and return 0.
 */
#ifdef CONFIG_XFRM
extern int xfrm_lookup(struct net *net, struct dst_entry **dst_p,
		       struct flowi *fl, struct sock *sk, int flags);
extern int __xfrm_lookup(struct net *net, struct dst_entry **dst_p,
			 struct flowi *fl, struct sock *sk, int flags);
#else
static inline int xfrm_lookup(struct net *net, struct dst_entry **dst_p,
			      struct flowi *fl, struct sock *sk, int flags)
{
	return 0;
}

static inline int __xfrm_lookup(struct net *net, struct dst_entry **dst_p,
				struct flowi *fl, struct sock *sk, int flags)
{
	return 0;
}
#endif
295#endif
296
297#endif /* _NET_DST_H */