blob: de1b26aa5720f011616413d87d852f94d46f9c52 [file] [log] [blame]
/*
 * Common framework for low-level network console, dump, and debugger code
 *
 * Sep 8 2003  Matt Mackall <mpm@selenic.com>
 *
 * based on the netconsole code from:
 *
 * Copyright (C) 2001  Ingo Molnar <mingo@redhat.com>
 * Copyright (C) 2002  Red Hat, Inc.
 */
11
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#include <linux/netdevice.h>
13#include <linux/etherdevice.h>
14#include <linux/string.h>
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020015#include <linux/if_arp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <linux/inetdevice.h>
17#include <linux/inet.h>
18#include <linux/interrupt.h>
19#include <linux/netpoll.h>
20#include <linux/sched.h>
21#include <linux/delay.h>
22#include <linux/rcupdate.h>
23#include <linux/workqueue.h>
24#include <net/tcp.h>
25#include <net/udp.h>
26#include <asm/unaligned.h>
27
/*
 * We maintain a small pool of fully-sized skbs, to make sure the
 * message gets out even in extreme OOM situations.
 */
32
33#define MAX_UDP_CHUNK 1460
34#define MAX_SKBS 32
35#define MAX_QUEUE_DEPTH (MAX_SKBS / 2)
36
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -080037static struct sk_buff_head skb_pool;
Linus Torvalds1da177e2005-04-16 15:20:36 -070038
39static atomic_t trapped;
40
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -070041#define USEC_PER_POLL 50
Linus Torvalds1da177e2005-04-16 15:20:36 -070042#define NETPOLL_RX_ENABLED 1
43#define NETPOLL_RX_DROP 2
44
45#define MAX_SKB_SIZE \
46 (MAX_UDP_CHUNK + sizeof(struct udphdr) + \
47 sizeof(struct iphdr) + sizeof(struct ethhdr))
48
49static void zap_completion_queue(void);
Neil Horman068c6e92006-06-26 00:04:27 -070050static void arp_reply(struct sk_buff *skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -070051
David Howellsc4028952006-11-22 14:57:56 +000052static void queue_process(struct work_struct *work)
Linus Torvalds1da177e2005-04-16 15:20:36 -070053{
David Howells4c1ac1b2006-12-05 14:37:56 +000054 struct netpoll_info *npinfo =
55 container_of(work, struct netpoll_info, tx_work.work);
Linus Torvalds1da177e2005-04-16 15:20:36 -070056 struct sk_buff *skb;
Ingo Molnar36405432006-12-12 17:20:42 +010057 unsigned long flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -070058
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070059 while ((skb = skb_dequeue(&npinfo->txq))) {
60 struct net_device *dev = skb->dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -070061
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070062 if (!netif_device_present(dev) || !netif_running(dev)) {
63 __kfree_skb(skb);
64 continue;
65 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070066
Ingo Molnar36405432006-12-12 17:20:42 +010067 local_irq_save(flags);
68 netif_tx_lock(dev);
Peter P Waskiewicz Jrf25f4e42007-07-06 13:36:20 -070069 if ((netif_queue_stopped(dev) ||
70 netif_subqueue_stopped(dev, skb->queue_mapping)) ||
71 dev->hard_start_xmit(skb, dev) != NETDEV_TX_OK) {
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070072 skb_queue_head(&npinfo->txq, skb);
Ingo Molnar36405432006-12-12 17:20:42 +010073 netif_tx_unlock(dev);
74 local_irq_restore(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -070075
Jarek Poplawski25442ca2007-07-05 17:42:44 -070076 schedule_delayed_work(&npinfo->tx_work, HZ/10);
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070077 return;
78 }
Ingo Molnar36405432006-12-12 17:20:42 +010079 netif_tx_unlock(dev);
80 local_irq_restore(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -070081 }
82}
83
Al Virob51655b2006-11-14 21:40:42 -080084static __sum16 checksum_udp(struct sk_buff *skb, struct udphdr *uh,
85 unsigned short ulen, __be32 saddr, __be32 daddr)
Linus Torvalds1da177e2005-04-16 15:20:36 -070086{
Al Virod6f5493c2006-11-14 21:26:08 -080087 __wsum psum;
Herbert Xufb286bb2005-11-10 13:01:24 -080088
Herbert Xu60476372007-04-09 11:59:39 -070089 if (uh->check == 0 || skb_csum_unnecessary(skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -070090 return 0;
91
Herbert Xufb286bb2005-11-10 13:01:24 -080092 psum = csum_tcpudp_nofold(saddr, daddr, ulen, IPPROTO_UDP, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -070093
Patrick McHardy84fa7932006-08-29 16:44:56 -070094 if (skb->ip_summed == CHECKSUM_COMPLETE &&
Al Virod3bc23e2006-11-14 21:24:49 -080095 !csum_fold(csum_add(psum, skb->csum)))
Herbert Xufb286bb2005-11-10 13:01:24 -080096 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070097
Herbert Xufb286bb2005-11-10 13:01:24 -080098 skb->csum = psum;
99
100 return __skb_checksum_complete(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700101}
102
/*
 * Check whether delayed processing was scheduled for our NIC. If so,
 * we attempt to grab the poll lock and use ->poll() to pump the card.
 * If this fails, either we've recursed in ->poll() or it's already
 * running on another CPU.
 *
 * Note: we don't mask interrupts with this lock because we're using
 * trylock here and interrupts are already disabled in the softirq
 * case. Further, we test the poll_owner to avoid recursion on UP
 * systems where the lock doesn't exist.
 *
 * In cases where there is bi-directional communication, reading only
 * one message at a time can lead to packets being dropped by the
 * network adapter, forcing superfluous retries and possibly timeouts.
 * Thus, we set our budget to greater than 1.
 */
119static void poll_napi(struct netpoll *np)
120{
Jeff Moyer115c1d62005-06-22 22:05:31 -0700121 struct netpoll_info *npinfo = np->dev->npinfo;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700122 int budget = 16;
123
124 if (test_bit(__LINK_STATE_RX_SCHED, &np->dev->state) &&
Jeff Moyer115c1d62005-06-22 22:05:31 -0700125 npinfo->poll_owner != smp_processor_id() &&
126 spin_trylock(&npinfo->poll_lock)) {
127 npinfo->rx_flags |= NETPOLL_RX_DROP;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700128 atomic_inc(&trapped);
129
130 np->dev->poll(np->dev, &budget);
131
132 atomic_dec(&trapped);
Jeff Moyer115c1d62005-06-22 22:05:31 -0700133 npinfo->rx_flags &= ~NETPOLL_RX_DROP;
134 spin_unlock(&npinfo->poll_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700135 }
136}
137
Neil Horman068c6e92006-06-26 00:04:27 -0700138static void service_arp_queue(struct netpoll_info *npi)
139{
140 struct sk_buff *skb;
141
142 if (unlikely(!npi))
143 return;
144
145 skb = skb_dequeue(&npi->arp_tx);
146
147 while (skb != NULL) {
148 arp_reply(skb);
149 skb = skb_dequeue(&npi->arp_tx);
150 }
Neil Horman068c6e92006-06-26 00:04:27 -0700151}
152
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153void netpoll_poll(struct netpoll *np)
154{
David S. Millerc68b9072006-11-14 20:40:49 -0800155 if (!np->dev || !netif_running(np->dev) || !np->dev->poll_controller)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700156 return;
157
158 /* Process pending work on NIC */
159 np->dev->poll_controller(np->dev);
160 if (np->dev->poll)
161 poll_napi(np);
162
Neil Horman068c6e92006-06-26 00:04:27 -0700163 service_arp_queue(np->dev->npinfo);
164
Linus Torvalds1da177e2005-04-16 15:20:36 -0700165 zap_completion_queue();
166}
167
168static void refill_skbs(void)
169{
170 struct sk_buff *skb;
171 unsigned long flags;
172
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800173 spin_lock_irqsave(&skb_pool.lock, flags);
174 while (skb_pool.qlen < MAX_SKBS) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700175 skb = alloc_skb(MAX_SKB_SIZE, GFP_ATOMIC);
176 if (!skb)
177 break;
178
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800179 __skb_queue_tail(&skb_pool, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180 }
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800181 spin_unlock_irqrestore(&skb_pool.lock, flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700182}
183
184static void zap_completion_queue(void)
185{
186 unsigned long flags;
187 struct softnet_data *sd = &get_cpu_var(softnet_data);
188
189 if (sd->completion_queue) {
190 struct sk_buff *clist;
191
192 local_irq_save(flags);
193 clist = sd->completion_queue;
194 sd->completion_queue = NULL;
195 local_irq_restore(flags);
196
197 while (clist != NULL) {
198 struct sk_buff *skb = clist;
199 clist = clist->next;
David S. Millerc68b9072006-11-14 20:40:49 -0800200 if (skb->destructor)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700201 dev_kfree_skb_any(skb); /* put this one back */
202 else
203 __kfree_skb(skb);
204 }
205 }
206
207 put_cpu_var(softnet_data);
208}
209
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800210static struct sk_buff *find_skb(struct netpoll *np, int len, int reserve)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700211{
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800212 int count = 0;
213 struct sk_buff *skb;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700214
215 zap_completion_queue();
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800216 refill_skbs();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217repeat:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700218
219 skb = alloc_skb(len, GFP_ATOMIC);
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800220 if (!skb)
221 skb = skb_dequeue(&skb_pool);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700222
223 if (!skb) {
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800224 if (++count < 10) {
225 netpoll_poll(np);
226 goto repeat;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227 }
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800228 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229 }
230
231 atomic_set(&skb->users, 1);
232 skb_reserve(skb, reserve);
233 return skb;
234}
235
236static void netpoll_send_skb(struct netpoll *np, struct sk_buff *skb)
237{
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700238 int status = NETDEV_TX_BUSY;
239 unsigned long tries;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900240 struct net_device *dev = np->dev;
241 struct netpoll_info *npinfo = np->dev->npinfo;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700242
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900243 if (!npinfo || !netif_running(dev) || !netif_device_present(dev)) {
244 __kfree_skb(skb);
245 return;
246 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700248 /* don't get messages out of order, and no recursion */
David S. Millerc68b9072006-11-14 20:40:49 -0800249 if (skb_queue_len(&npinfo->txq) == 0 &&
Andrew Mortone37b8d92006-12-09 14:01:49 -0800250 npinfo->poll_owner != smp_processor_id()) {
Andrew Mortona49f99f2006-12-11 17:24:46 -0800251 unsigned long flags;
252
253 local_irq_save(flags);
Stephen Hemminger0db3dc72007-06-27 00:39:42 -0700254 /* try until next clock tick */
255 for (tries = jiffies_to_usecs(1)/USEC_PER_POLL;
256 tries > 0; --tries) {
257 if (netif_tx_trylock(dev)) {
Peter P Waskiewicz Jrf25f4e42007-07-06 13:36:20 -0700258 if (!netif_queue_stopped(dev) &&
259 !netif_subqueue_stopped(dev, skb->queue_mapping))
Andrew Mortone37b8d92006-12-09 14:01:49 -0800260 status = dev->hard_start_xmit(skb, dev);
Stephen Hemminger0db3dc72007-06-27 00:39:42 -0700261 netif_tx_unlock(dev);
Matt Mackallf0d34592005-08-11 19:25:11 -0700262
Andrew Mortone37b8d92006-12-09 14:01:49 -0800263 if (status == NETDEV_TX_OK)
264 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700265
Andrew Mortone37b8d92006-12-09 14:01:49 -0800266 }
Stephen Hemminger0db3dc72007-06-27 00:39:42 -0700267
268 /* tickle device maybe there is some cleanup */
269 netpoll_poll(np);
270
271 udelay(USEC_PER_POLL);
Matt Mackall0db1d6f2005-08-11 19:25:54 -0700272 }
Andrew Mortona49f99f2006-12-11 17:24:46 -0800273 local_irq_restore(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700274 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700275
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700276 if (status != NETDEV_TX_OK) {
Stephen Hemminger5de4a472006-10-26 15:46:55 -0700277 skb_queue_tail(&npinfo->txq, skb);
David Howells4c1ac1b2006-12-05 14:37:56 +0000278 schedule_delayed_work(&npinfo->tx_work,0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700279 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700280}
281
282void netpoll_send_udp(struct netpoll *np, const char *msg, int len)
283{
284 int total_len, eth_len, ip_len, udp_len;
285 struct sk_buff *skb;
286 struct udphdr *udph;
287 struct iphdr *iph;
288 struct ethhdr *eth;
289
290 udp_len = len + sizeof(*udph);
291 ip_len = eth_len = udp_len + sizeof(*iph);
292 total_len = eth_len + ETH_HLEN + NET_IP_ALIGN;
293
294 skb = find_skb(np, total_len, total_len - len);
295 if (!skb)
296 return;
297
Arnaldo Carvalho de Melo27d7ff42007-03-31 11:55:19 -0300298 skb_copy_to_linear_data(skb, msg, len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700299 skb->len += len;
300
Arnaldo Carvalho de Melo4bedb452007-03-13 14:28:48 -0300301 skb_push(skb, sizeof(*udph));
302 skb_reset_transport_header(skb);
303 udph = udp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700304 udph->source = htons(np->local_port);
305 udph->dest = htons(np->remote_port);
306 udph->len = htons(udp_len);
307 udph->check = 0;
Chris Lalancette8e365ee2006-11-07 14:56:19 -0800308 udph->check = csum_tcpudp_magic(htonl(np->local_ip),
309 htonl(np->remote_ip),
310 udp_len, IPPROTO_UDP,
311 csum_partial((unsigned char *)udph, udp_len, 0));
312 if (udph->check == 0)
Al Viro5e57dff2006-11-20 18:08:13 -0800313 udph->check = CSUM_MANGLED_0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700314
Arnaldo Carvalho de Meloe2d1bca2007-04-10 20:46:21 -0700315 skb_push(skb, sizeof(*iph));
316 skb_reset_network_header(skb);
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700317 iph = ip_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700318
319 /* iph->version = 4; iph->ihl = 5; */
320 put_unaligned(0x45, (unsigned char *)iph);
321 iph->tos = 0;
322 put_unaligned(htons(ip_len), &(iph->tot_len));
323 iph->id = 0;
324 iph->frag_off = 0;
325 iph->ttl = 64;
326 iph->protocol = IPPROTO_UDP;
327 iph->check = 0;
328 put_unaligned(htonl(np->local_ip), &(iph->saddr));
329 put_unaligned(htonl(np->remote_ip), &(iph->daddr));
330 iph->check = ip_fast_csum((unsigned char *)iph, iph->ihl);
331
332 eth = (struct ethhdr *) skb_push(skb, ETH_HLEN);
Arnaldo Carvalho de Melo459a98e2007-03-19 15:30:44 -0700333 skb_reset_mac_header(skb);
Stephen Hemminger206daaf2006-10-19 23:58:23 -0700334 skb->protocol = eth->h_proto = htons(ETH_P_IP);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700335 memcpy(eth->h_source, np->local_mac, 6);
336 memcpy(eth->h_dest, np->remote_mac, 6);
337
338 skb->dev = np->dev;
339
340 netpoll_send_skb(np, skb);
341}
342
343static void arp_reply(struct sk_buff *skb)
344{
Jeff Moyer115c1d62005-06-22 22:05:31 -0700345 struct netpoll_info *npinfo = skb->dev->npinfo;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700346 struct arphdr *arp;
347 unsigned char *arp_ptr;
348 int size, type = ARPOP_REPLY, ptype = ETH_P_ARP;
Al Viro252e33462006-11-14 20:48:11 -0800349 __be32 sip, tip;
Neil Horman47bbec02006-12-08 00:05:55 -0800350 unsigned char *sha;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351 struct sk_buff *send_skb;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700352 struct netpoll *np = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700353
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700354 if (npinfo->rx_np && npinfo->rx_np->dev == skb->dev)
355 np = npinfo->rx_np;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700356 if (!np)
357 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700358
359 /* No arp on this interface */
360 if (skb->dev->flags & IFF_NOARP)
361 return;
362
363 if (!pskb_may_pull(skb, (sizeof(struct arphdr) +
364 (2 * skb->dev->addr_len) +
365 (2 * sizeof(u32)))))
366 return;
367
Arnaldo Carvalho de Meloc1d2bbe2007-04-10 20:45:18 -0700368 skb_reset_network_header(skb);
Arnaldo Carvalho de Melobadff6d2007-03-13 13:06:52 -0300369 skb_reset_transport_header(skb);
Arnaldo Carvalho de Melod0a92be2007-03-12 20:56:31 -0300370 arp = arp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700371
372 if ((arp->ar_hrd != htons(ARPHRD_ETHER) &&
373 arp->ar_hrd != htons(ARPHRD_IEEE802)) ||
374 arp->ar_pro != htons(ETH_P_IP) ||
375 arp->ar_op != htons(ARPOP_REQUEST))
376 return;
377
Neil Horman47bbec02006-12-08 00:05:55 -0800378 arp_ptr = (unsigned char *)(arp+1);
379 /* save the location of the src hw addr */
380 sha = arp_ptr;
381 arp_ptr += skb->dev->addr_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700382 memcpy(&sip, arp_ptr, 4);
Neil Horman47bbec02006-12-08 00:05:55 -0800383 arp_ptr += 4;
384 /* if we actually cared about dst hw addr, it would get copied here */
385 arp_ptr += skb->dev->addr_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700386 memcpy(&tip, arp_ptr, 4);
387
388 /* Should we ignore arp? */
389 if (tip != htonl(np->local_ip) || LOOPBACK(tip) || MULTICAST(tip))
390 return;
391
392 size = sizeof(struct arphdr) + 2 * (skb->dev->addr_len + 4);
393 send_skb = find_skb(np, size + LL_RESERVED_SPACE(np->dev),
394 LL_RESERVED_SPACE(np->dev));
395
396 if (!send_skb)
397 return;
398
Arnaldo Carvalho de Meloc1d2bbe2007-04-10 20:45:18 -0700399 skb_reset_network_header(send_skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700400 arp = (struct arphdr *) skb_put(send_skb, size);
401 send_skb->dev = skb->dev;
402 send_skb->protocol = htons(ETH_P_ARP);
403
404 /* Fill the device header for the ARP frame */
405
406 if (np->dev->hard_header &&
407 np->dev->hard_header(send_skb, skb->dev, ptype,
Neil Horman47bbec02006-12-08 00:05:55 -0800408 sha, np->local_mac,
David S. Millerc68b9072006-11-14 20:40:49 -0800409 send_skb->len) < 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700410 kfree_skb(send_skb);
411 return;
412 }
413
414 /*
415 * Fill out the arp protocol part.
416 *
417 * we only support ethernet device type,
418 * which (according to RFC 1390) should always equal 1 (Ethernet).
419 */
420
421 arp->ar_hrd = htons(np->dev->type);
422 arp->ar_pro = htons(ETH_P_IP);
423 arp->ar_hln = np->dev->addr_len;
424 arp->ar_pln = 4;
425 arp->ar_op = htons(type);
426
427 arp_ptr=(unsigned char *)(arp + 1);
428 memcpy(arp_ptr, np->dev->dev_addr, np->dev->addr_len);
429 arp_ptr += np->dev->addr_len;
430 memcpy(arp_ptr, &tip, 4);
431 arp_ptr += 4;
Neil Horman47bbec02006-12-08 00:05:55 -0800432 memcpy(arp_ptr, sha, np->dev->addr_len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700433 arp_ptr += np->dev->addr_len;
434 memcpy(arp_ptr, &sip, 4);
435
436 netpoll_send_skb(np, send_skb);
437}
438
439int __netpoll_rx(struct sk_buff *skb)
440{
441 int proto, len, ulen;
442 struct iphdr *iph;
443 struct udphdr *uh;
Neil Horman068c6e92006-06-26 00:04:27 -0700444 struct netpoll_info *npi = skb->dev->npinfo;
445 struct netpoll *np = npi->rx_np;
446
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700447 if (!np)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700448 goto out;
449 if (skb->dev->type != ARPHRD_ETHER)
450 goto out;
451
452 /* check if netpoll clients need ARP */
YOSHIFUJI Hideaki724800d2007-03-25 20:13:04 -0700453 if (skb->protocol == htons(ETH_P_ARP) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700454 atomic_read(&trapped)) {
Neil Horman068c6e92006-06-26 00:04:27 -0700455 skb_queue_tail(&npi->arp_tx, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700456 return 1;
457 }
458
459 proto = ntohs(eth_hdr(skb)->h_proto);
460 if (proto != ETH_P_IP)
461 goto out;
462 if (skb->pkt_type == PACKET_OTHERHOST)
463 goto out;
464 if (skb_shared(skb))
465 goto out;
466
467 iph = (struct iphdr *)skb->data;
468 if (!pskb_may_pull(skb, sizeof(struct iphdr)))
469 goto out;
470 if (iph->ihl < 5 || iph->version != 4)
471 goto out;
472 if (!pskb_may_pull(skb, iph->ihl*4))
473 goto out;
474 if (ip_fast_csum((u8 *)iph, iph->ihl) != 0)
475 goto out;
476
477 len = ntohs(iph->tot_len);
478 if (skb->len < len || len < iph->ihl*4)
479 goto out;
480
Aubrey.Li5e7d7fa2007-04-17 12:40:20 -0700481 /*
482 * Our transport medium may have padded the buffer out.
483 * Now We trim to the true length of the frame.
484 */
485 if (pskb_trim_rcsum(skb, len))
486 goto out;
487
Linus Torvalds1da177e2005-04-16 15:20:36 -0700488 if (iph->protocol != IPPROTO_UDP)
489 goto out;
490
491 len -= iph->ihl*4;
492 uh = (struct udphdr *)(((char *)iph) + iph->ihl*4);
493 ulen = ntohs(uh->len);
494
495 if (ulen != len)
496 goto out;
Herbert Xufb286bb2005-11-10 13:01:24 -0800497 if (checksum_udp(skb, uh, ulen, iph->saddr, iph->daddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700498 goto out;
499 if (np->local_ip && np->local_ip != ntohl(iph->daddr))
500 goto out;
501 if (np->remote_ip && np->remote_ip != ntohl(iph->saddr))
502 goto out;
503 if (np->local_port && np->local_port != ntohs(uh->dest))
504 goto out;
505
506 np->rx_hook(np, ntohs(uh->source),
507 (char *)(uh+1),
508 ulen - sizeof(struct udphdr));
509
510 kfree_skb(skb);
511 return 1;
512
513out:
514 if (atomic_read(&trapped)) {
515 kfree_skb(skb);
516 return 1;
517 }
518
519 return 0;
520}
521
522int netpoll_parse_options(struct netpoll *np, char *opt)
523{
524 char *cur=opt, *delim;
525
David S. Millerc68b9072006-11-14 20:40:49 -0800526 if (*cur != '@') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700527 if ((delim = strchr(cur, '@')) == NULL)
528 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800529 *delim = 0;
530 np->local_port = simple_strtol(cur, NULL, 10);
531 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700532 }
533 cur++;
534 printk(KERN_INFO "%s: local port %d\n", np->name, np->local_port);
535
David S. Millerc68b9072006-11-14 20:40:49 -0800536 if (*cur != '/') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700537 if ((delim = strchr(cur, '/')) == NULL)
538 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800539 *delim = 0;
540 np->local_ip = ntohl(in_aton(cur));
541 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700542
543 printk(KERN_INFO "%s: local IP %d.%d.%d.%d\n",
544 np->name, HIPQUAD(np->local_ip));
545 }
546 cur++;
547
David S. Millerc68b9072006-11-14 20:40:49 -0800548 if (*cur != ',') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700549 /* parse out dev name */
550 if ((delim = strchr(cur, ',')) == NULL)
551 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800552 *delim = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700553 strlcpy(np->dev_name, cur, sizeof(np->dev_name));
David S. Millerc68b9072006-11-14 20:40:49 -0800554 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700555 }
556 cur++;
557
558 printk(KERN_INFO "%s: interface %s\n", np->name, np->dev_name);
559
David S. Millerc68b9072006-11-14 20:40:49 -0800560 if (*cur != '@') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700561 /* dst port */
562 if ((delim = strchr(cur, '@')) == NULL)
563 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800564 *delim = 0;
565 np->remote_port = simple_strtol(cur, NULL, 10);
566 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700567 }
568 cur++;
569 printk(KERN_INFO "%s: remote port %d\n", np->name, np->remote_port);
570
571 /* dst ip */
572 if ((delim = strchr(cur, '/')) == NULL)
573 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800574 *delim = 0;
575 np->remote_ip = ntohl(in_aton(cur));
576 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700577
578 printk(KERN_INFO "%s: remote IP %d.%d.%d.%d\n",
David S. Millerc68b9072006-11-14 20:40:49 -0800579 np->name, HIPQUAD(np->remote_ip));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700580
David S. Millerc68b9072006-11-14 20:40:49 -0800581 if (*cur != 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700582 /* MAC address */
583 if ((delim = strchr(cur, ':')) == NULL)
584 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800585 *delim = 0;
586 np->remote_mac[0] = simple_strtol(cur, NULL, 16);
587 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588 if ((delim = strchr(cur, ':')) == NULL)
589 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800590 *delim = 0;
591 np->remote_mac[1] = simple_strtol(cur, NULL, 16);
592 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700593 if ((delim = strchr(cur, ':')) == NULL)
594 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800595 *delim = 0;
596 np->remote_mac[2] = simple_strtol(cur, NULL, 16);
597 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700598 if ((delim = strchr(cur, ':')) == NULL)
599 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800600 *delim = 0;
601 np->remote_mac[3] = simple_strtol(cur, NULL, 16);
602 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700603 if ((delim = strchr(cur, ':')) == NULL)
604 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800605 *delim = 0;
606 np->remote_mac[4] = simple_strtol(cur, NULL, 16);
607 cur = delim + 1;
608 np->remote_mac[5] = simple_strtol(cur, NULL, 16);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700609 }
610
611 printk(KERN_INFO "%s: remote ethernet address "
612 "%02x:%02x:%02x:%02x:%02x:%02x\n",
613 np->name,
614 np->remote_mac[0],
615 np->remote_mac[1],
616 np->remote_mac[2],
617 np->remote_mac[3],
618 np->remote_mac[4],
619 np->remote_mac[5]);
620
621 return 0;
622
623 parse_failed:
624 printk(KERN_INFO "%s: couldn't parse config at %s!\n",
625 np->name, cur);
626 return -1;
627}
628
629int netpoll_setup(struct netpoll *np)
630{
631 struct net_device *ndev = NULL;
632 struct in_device *in_dev;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700633 struct netpoll_info *npinfo;
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700634 unsigned long flags;
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700635 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700636
637 if (np->dev_name)
638 ndev = dev_get_by_name(np->dev_name);
639 if (!ndev) {
640 printk(KERN_ERR "%s: %s doesn't exist, aborting.\n",
641 np->name, np->dev_name);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700642 return -ENODEV;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700643 }
644
645 np->dev = ndev;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700646 if (!ndev->npinfo) {
647 npinfo = kmalloc(sizeof(*npinfo), GFP_KERNEL);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700648 if (!npinfo) {
649 err = -ENOMEM;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700650 goto release;
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700651 }
Jeff Moyer115c1d62005-06-22 22:05:31 -0700652
Jeff Moyer11513122005-08-11 19:23:04 -0700653 npinfo->rx_flags = 0;
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700654 npinfo->rx_np = NULL;
Ingo Molnara9f6a0d2005-09-09 13:10:41 -0700655 spin_lock_init(&npinfo->poll_lock);
Jeff Moyer115c1d62005-06-22 22:05:31 -0700656 npinfo->poll_owner = -1;
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700657
Ingo Molnara9f6a0d2005-09-09 13:10:41 -0700658 spin_lock_init(&npinfo->rx_lock);
Neil Horman068c6e92006-06-26 00:04:27 -0700659 skb_queue_head_init(&npinfo->arp_tx);
Stephen Hemmingerb6cd27e2006-10-26 15:46:51 -0700660 skb_queue_head_init(&npinfo->txq);
David Howells4c1ac1b2006-12-05 14:37:56 +0000661 INIT_DELAYED_WORK(&npinfo->tx_work, queue_process);
Stephen Hemmingerb6cd27e2006-10-26 15:46:51 -0700662
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700663 atomic_set(&npinfo->refcnt, 1);
664 } else {
Jeff Moyer115c1d62005-06-22 22:05:31 -0700665 npinfo = ndev->npinfo;
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700666 atomic_inc(&npinfo->refcnt);
667 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700668
669 if (!ndev->poll_controller) {
670 printk(KERN_ERR "%s: %s doesn't support polling, aborting.\n",
671 np->name, np->dev_name);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700672 err = -ENOTSUPP;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700673 goto release;
674 }
675
676 if (!netif_running(ndev)) {
677 unsigned long atmost, atleast;
678
679 printk(KERN_INFO "%s: device %s not up yet, forcing it\n",
680 np->name, np->dev_name);
681
Stephen Hemminger6756ae42006-03-20 22:23:58 -0800682 rtnl_lock();
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700683 err = dev_open(ndev);
684 rtnl_unlock();
685
686 if (err) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700687 printk(KERN_ERR "%s: failed to open %s\n",
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700688 np->name, ndev->name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700689 goto release;
690 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700691
692 atleast = jiffies + HZ/10;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900693 atmost = jiffies + 4*HZ;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700694 while (!netif_carrier_ok(ndev)) {
695 if (time_after(jiffies, atmost)) {
696 printk(KERN_NOTICE
697 "%s: timeout waiting for carrier\n",
698 np->name);
699 break;
700 }
701 cond_resched();
702 }
703
704 /* If carrier appears to come up instantly, we don't
705 * trust it and pause so that we don't pump all our
706 * queued console messages into the bitbucket.
707 */
708
709 if (time_before(jiffies, atleast)) {
710 printk(KERN_NOTICE "%s: carrier detect appears"
711 " untrustworthy, waiting 4 seconds\n",
712 np->name);
713 msleep(4000);
714 }
715 }
716
Kris Katterjohn38602882006-01-17 15:15:38 -0800717 if (is_zero_ether_addr(np->local_mac) && ndev->dev_addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700718 memcpy(np->local_mac, ndev->dev_addr, 6);
719
720 if (!np->local_ip) {
721 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -0700722 in_dev = __in_dev_get_rcu(ndev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700723
724 if (!in_dev || !in_dev->ifa_list) {
725 rcu_read_unlock();
726 printk(KERN_ERR "%s: no IP address for %s, aborting\n",
727 np->name, np->dev_name);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700728 err = -EDESTADDRREQ;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700729 goto release;
730 }
731
732 np->local_ip = ntohl(in_dev->ifa_list->ifa_local);
733 rcu_read_unlock();
734 printk(KERN_INFO "%s: local IP %d.%d.%d.%d\n",
735 np->name, HIPQUAD(np->local_ip));
736 }
737
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700738 if (np->rx_hook) {
739 spin_lock_irqsave(&npinfo->rx_lock, flags);
740 npinfo->rx_flags |= NETPOLL_RX_ENABLED;
741 npinfo->rx_np = np;
742 spin_unlock_irqrestore(&npinfo->rx_lock, flags);
743 }
Ingo Molnar26520762005-08-11 19:26:42 -0700744
745 /* fill up the skb queue */
746 refill_skbs();
747
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700748 /* last thing to do is link it to the net device structure */
Jeff Moyer115c1d62005-06-22 22:05:31 -0700749 ndev->npinfo = npinfo;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700750
Matt Mackall53fb95d2005-08-11 19:27:43 -0700751 /* avoid racing with NAPI reading npinfo */
752 synchronize_rcu();
753
Linus Torvalds1da177e2005-04-16 15:20:36 -0700754 return 0;
755
756 release:
Jeff Moyer115c1d62005-06-22 22:05:31 -0700757 if (!ndev->npinfo)
758 kfree(npinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700759 np->dev = NULL;
760 dev_put(ndev);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700761 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700762}
763
David S. Millerc68b9072006-11-14 20:40:49 -0800764static int __init netpoll_init(void)
765{
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800766 skb_queue_head_init(&skb_pool);
767 return 0;
768}
769core_initcall(netpoll_init);
770
Linus Torvalds1da177e2005-04-16 15:20:36 -0700771void netpoll_cleanup(struct netpoll *np)
772{
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700773 struct netpoll_info *npinfo;
774 unsigned long flags;
775
Jeff Moyer115c1d62005-06-22 22:05:31 -0700776 if (np->dev) {
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700777 npinfo = np->dev->npinfo;
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700778 if (npinfo) {
779 if (npinfo->rx_np == np) {
780 spin_lock_irqsave(&npinfo->rx_lock, flags);
781 npinfo->rx_np = NULL;
782 npinfo->rx_flags &= ~NETPOLL_RX_ENABLED;
783 spin_unlock_irqrestore(&npinfo->rx_lock, flags);
784 }
785
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700786 if (atomic_dec_and_test(&npinfo->refcnt)) {
787 skb_queue_purge(&npinfo->arp_tx);
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900788 skb_queue_purge(&npinfo->txq);
Jarek Poplawski25442ca2007-07-05 17:42:44 -0700789 cancel_rearming_delayed_work(&npinfo->tx_work);
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700790
Jarek Poplawski17200812007-06-28 22:11:47 -0700791 /* clean after last, unfinished work */
792 if (!skb_queue_empty(&npinfo->txq)) {
793 struct sk_buff *skb;
794 skb = __skb_dequeue(&npinfo->txq);
795 kfree_skb(skb);
796 }
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700797 kfree(npinfo);
Satyam Sharma1498b3f2007-07-09 15:22:23 -0700798 np->dev->npinfo = NULL;
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700799 }
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700800 }
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700801
Jeff Moyer115c1d62005-06-22 22:05:31 -0700802 dev_put(np->dev);
803 }
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700804
Linus Torvalds1da177e2005-04-16 15:20:36 -0700805 np->dev = NULL;
806}
807
808int netpoll_trap(void)
809{
810 return atomic_read(&trapped);
811}
812
813void netpoll_set_trap(int trap)
814{
815 if (trap)
816 atomic_inc(&trapped);
817 else
818 atomic_dec(&trapped);
819}
820
821EXPORT_SYMBOL(netpoll_set_trap);
822EXPORT_SYMBOL(netpoll_trap);
823EXPORT_SYMBOL(netpoll_parse_options);
824EXPORT_SYMBOL(netpoll_setup);
825EXPORT_SYMBOL(netpoll_cleanup);
826EXPORT_SYMBOL(netpoll_send_udp);
827EXPORT_SYMBOL(netpoll_poll);