blob: f8e74e511ce63c57f0f1ab473a451c32f9965d06 [file] [log] [blame]
/*
 * Common framework for low-level network console, dump, and debugger code
 *
 * Sep 8 2003  Matt Mackall <mpm@selenic.com>
 *
 * based on the netconsole code from:
 *
 * Copyright (C) 2001  Ingo Molnar <mingo@redhat.com>
 * Copyright (C) 2002  Red Hat, Inc.
 */
11
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#include <linux/netdevice.h>
13#include <linux/etherdevice.h>
14#include <linux/string.h>
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020015#include <linux/if_arp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <linux/inetdevice.h>
17#include <linux/inet.h>
18#include <linux/interrupt.h>
19#include <linux/netpoll.h>
20#include <linux/sched.h>
21#include <linux/delay.h>
22#include <linux/rcupdate.h>
23#include <linux/workqueue.h>
24#include <net/tcp.h>
25#include <net/udp.h>
26#include <asm/unaligned.h>
27
28/*
29 * We maintain a small pool of fully-sized skbs, to make sure the
30 * message gets out even in extreme OOM situations.
31 */
32
33#define MAX_UDP_CHUNK 1460
34#define MAX_SKBS 32
35#define MAX_QUEUE_DEPTH (MAX_SKBS / 2)
36
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -080037static struct sk_buff_head skb_pool;
Linus Torvalds1da177e2005-04-16 15:20:36 -070038
39static atomic_t trapped;
40
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -070041#define USEC_PER_POLL 50
Linus Torvalds1da177e2005-04-16 15:20:36 -070042#define NETPOLL_RX_ENABLED 1
43#define NETPOLL_RX_DROP 2
44
45#define MAX_SKB_SIZE \
46 (MAX_UDP_CHUNK + sizeof(struct udphdr) + \
47 sizeof(struct iphdr) + sizeof(struct ethhdr))
48
49static void zap_completion_queue(void);
Neil Horman068c6e92006-06-26 00:04:27 -070050static void arp_reply(struct sk_buff *skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -070051
David Howellsc4028952006-11-22 14:57:56 +000052static void queue_process(struct work_struct *work)
Linus Torvalds1da177e2005-04-16 15:20:36 -070053{
David Howells4c1ac1b2006-12-05 14:37:56 +000054 struct netpoll_info *npinfo =
55 container_of(work, struct netpoll_info, tx_work.work);
Linus Torvalds1da177e2005-04-16 15:20:36 -070056 struct sk_buff *skb;
Ingo Molnar36405432006-12-12 17:20:42 +010057 unsigned long flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -070058
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070059 while ((skb = skb_dequeue(&npinfo->txq))) {
60 struct net_device *dev = skb->dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -070061
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070062 if (!netif_device_present(dev) || !netif_running(dev)) {
63 __kfree_skb(skb);
64 continue;
65 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070066
Ingo Molnar36405432006-12-12 17:20:42 +010067 local_irq_save(flags);
68 netif_tx_lock(dev);
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070069 if (netif_queue_stopped(dev) ||
70 dev->hard_start_xmit(skb, dev) != NETDEV_TX_OK) {
71 skb_queue_head(&npinfo->txq, skb);
Ingo Molnar36405432006-12-12 17:20:42 +010072 netif_tx_unlock(dev);
73 local_irq_restore(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -070074
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070075 schedule_delayed_work(&npinfo->tx_work, HZ/10);
76 return;
77 }
Ingo Molnar36405432006-12-12 17:20:42 +010078 netif_tx_unlock(dev);
79 local_irq_restore(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -070080 }
81}
82
Al Virob51655b2006-11-14 21:40:42 -080083static __sum16 checksum_udp(struct sk_buff *skb, struct udphdr *uh,
84 unsigned short ulen, __be32 saddr, __be32 daddr)
Linus Torvalds1da177e2005-04-16 15:20:36 -070085{
Al Virod6f5493c2006-11-14 21:26:08 -080086 __wsum psum;
Herbert Xufb286bb2005-11-10 13:01:24 -080087
Herbert Xu60476372007-04-09 11:59:39 -070088 if (uh->check == 0 || skb_csum_unnecessary(skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -070089 return 0;
90
Herbert Xufb286bb2005-11-10 13:01:24 -080091 psum = csum_tcpudp_nofold(saddr, daddr, ulen, IPPROTO_UDP, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -070092
Patrick McHardy84fa7932006-08-29 16:44:56 -070093 if (skb->ip_summed == CHECKSUM_COMPLETE &&
Al Virod3bc23e2006-11-14 21:24:49 -080094 !csum_fold(csum_add(psum, skb->csum)))
Herbert Xufb286bb2005-11-10 13:01:24 -080095 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070096
Herbert Xufb286bb2005-11-10 13:01:24 -080097 skb->csum = psum;
98
99 return __skb_checksum_complete(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100}
101
/*
 * Check whether delayed processing was scheduled for our NIC. If so,
 * we attempt to grab the poll lock and use ->poll() to pump the card.
 * If this fails, either we've recursed in ->poll() or it's already
 * running on another CPU.
 *
 * Note: we don't mask interrupts with this lock because we're using
 * trylock here and interrupts are already disabled in the softirq
 * case. Further, we test the poll_owner to avoid recursion on UP
 * systems where the lock doesn't exist.
 *
 * In cases where there is bi-directional communication, reading only
 * one message at a time can lead to packets being dropped by the
 * network adapter, forcing superfluous retries and possibly timeouts.
 * Thus, we set our budget to greater than 1.
 */
118static void poll_napi(struct netpoll *np)
119{
Jeff Moyer115c1d62005-06-22 22:05:31 -0700120 struct netpoll_info *npinfo = np->dev->npinfo;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700121 int budget = 16;
122
123 if (test_bit(__LINK_STATE_RX_SCHED, &np->dev->state) &&
Jeff Moyer115c1d62005-06-22 22:05:31 -0700124 npinfo->poll_owner != smp_processor_id() &&
125 spin_trylock(&npinfo->poll_lock)) {
126 npinfo->rx_flags |= NETPOLL_RX_DROP;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700127 atomic_inc(&trapped);
128
129 np->dev->poll(np->dev, &budget);
130
131 atomic_dec(&trapped);
Jeff Moyer115c1d62005-06-22 22:05:31 -0700132 npinfo->rx_flags &= ~NETPOLL_RX_DROP;
133 spin_unlock(&npinfo->poll_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700134 }
135}
136
Neil Horman068c6e92006-06-26 00:04:27 -0700137static void service_arp_queue(struct netpoll_info *npi)
138{
139 struct sk_buff *skb;
140
141 if (unlikely(!npi))
142 return;
143
144 skb = skb_dequeue(&npi->arp_tx);
145
146 while (skb != NULL) {
147 arp_reply(skb);
148 skb = skb_dequeue(&npi->arp_tx);
149 }
Neil Horman068c6e92006-06-26 00:04:27 -0700150}
151
Linus Torvalds1da177e2005-04-16 15:20:36 -0700152void netpoll_poll(struct netpoll *np)
153{
David S. Millerc68b9072006-11-14 20:40:49 -0800154 if (!np->dev || !netif_running(np->dev) || !np->dev->poll_controller)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 return;
156
157 /* Process pending work on NIC */
158 np->dev->poll_controller(np->dev);
159 if (np->dev->poll)
160 poll_napi(np);
161
Neil Horman068c6e92006-06-26 00:04:27 -0700162 service_arp_queue(np->dev->npinfo);
163
Linus Torvalds1da177e2005-04-16 15:20:36 -0700164 zap_completion_queue();
165}
166
167static void refill_skbs(void)
168{
169 struct sk_buff *skb;
170 unsigned long flags;
171
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800172 spin_lock_irqsave(&skb_pool.lock, flags);
173 while (skb_pool.qlen < MAX_SKBS) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700174 skb = alloc_skb(MAX_SKB_SIZE, GFP_ATOMIC);
175 if (!skb)
176 break;
177
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800178 __skb_queue_tail(&skb_pool, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179 }
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800180 spin_unlock_irqrestore(&skb_pool.lock, flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700181}
182
183static void zap_completion_queue(void)
184{
185 unsigned long flags;
186 struct softnet_data *sd = &get_cpu_var(softnet_data);
187
188 if (sd->completion_queue) {
189 struct sk_buff *clist;
190
191 local_irq_save(flags);
192 clist = sd->completion_queue;
193 sd->completion_queue = NULL;
194 local_irq_restore(flags);
195
196 while (clist != NULL) {
197 struct sk_buff *skb = clist;
198 clist = clist->next;
David S. Millerc68b9072006-11-14 20:40:49 -0800199 if (skb->destructor)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200 dev_kfree_skb_any(skb); /* put this one back */
201 else
202 __kfree_skb(skb);
203 }
204 }
205
206 put_cpu_var(softnet_data);
207}
208
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800209static struct sk_buff *find_skb(struct netpoll *np, int len, int reserve)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210{
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800211 int count = 0;
212 struct sk_buff *skb;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700213
214 zap_completion_queue();
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800215 refill_skbs();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700216repeat:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217
218 skb = alloc_skb(len, GFP_ATOMIC);
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800219 if (!skb)
220 skb = skb_dequeue(&skb_pool);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700221
222 if (!skb) {
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800223 if (++count < 10) {
224 netpoll_poll(np);
225 goto repeat;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700226 }
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800227 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700228 }
229
230 atomic_set(&skb->users, 1);
231 skb_reserve(skb, reserve);
232 return skb;
233}
234
235static void netpoll_send_skb(struct netpoll *np, struct sk_buff *skb)
236{
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700237 int status = NETDEV_TX_BUSY;
238 unsigned long tries;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900239 struct net_device *dev = np->dev;
240 struct netpoll_info *npinfo = np->dev->npinfo;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900242 if (!npinfo || !netif_running(dev) || !netif_device_present(dev)) {
243 __kfree_skb(skb);
244 return;
245 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700247 /* don't get messages out of order, and no recursion */
David S. Millerc68b9072006-11-14 20:40:49 -0800248 if (skb_queue_len(&npinfo->txq) == 0 &&
Andrew Mortone37b8d92006-12-09 14:01:49 -0800249 npinfo->poll_owner != smp_processor_id()) {
Andrew Mortona49f99f2006-12-11 17:24:46 -0800250 unsigned long flags;
251
252 local_irq_save(flags);
Stephen Hemminger0db3dc72007-06-27 00:39:42 -0700253 /* try until next clock tick */
254 for (tries = jiffies_to_usecs(1)/USEC_PER_POLL;
255 tries > 0; --tries) {
256 if (netif_tx_trylock(dev)) {
Andrew Mortone37b8d92006-12-09 14:01:49 -0800257 if (!netif_queue_stopped(dev))
258 status = dev->hard_start_xmit(skb, dev);
Stephen Hemminger0db3dc72007-06-27 00:39:42 -0700259 netif_tx_unlock(dev);
Matt Mackallf0d34592005-08-11 19:25:11 -0700260
Andrew Mortone37b8d92006-12-09 14:01:49 -0800261 if (status == NETDEV_TX_OK)
262 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700263
Andrew Mortone37b8d92006-12-09 14:01:49 -0800264 }
Stephen Hemminger0db3dc72007-06-27 00:39:42 -0700265
266 /* tickle device maybe there is some cleanup */
267 netpoll_poll(np);
268
269 udelay(USEC_PER_POLL);
Matt Mackall0db1d6f2005-08-11 19:25:54 -0700270 }
Andrew Mortona49f99f2006-12-11 17:24:46 -0800271 local_irq_restore(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700273
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700274 if (status != NETDEV_TX_OK) {
Stephen Hemminger5de4a472006-10-26 15:46:55 -0700275 skb_queue_tail(&npinfo->txq, skb);
David Howells4c1ac1b2006-12-05 14:37:56 +0000276 schedule_delayed_work(&npinfo->tx_work,0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700277 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700278}
279
280void netpoll_send_udp(struct netpoll *np, const char *msg, int len)
281{
282 int total_len, eth_len, ip_len, udp_len;
283 struct sk_buff *skb;
284 struct udphdr *udph;
285 struct iphdr *iph;
286 struct ethhdr *eth;
287
288 udp_len = len + sizeof(*udph);
289 ip_len = eth_len = udp_len + sizeof(*iph);
290 total_len = eth_len + ETH_HLEN + NET_IP_ALIGN;
291
292 skb = find_skb(np, total_len, total_len - len);
293 if (!skb)
294 return;
295
Arnaldo Carvalho de Melo27d7ff42007-03-31 11:55:19 -0300296 skb_copy_to_linear_data(skb, msg, len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297 skb->len += len;
298
Arnaldo Carvalho de Melo4bedb452007-03-13 14:28:48 -0300299 skb_push(skb, sizeof(*udph));
300 skb_reset_transport_header(skb);
301 udph = udp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700302 udph->source = htons(np->local_port);
303 udph->dest = htons(np->remote_port);
304 udph->len = htons(udp_len);
305 udph->check = 0;
Chris Lalancette8e365ee2006-11-07 14:56:19 -0800306 udph->check = csum_tcpudp_magic(htonl(np->local_ip),
307 htonl(np->remote_ip),
308 udp_len, IPPROTO_UDP,
309 csum_partial((unsigned char *)udph, udp_len, 0));
310 if (udph->check == 0)
Al Viro5e57dff2006-11-20 18:08:13 -0800311 udph->check = CSUM_MANGLED_0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312
Arnaldo Carvalho de Meloe2d1bca2007-04-10 20:46:21 -0700313 skb_push(skb, sizeof(*iph));
314 skb_reset_network_header(skb);
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700315 iph = ip_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700316
317 /* iph->version = 4; iph->ihl = 5; */
318 put_unaligned(0x45, (unsigned char *)iph);
319 iph->tos = 0;
320 put_unaligned(htons(ip_len), &(iph->tot_len));
321 iph->id = 0;
322 iph->frag_off = 0;
323 iph->ttl = 64;
324 iph->protocol = IPPROTO_UDP;
325 iph->check = 0;
326 put_unaligned(htonl(np->local_ip), &(iph->saddr));
327 put_unaligned(htonl(np->remote_ip), &(iph->daddr));
328 iph->check = ip_fast_csum((unsigned char *)iph, iph->ihl);
329
330 eth = (struct ethhdr *) skb_push(skb, ETH_HLEN);
Arnaldo Carvalho de Melo459a98e2007-03-19 15:30:44 -0700331 skb_reset_mac_header(skb);
Stephen Hemminger206daaf2006-10-19 23:58:23 -0700332 skb->protocol = eth->h_proto = htons(ETH_P_IP);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700333 memcpy(eth->h_source, np->local_mac, 6);
334 memcpy(eth->h_dest, np->remote_mac, 6);
335
336 skb->dev = np->dev;
337
338 netpoll_send_skb(np, skb);
339}
340
341static void arp_reply(struct sk_buff *skb)
342{
Jeff Moyer115c1d62005-06-22 22:05:31 -0700343 struct netpoll_info *npinfo = skb->dev->npinfo;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344 struct arphdr *arp;
345 unsigned char *arp_ptr;
346 int size, type = ARPOP_REPLY, ptype = ETH_P_ARP;
Al Viro252e33462006-11-14 20:48:11 -0800347 __be32 sip, tip;
Neil Horman47bbec02006-12-08 00:05:55 -0800348 unsigned char *sha;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349 struct sk_buff *send_skb;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700350 struct netpoll *np = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700352 if (npinfo->rx_np && npinfo->rx_np->dev == skb->dev)
353 np = npinfo->rx_np;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700354 if (!np)
355 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700356
357 /* No arp on this interface */
358 if (skb->dev->flags & IFF_NOARP)
359 return;
360
361 if (!pskb_may_pull(skb, (sizeof(struct arphdr) +
362 (2 * skb->dev->addr_len) +
363 (2 * sizeof(u32)))))
364 return;
365
Arnaldo Carvalho de Meloc1d2bbe2007-04-10 20:45:18 -0700366 skb_reset_network_header(skb);
Arnaldo Carvalho de Melobadff6d2007-03-13 13:06:52 -0300367 skb_reset_transport_header(skb);
Arnaldo Carvalho de Melod0a92be2007-03-12 20:56:31 -0300368 arp = arp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700369
370 if ((arp->ar_hrd != htons(ARPHRD_ETHER) &&
371 arp->ar_hrd != htons(ARPHRD_IEEE802)) ||
372 arp->ar_pro != htons(ETH_P_IP) ||
373 arp->ar_op != htons(ARPOP_REQUEST))
374 return;
375
Neil Horman47bbec02006-12-08 00:05:55 -0800376 arp_ptr = (unsigned char *)(arp+1);
377 /* save the location of the src hw addr */
378 sha = arp_ptr;
379 arp_ptr += skb->dev->addr_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700380 memcpy(&sip, arp_ptr, 4);
Neil Horman47bbec02006-12-08 00:05:55 -0800381 arp_ptr += 4;
382 /* if we actually cared about dst hw addr, it would get copied here */
383 arp_ptr += skb->dev->addr_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700384 memcpy(&tip, arp_ptr, 4);
385
386 /* Should we ignore arp? */
387 if (tip != htonl(np->local_ip) || LOOPBACK(tip) || MULTICAST(tip))
388 return;
389
390 size = sizeof(struct arphdr) + 2 * (skb->dev->addr_len + 4);
391 send_skb = find_skb(np, size + LL_RESERVED_SPACE(np->dev),
392 LL_RESERVED_SPACE(np->dev));
393
394 if (!send_skb)
395 return;
396
Arnaldo Carvalho de Meloc1d2bbe2007-04-10 20:45:18 -0700397 skb_reset_network_header(send_skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700398 arp = (struct arphdr *) skb_put(send_skb, size);
399 send_skb->dev = skb->dev;
400 send_skb->protocol = htons(ETH_P_ARP);
401
402 /* Fill the device header for the ARP frame */
403
404 if (np->dev->hard_header &&
405 np->dev->hard_header(send_skb, skb->dev, ptype,
Neil Horman47bbec02006-12-08 00:05:55 -0800406 sha, np->local_mac,
David S. Millerc68b9072006-11-14 20:40:49 -0800407 send_skb->len) < 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700408 kfree_skb(send_skb);
409 return;
410 }
411
412 /*
413 * Fill out the arp protocol part.
414 *
415 * we only support ethernet device type,
416 * which (according to RFC 1390) should always equal 1 (Ethernet).
417 */
418
419 arp->ar_hrd = htons(np->dev->type);
420 arp->ar_pro = htons(ETH_P_IP);
421 arp->ar_hln = np->dev->addr_len;
422 arp->ar_pln = 4;
423 arp->ar_op = htons(type);
424
425 arp_ptr=(unsigned char *)(arp + 1);
426 memcpy(arp_ptr, np->dev->dev_addr, np->dev->addr_len);
427 arp_ptr += np->dev->addr_len;
428 memcpy(arp_ptr, &tip, 4);
429 arp_ptr += 4;
Neil Horman47bbec02006-12-08 00:05:55 -0800430 memcpy(arp_ptr, sha, np->dev->addr_len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700431 arp_ptr += np->dev->addr_len;
432 memcpy(arp_ptr, &sip, 4);
433
434 netpoll_send_skb(np, send_skb);
435}
436
437int __netpoll_rx(struct sk_buff *skb)
438{
439 int proto, len, ulen;
440 struct iphdr *iph;
441 struct udphdr *uh;
Neil Horman068c6e92006-06-26 00:04:27 -0700442 struct netpoll_info *npi = skb->dev->npinfo;
443 struct netpoll *np = npi->rx_np;
444
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700445 if (!np)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700446 goto out;
447 if (skb->dev->type != ARPHRD_ETHER)
448 goto out;
449
450 /* check if netpoll clients need ARP */
YOSHIFUJI Hideaki724800d2007-03-25 20:13:04 -0700451 if (skb->protocol == htons(ETH_P_ARP) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700452 atomic_read(&trapped)) {
Neil Horman068c6e92006-06-26 00:04:27 -0700453 skb_queue_tail(&npi->arp_tx, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700454 return 1;
455 }
456
457 proto = ntohs(eth_hdr(skb)->h_proto);
458 if (proto != ETH_P_IP)
459 goto out;
460 if (skb->pkt_type == PACKET_OTHERHOST)
461 goto out;
462 if (skb_shared(skb))
463 goto out;
464
465 iph = (struct iphdr *)skb->data;
466 if (!pskb_may_pull(skb, sizeof(struct iphdr)))
467 goto out;
468 if (iph->ihl < 5 || iph->version != 4)
469 goto out;
470 if (!pskb_may_pull(skb, iph->ihl*4))
471 goto out;
472 if (ip_fast_csum((u8 *)iph, iph->ihl) != 0)
473 goto out;
474
475 len = ntohs(iph->tot_len);
476 if (skb->len < len || len < iph->ihl*4)
477 goto out;
478
Aubrey.Li5e7d7fa2007-04-17 12:40:20 -0700479 /*
480 * Our transport medium may have padded the buffer out.
481 * Now We trim to the true length of the frame.
482 */
483 if (pskb_trim_rcsum(skb, len))
484 goto out;
485
Linus Torvalds1da177e2005-04-16 15:20:36 -0700486 if (iph->protocol != IPPROTO_UDP)
487 goto out;
488
489 len -= iph->ihl*4;
490 uh = (struct udphdr *)(((char *)iph) + iph->ihl*4);
491 ulen = ntohs(uh->len);
492
493 if (ulen != len)
494 goto out;
Herbert Xufb286bb2005-11-10 13:01:24 -0800495 if (checksum_udp(skb, uh, ulen, iph->saddr, iph->daddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700496 goto out;
497 if (np->local_ip && np->local_ip != ntohl(iph->daddr))
498 goto out;
499 if (np->remote_ip && np->remote_ip != ntohl(iph->saddr))
500 goto out;
501 if (np->local_port && np->local_port != ntohs(uh->dest))
502 goto out;
503
504 np->rx_hook(np, ntohs(uh->source),
505 (char *)(uh+1),
506 ulen - sizeof(struct udphdr));
507
508 kfree_skb(skb);
509 return 1;
510
511out:
512 if (atomic_read(&trapped)) {
513 kfree_skb(skb);
514 return 1;
515 }
516
517 return 0;
518}
519
520int netpoll_parse_options(struct netpoll *np, char *opt)
521{
522 char *cur=opt, *delim;
523
David S. Millerc68b9072006-11-14 20:40:49 -0800524 if (*cur != '@') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700525 if ((delim = strchr(cur, '@')) == NULL)
526 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800527 *delim = 0;
528 np->local_port = simple_strtol(cur, NULL, 10);
529 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700530 }
531 cur++;
532 printk(KERN_INFO "%s: local port %d\n", np->name, np->local_port);
533
David S. Millerc68b9072006-11-14 20:40:49 -0800534 if (*cur != '/') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700535 if ((delim = strchr(cur, '/')) == NULL)
536 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800537 *delim = 0;
538 np->local_ip = ntohl(in_aton(cur));
539 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700540
541 printk(KERN_INFO "%s: local IP %d.%d.%d.%d\n",
542 np->name, HIPQUAD(np->local_ip));
543 }
544 cur++;
545
David S. Millerc68b9072006-11-14 20:40:49 -0800546 if (*cur != ',') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700547 /* parse out dev name */
548 if ((delim = strchr(cur, ',')) == NULL)
549 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800550 *delim = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700551 strlcpy(np->dev_name, cur, sizeof(np->dev_name));
David S. Millerc68b9072006-11-14 20:40:49 -0800552 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700553 }
554 cur++;
555
556 printk(KERN_INFO "%s: interface %s\n", np->name, np->dev_name);
557
David S. Millerc68b9072006-11-14 20:40:49 -0800558 if (*cur != '@') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700559 /* dst port */
560 if ((delim = strchr(cur, '@')) == NULL)
561 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800562 *delim = 0;
563 np->remote_port = simple_strtol(cur, NULL, 10);
564 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700565 }
566 cur++;
567 printk(KERN_INFO "%s: remote port %d\n", np->name, np->remote_port);
568
569 /* dst ip */
570 if ((delim = strchr(cur, '/')) == NULL)
571 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800572 *delim = 0;
573 np->remote_ip = ntohl(in_aton(cur));
574 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700575
576 printk(KERN_INFO "%s: remote IP %d.%d.%d.%d\n",
David S. Millerc68b9072006-11-14 20:40:49 -0800577 np->name, HIPQUAD(np->remote_ip));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700578
David S. Millerc68b9072006-11-14 20:40:49 -0800579 if (*cur != 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700580 /* MAC address */
581 if ((delim = strchr(cur, ':')) == NULL)
582 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800583 *delim = 0;
584 np->remote_mac[0] = simple_strtol(cur, NULL, 16);
585 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700586 if ((delim = strchr(cur, ':')) == NULL)
587 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800588 *delim = 0;
589 np->remote_mac[1] = simple_strtol(cur, NULL, 16);
590 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700591 if ((delim = strchr(cur, ':')) == NULL)
592 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800593 *delim = 0;
594 np->remote_mac[2] = simple_strtol(cur, NULL, 16);
595 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700596 if ((delim = strchr(cur, ':')) == NULL)
597 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800598 *delim = 0;
599 np->remote_mac[3] = simple_strtol(cur, NULL, 16);
600 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700601 if ((delim = strchr(cur, ':')) == NULL)
602 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800603 *delim = 0;
604 np->remote_mac[4] = simple_strtol(cur, NULL, 16);
605 cur = delim + 1;
606 np->remote_mac[5] = simple_strtol(cur, NULL, 16);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700607 }
608
609 printk(KERN_INFO "%s: remote ethernet address "
610 "%02x:%02x:%02x:%02x:%02x:%02x\n",
611 np->name,
612 np->remote_mac[0],
613 np->remote_mac[1],
614 np->remote_mac[2],
615 np->remote_mac[3],
616 np->remote_mac[4],
617 np->remote_mac[5]);
618
619 return 0;
620
621 parse_failed:
622 printk(KERN_INFO "%s: couldn't parse config at %s!\n",
623 np->name, cur);
624 return -1;
625}
626
627int netpoll_setup(struct netpoll *np)
628{
629 struct net_device *ndev = NULL;
630 struct in_device *in_dev;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700631 struct netpoll_info *npinfo;
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700632 unsigned long flags;
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700633 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700634
635 if (np->dev_name)
636 ndev = dev_get_by_name(np->dev_name);
637 if (!ndev) {
638 printk(KERN_ERR "%s: %s doesn't exist, aborting.\n",
639 np->name, np->dev_name);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700640 return -ENODEV;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700641 }
642
643 np->dev = ndev;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700644 if (!ndev->npinfo) {
645 npinfo = kmalloc(sizeof(*npinfo), GFP_KERNEL);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700646 if (!npinfo) {
647 err = -ENOMEM;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700648 goto release;
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700649 }
Jeff Moyer115c1d62005-06-22 22:05:31 -0700650
Jeff Moyer11513122005-08-11 19:23:04 -0700651 npinfo->rx_flags = 0;
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700652 npinfo->rx_np = NULL;
Ingo Molnara9f6a0d2005-09-09 13:10:41 -0700653 spin_lock_init(&npinfo->poll_lock);
Jeff Moyer115c1d62005-06-22 22:05:31 -0700654 npinfo->poll_owner = -1;
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700655
Ingo Molnara9f6a0d2005-09-09 13:10:41 -0700656 spin_lock_init(&npinfo->rx_lock);
Neil Horman068c6e92006-06-26 00:04:27 -0700657 skb_queue_head_init(&npinfo->arp_tx);
Stephen Hemmingerb6cd27e2006-10-26 15:46:51 -0700658 skb_queue_head_init(&npinfo->txq);
David Howells4c1ac1b2006-12-05 14:37:56 +0000659 INIT_DELAYED_WORK(&npinfo->tx_work, queue_process);
Stephen Hemmingerb6cd27e2006-10-26 15:46:51 -0700660
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700661 atomic_set(&npinfo->refcnt, 1);
662 } else {
Jeff Moyer115c1d62005-06-22 22:05:31 -0700663 npinfo = ndev->npinfo;
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700664 atomic_inc(&npinfo->refcnt);
665 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700666
667 if (!ndev->poll_controller) {
668 printk(KERN_ERR "%s: %s doesn't support polling, aborting.\n",
669 np->name, np->dev_name);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700670 err = -ENOTSUPP;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700671 goto release;
672 }
673
674 if (!netif_running(ndev)) {
675 unsigned long atmost, atleast;
676
677 printk(KERN_INFO "%s: device %s not up yet, forcing it\n",
678 np->name, np->dev_name);
679
Stephen Hemminger6756ae42006-03-20 22:23:58 -0800680 rtnl_lock();
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700681 err = dev_open(ndev);
682 rtnl_unlock();
683
684 if (err) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700685 printk(KERN_ERR "%s: failed to open %s\n",
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700686 np->name, ndev->name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700687 goto release;
688 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700689
690 atleast = jiffies + HZ/10;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900691 atmost = jiffies + 4*HZ;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700692 while (!netif_carrier_ok(ndev)) {
693 if (time_after(jiffies, atmost)) {
694 printk(KERN_NOTICE
695 "%s: timeout waiting for carrier\n",
696 np->name);
697 break;
698 }
699 cond_resched();
700 }
701
702 /* If carrier appears to come up instantly, we don't
703 * trust it and pause so that we don't pump all our
704 * queued console messages into the bitbucket.
705 */
706
707 if (time_before(jiffies, atleast)) {
708 printk(KERN_NOTICE "%s: carrier detect appears"
709 " untrustworthy, waiting 4 seconds\n",
710 np->name);
711 msleep(4000);
712 }
713 }
714
Kris Katterjohn38602882006-01-17 15:15:38 -0800715 if (is_zero_ether_addr(np->local_mac) && ndev->dev_addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700716 memcpy(np->local_mac, ndev->dev_addr, 6);
717
718 if (!np->local_ip) {
719 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -0700720 in_dev = __in_dev_get_rcu(ndev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700721
722 if (!in_dev || !in_dev->ifa_list) {
723 rcu_read_unlock();
724 printk(KERN_ERR "%s: no IP address for %s, aborting\n",
725 np->name, np->dev_name);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700726 err = -EDESTADDRREQ;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700727 goto release;
728 }
729
730 np->local_ip = ntohl(in_dev->ifa_list->ifa_local);
731 rcu_read_unlock();
732 printk(KERN_INFO "%s: local IP %d.%d.%d.%d\n",
733 np->name, HIPQUAD(np->local_ip));
734 }
735
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700736 if (np->rx_hook) {
737 spin_lock_irqsave(&npinfo->rx_lock, flags);
738 npinfo->rx_flags |= NETPOLL_RX_ENABLED;
739 npinfo->rx_np = np;
740 spin_unlock_irqrestore(&npinfo->rx_lock, flags);
741 }
Ingo Molnar26520762005-08-11 19:26:42 -0700742
743 /* fill up the skb queue */
744 refill_skbs();
745
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700746 /* last thing to do is link it to the net device structure */
Jeff Moyer115c1d62005-06-22 22:05:31 -0700747 ndev->npinfo = npinfo;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700748
Matt Mackall53fb95d2005-08-11 19:27:43 -0700749 /* avoid racing with NAPI reading npinfo */
750 synchronize_rcu();
751
Linus Torvalds1da177e2005-04-16 15:20:36 -0700752 return 0;
753
754 release:
Jeff Moyer115c1d62005-06-22 22:05:31 -0700755 if (!ndev->npinfo)
756 kfree(npinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700757 np->dev = NULL;
758 dev_put(ndev);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700759 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700760}
761
David S. Millerc68b9072006-11-14 20:40:49 -0800762static int __init netpoll_init(void)
763{
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800764 skb_queue_head_init(&skb_pool);
765 return 0;
766}
767core_initcall(netpoll_init);
768
Linus Torvalds1da177e2005-04-16 15:20:36 -0700769void netpoll_cleanup(struct netpoll *np)
770{
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700771 struct netpoll_info *npinfo;
772 unsigned long flags;
773
Jeff Moyer115c1d62005-06-22 22:05:31 -0700774 if (np->dev) {
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700775 npinfo = np->dev->npinfo;
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700776 if (npinfo) {
777 if (npinfo->rx_np == np) {
778 spin_lock_irqsave(&npinfo->rx_lock, flags);
779 npinfo->rx_np = NULL;
780 npinfo->rx_flags &= ~NETPOLL_RX_ENABLED;
781 spin_unlock_irqrestore(&npinfo->rx_lock, flags);
782 }
783
784 np->dev->npinfo = NULL;
785 if (atomic_dec_and_test(&npinfo->refcnt)) {
786 skb_queue_purge(&npinfo->arp_tx);
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900787 skb_queue_purge(&npinfo->txq);
Stephen Hemminger6c43ff12006-10-26 15:46:53 -0700788 cancel_rearming_delayed_work(&npinfo->tx_work);
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900789 flush_scheduled_work();
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700790
791 kfree(npinfo);
792 }
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700793 }
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700794
Jeff Moyer115c1d62005-06-22 22:05:31 -0700795 dev_put(np->dev);
796 }
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700797
Linus Torvalds1da177e2005-04-16 15:20:36 -0700798 np->dev = NULL;
799}
800
801int netpoll_trap(void)
802{
803 return atomic_read(&trapped);
804}
805
806void netpoll_set_trap(int trap)
807{
808 if (trap)
809 atomic_inc(&trapped);
810 else
811 atomic_dec(&trapped);
812}
813
814EXPORT_SYMBOL(netpoll_set_trap);
815EXPORT_SYMBOL(netpoll_trap);
816EXPORT_SYMBOL(netpoll_parse_options);
817EXPORT_SYMBOL(netpoll_setup);
818EXPORT_SYMBOL(netpoll_cleanup);
819EXPORT_SYMBOL(netpoll_send_udp);
820EXPORT_SYMBOL(netpoll_poll);