blob: 250868f687627f1bbe6be8dc8f2da459e785b94b [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * Common framework for low-level network console, dump, and debugger code
3 *
4 * Sep 8 2003 Matt Mackall <mpm@selenic.com>
5 *
6 * based on the netconsole code from:
7 *
8 * Copyright (C) 2001 Ingo Molnar <mingo@redhat.com>
9 * Copyright (C) 2002 Red Hat, Inc.
10 */
11
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#include <linux/netdevice.h>
13#include <linux/etherdevice.h>
14#include <linux/string.h>
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020015#include <linux/if_arp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <linux/inetdevice.h>
17#include <linux/inet.h>
18#include <linux/interrupt.h>
19#include <linux/netpoll.h>
20#include <linux/sched.h>
21#include <linux/delay.h>
22#include <linux/rcupdate.h>
23#include <linux/workqueue.h>
24#include <net/tcp.h>
25#include <net/udp.h>
26#include <asm/unaligned.h>
27
28/*
29 * We maintain a small pool of fully-sized skbs, to make sure the
30 * message gets out even in extreme OOM situations.
31 */
32
33#define MAX_UDP_CHUNK 1460
34#define MAX_SKBS 32
35#define MAX_QUEUE_DEPTH (MAX_SKBS / 2)
36
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -080037static struct sk_buff_head skb_pool;
Linus Torvalds1da177e2005-04-16 15:20:36 -070038
39static atomic_t trapped;
40
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -070041#define USEC_PER_POLL 50
Linus Torvalds1da177e2005-04-16 15:20:36 -070042#define NETPOLL_RX_ENABLED 1
43#define NETPOLL_RX_DROP 2
44
45#define MAX_SKB_SIZE \
46 (MAX_UDP_CHUNK + sizeof(struct udphdr) + \
47 sizeof(struct iphdr) + sizeof(struct ethhdr))
48
49static void zap_completion_queue(void);
Neil Horman068c6e92006-06-26 00:04:27 -070050static void arp_reply(struct sk_buff *skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -070051
David Howellsc4028952006-11-22 14:57:56 +000052static void queue_process(struct work_struct *work)
Linus Torvalds1da177e2005-04-16 15:20:36 -070053{
David Howells4c1ac1b2006-12-05 14:37:56 +000054 struct netpoll_info *npinfo =
55 container_of(work, struct netpoll_info, tx_work.work);
Linus Torvalds1da177e2005-04-16 15:20:36 -070056 struct sk_buff *skb;
Ingo Molnar36405432006-12-12 17:20:42 +010057 unsigned long flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -070058
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070059 while ((skb = skb_dequeue(&npinfo->txq))) {
60 struct net_device *dev = skb->dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -070061
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070062 if (!netif_device_present(dev) || !netif_running(dev)) {
63 __kfree_skb(skb);
64 continue;
65 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070066
Ingo Molnar36405432006-12-12 17:20:42 +010067 local_irq_save(flags);
68 netif_tx_lock(dev);
Peter P Waskiewicz Jrf25f4e42007-07-06 13:36:20 -070069 if ((netif_queue_stopped(dev) ||
Pavel Emelyanov668f8952007-10-21 17:01:56 -070070 netif_subqueue_stopped(dev, skb)) ||
Peter P Waskiewicz Jrf25f4e42007-07-06 13:36:20 -070071 dev->hard_start_xmit(skb, dev) != NETDEV_TX_OK) {
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070072 skb_queue_head(&npinfo->txq, skb);
Ingo Molnar36405432006-12-12 17:20:42 +010073 netif_tx_unlock(dev);
74 local_irq_restore(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -070075
Jarek Poplawski25442ca2007-07-05 17:42:44 -070076 schedule_delayed_work(&npinfo->tx_work, HZ/10);
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070077 return;
78 }
Ingo Molnar36405432006-12-12 17:20:42 +010079 netif_tx_unlock(dev);
80 local_irq_restore(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -070081 }
82}
83
Al Virob51655b2006-11-14 21:40:42 -080084static __sum16 checksum_udp(struct sk_buff *skb, struct udphdr *uh,
85 unsigned short ulen, __be32 saddr, __be32 daddr)
Linus Torvalds1da177e2005-04-16 15:20:36 -070086{
Al Virod6f5493c2006-11-14 21:26:08 -080087 __wsum psum;
Herbert Xufb286bb2005-11-10 13:01:24 -080088
Herbert Xu60476372007-04-09 11:59:39 -070089 if (uh->check == 0 || skb_csum_unnecessary(skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -070090 return 0;
91
Herbert Xufb286bb2005-11-10 13:01:24 -080092 psum = csum_tcpudp_nofold(saddr, daddr, ulen, IPPROTO_UDP, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -070093
Patrick McHardy84fa7932006-08-29 16:44:56 -070094 if (skb->ip_summed == CHECKSUM_COMPLETE &&
Al Virod3bc23e2006-11-14 21:24:49 -080095 !csum_fold(csum_add(psum, skb->csum)))
Herbert Xufb286bb2005-11-10 13:01:24 -080096 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070097
Herbert Xufb286bb2005-11-10 13:01:24 -080098 skb->csum = psum;
99
100 return __skb_checksum_complete(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700101}
102
103/*
104 * Check whether delayed processing was scheduled for our NIC. If so,
105 * we attempt to grab the poll lock and use ->poll() to pump the card.
106 * If this fails, either we've recursed in ->poll() or it's already
107 * running on another CPU.
108 *
109 * Note: we don't mask interrupts with this lock because we're using
110 * trylock here and interrupts are already disabled in the softirq
111 * case. Further, we test the poll_owner to avoid recursion on UP
112 * systems where the lock doesn't exist.
113 *
114 * In cases where there is bi-directional communications, reading only
115 * one message at a time can lead to packets being dropped by the
116 * network adapter, forcing superfluous retries and possibly timeouts.
117 * Thus, we set our budget to greater than 1.
118 */
David S. Miller0a7606c2007-10-29 21:28:47 -0700119static int poll_one_napi(struct netpoll_info *npinfo,
120 struct napi_struct *napi, int budget)
121{
122 int work;
123
124 /* net_rx_action's ->poll() invocations and our's are
125 * synchronized by this test which is only made while
126 * holding the napi->poll_lock.
127 */
128 if (!test_bit(NAPI_STATE_SCHED, &napi->state))
129 return budget;
130
131 npinfo->rx_flags |= NETPOLL_RX_DROP;
132 atomic_inc(&trapped);
133
134 work = napi->poll(napi, budget);
135
136 atomic_dec(&trapped);
137 npinfo->rx_flags &= ~NETPOLL_RX_DROP;
138
139 return budget - work;
140}
141
Stephen Hemminger51069302007-11-19 19:18:11 -0800142static void poll_napi(struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700143{
Stephen Hemmingerbea33482007-10-03 16:41:36 -0700144 struct napi_struct *napi;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700145 int budget = 16;
146
Stephen Hemminger51069302007-11-19 19:18:11 -0800147 list_for_each_entry(napi, &dev->napi_list, dev_list) {
David S. Miller0a7606c2007-10-29 21:28:47 -0700148 if (napi->poll_owner != smp_processor_id() &&
Stephen Hemmingerbea33482007-10-03 16:41:36 -0700149 spin_trylock(&napi->poll_lock)) {
Stephen Hemminger51069302007-11-19 19:18:11 -0800150 budget = poll_one_napi(dev->npinfo, napi, budget);
Stephen Hemmingerbea33482007-10-03 16:41:36 -0700151 spin_unlock(&napi->poll_lock);
David S. Miller0a7606c2007-10-29 21:28:47 -0700152
153 if (!budget)
154 break;
Stephen Hemmingerbea33482007-10-03 16:41:36 -0700155 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700156 }
157}
158
Neil Horman068c6e92006-06-26 00:04:27 -0700159static void service_arp_queue(struct netpoll_info *npi)
160{
Stephen Hemminger51069302007-11-19 19:18:11 -0800161 if (npi) {
162 struct sk_buff *skb;
Neil Horman068c6e92006-06-26 00:04:27 -0700163
Stephen Hemminger51069302007-11-19 19:18:11 -0800164 while ((skb = skb_dequeue(&npi->arp_tx)))
165 arp_reply(skb);
Neil Horman068c6e92006-06-26 00:04:27 -0700166 }
Neil Horman068c6e92006-06-26 00:04:27 -0700167}
168
Linus Torvalds1da177e2005-04-16 15:20:36 -0700169void netpoll_poll(struct netpoll *np)
170{
Stephen Hemminger51069302007-11-19 19:18:11 -0800171 struct net_device *dev = np->dev;
172
173 if (!dev || !netif_running(dev) || !dev->poll_controller)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700174 return;
175
176 /* Process pending work on NIC */
Stephen Hemminger51069302007-11-19 19:18:11 -0800177 dev->poll_controller(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700178
Stephen Hemminger51069302007-11-19 19:18:11 -0800179 poll_napi(dev);
180
181 service_arp_queue(dev->npinfo);
Neil Horman068c6e92006-06-26 00:04:27 -0700182
Linus Torvalds1da177e2005-04-16 15:20:36 -0700183 zap_completion_queue();
184}
185
186static void refill_skbs(void)
187{
188 struct sk_buff *skb;
189 unsigned long flags;
190
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800191 spin_lock_irqsave(&skb_pool.lock, flags);
192 while (skb_pool.qlen < MAX_SKBS) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700193 skb = alloc_skb(MAX_SKB_SIZE, GFP_ATOMIC);
194 if (!skb)
195 break;
196
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800197 __skb_queue_tail(&skb_pool, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700198 }
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800199 spin_unlock_irqrestore(&skb_pool.lock, flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200}
201
202static void zap_completion_queue(void)
203{
204 unsigned long flags;
205 struct softnet_data *sd = &get_cpu_var(softnet_data);
206
207 if (sd->completion_queue) {
208 struct sk_buff *clist;
209
210 local_irq_save(flags);
211 clist = sd->completion_queue;
212 sd->completion_queue = NULL;
213 local_irq_restore(flags);
214
215 while (clist != NULL) {
216 struct sk_buff *skb = clist;
217 clist = clist->next;
David S. Millerc68b9072006-11-14 20:40:49 -0800218 if (skb->destructor)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700219 dev_kfree_skb_any(skb); /* put this one back */
220 else
221 __kfree_skb(skb);
222 }
223 }
224
225 put_cpu_var(softnet_data);
226}
227
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800228static struct sk_buff *find_skb(struct netpoll *np, int len, int reserve)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229{
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800230 int count = 0;
231 struct sk_buff *skb;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700232
233 zap_completion_queue();
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800234 refill_skbs();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700235repeat:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700236
237 skb = alloc_skb(len, GFP_ATOMIC);
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800238 if (!skb)
239 skb = skb_dequeue(&skb_pool);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700240
241 if (!skb) {
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800242 if (++count < 10) {
243 netpoll_poll(np);
244 goto repeat;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245 }
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800246 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247 }
248
249 atomic_set(&skb->users, 1);
250 skb_reserve(skb, reserve);
251 return skb;
252}
253
Stephen Hemmingerbea33482007-10-03 16:41:36 -0700254static int netpoll_owner_active(struct net_device *dev)
255{
256 struct napi_struct *napi;
257
258 list_for_each_entry(napi, &dev->napi_list, dev_list) {
259 if (napi->poll_owner == smp_processor_id())
260 return 1;
261 }
262 return 0;
263}
264
Linus Torvalds1da177e2005-04-16 15:20:36 -0700265static void netpoll_send_skb(struct netpoll *np, struct sk_buff *skb)
266{
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700267 int status = NETDEV_TX_BUSY;
268 unsigned long tries;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900269 struct net_device *dev = np->dev;
270 struct netpoll_info *npinfo = np->dev->npinfo;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700271
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900272 if (!npinfo || !netif_running(dev) || !netif_device_present(dev)) {
273 __kfree_skb(skb);
274 return;
275 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700277 /* don't get messages out of order, and no recursion */
Stephen Hemmingerbea33482007-10-03 16:41:36 -0700278 if (skb_queue_len(&npinfo->txq) == 0 && !netpoll_owner_active(dev)) {
Andrew Mortona49f99f2006-12-11 17:24:46 -0800279 unsigned long flags;
280
281 local_irq_save(flags);
Stephen Hemminger0db3dc72007-06-27 00:39:42 -0700282 /* try until next clock tick */
283 for (tries = jiffies_to_usecs(1)/USEC_PER_POLL;
284 tries > 0; --tries) {
285 if (netif_tx_trylock(dev)) {
Peter P Waskiewicz Jrf25f4e42007-07-06 13:36:20 -0700286 if (!netif_queue_stopped(dev) &&
Pavel Emelyanov668f8952007-10-21 17:01:56 -0700287 !netif_subqueue_stopped(dev, skb))
Andrew Mortone37b8d92006-12-09 14:01:49 -0800288 status = dev->hard_start_xmit(skb, dev);
Stephen Hemminger0db3dc72007-06-27 00:39:42 -0700289 netif_tx_unlock(dev);
Matt Mackallf0d34592005-08-11 19:25:11 -0700290
Andrew Mortone37b8d92006-12-09 14:01:49 -0800291 if (status == NETDEV_TX_OK)
292 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293
Andrew Mortone37b8d92006-12-09 14:01:49 -0800294 }
Stephen Hemminger0db3dc72007-06-27 00:39:42 -0700295
296 /* tickle device maybe there is some cleanup */
297 netpoll_poll(np);
298
299 udelay(USEC_PER_POLL);
Matt Mackall0db1d6f2005-08-11 19:25:54 -0700300 }
Andrew Mortona49f99f2006-12-11 17:24:46 -0800301 local_irq_restore(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700302 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700303
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700304 if (status != NETDEV_TX_OK) {
Stephen Hemminger5de4a472006-10-26 15:46:55 -0700305 skb_queue_tail(&npinfo->txq, skb);
David Howells4c1ac1b2006-12-05 14:37:56 +0000306 schedule_delayed_work(&npinfo->tx_work,0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700307 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700308}
309
310void netpoll_send_udp(struct netpoll *np, const char *msg, int len)
311{
312 int total_len, eth_len, ip_len, udp_len;
313 struct sk_buff *skb;
314 struct udphdr *udph;
315 struct iphdr *iph;
316 struct ethhdr *eth;
317
318 udp_len = len + sizeof(*udph);
319 ip_len = eth_len = udp_len + sizeof(*iph);
320 total_len = eth_len + ETH_HLEN + NET_IP_ALIGN;
321
322 skb = find_skb(np, total_len, total_len - len);
323 if (!skb)
324 return;
325
Arnaldo Carvalho de Melo27d7ff42007-03-31 11:55:19 -0300326 skb_copy_to_linear_data(skb, msg, len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700327 skb->len += len;
328
Arnaldo Carvalho de Melo4bedb452007-03-13 14:28:48 -0300329 skb_push(skb, sizeof(*udph));
330 skb_reset_transport_header(skb);
331 udph = udp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700332 udph->source = htons(np->local_port);
333 udph->dest = htons(np->remote_port);
334 udph->len = htons(udp_len);
335 udph->check = 0;
Chris Lalancette8e365ee2006-11-07 14:56:19 -0800336 udph->check = csum_tcpudp_magic(htonl(np->local_ip),
337 htonl(np->remote_ip),
338 udp_len, IPPROTO_UDP,
339 csum_partial((unsigned char *)udph, udp_len, 0));
340 if (udph->check == 0)
Al Viro5e57dff2006-11-20 18:08:13 -0800341 udph->check = CSUM_MANGLED_0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700342
Arnaldo Carvalho de Meloe2d1bca2007-04-10 20:46:21 -0700343 skb_push(skb, sizeof(*iph));
344 skb_reset_network_header(skb);
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700345 iph = ip_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700346
347 /* iph->version = 4; iph->ihl = 5; */
348 put_unaligned(0x45, (unsigned char *)iph);
349 iph->tos = 0;
350 put_unaligned(htons(ip_len), &(iph->tot_len));
351 iph->id = 0;
352 iph->frag_off = 0;
353 iph->ttl = 64;
354 iph->protocol = IPPROTO_UDP;
355 iph->check = 0;
356 put_unaligned(htonl(np->local_ip), &(iph->saddr));
357 put_unaligned(htonl(np->remote_ip), &(iph->daddr));
358 iph->check = ip_fast_csum((unsigned char *)iph, iph->ihl);
359
360 eth = (struct ethhdr *) skb_push(skb, ETH_HLEN);
Arnaldo Carvalho de Melo459a98e2007-03-19 15:30:44 -0700361 skb_reset_mac_header(skb);
Stephen Hemminger206daaf2006-10-19 23:58:23 -0700362 skb->protocol = eth->h_proto = htons(ETH_P_IP);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363 memcpy(eth->h_source, np->local_mac, 6);
364 memcpy(eth->h_dest, np->remote_mac, 6);
365
366 skb->dev = np->dev;
367
368 netpoll_send_skb(np, skb);
369}
370
371static void arp_reply(struct sk_buff *skb)
372{
Jeff Moyer115c1d62005-06-22 22:05:31 -0700373 struct netpoll_info *npinfo = skb->dev->npinfo;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700374 struct arphdr *arp;
375 unsigned char *arp_ptr;
376 int size, type = ARPOP_REPLY, ptype = ETH_P_ARP;
Al Viro252e3342006-11-14 20:48:11 -0800377 __be32 sip, tip;
Neil Horman47bbec02006-12-08 00:05:55 -0800378 unsigned char *sha;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700379 struct sk_buff *send_skb;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700380 struct netpoll *np = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700381
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700382 if (npinfo->rx_np && npinfo->rx_np->dev == skb->dev)
383 np = npinfo->rx_np;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700384 if (!np)
385 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700386
387 /* No arp on this interface */
388 if (skb->dev->flags & IFF_NOARP)
389 return;
390
391 if (!pskb_may_pull(skb, (sizeof(struct arphdr) +
392 (2 * skb->dev->addr_len) +
393 (2 * sizeof(u32)))))
394 return;
395
Arnaldo Carvalho de Meloc1d2bbe2007-04-10 20:45:18 -0700396 skb_reset_network_header(skb);
Arnaldo Carvalho de Melobadff6d2007-03-13 13:06:52 -0300397 skb_reset_transport_header(skb);
Arnaldo Carvalho de Melod0a92be2007-03-12 20:56:31 -0300398 arp = arp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700399
400 if ((arp->ar_hrd != htons(ARPHRD_ETHER) &&
401 arp->ar_hrd != htons(ARPHRD_IEEE802)) ||
402 arp->ar_pro != htons(ETH_P_IP) ||
403 arp->ar_op != htons(ARPOP_REQUEST))
404 return;
405
Neil Horman47bbec02006-12-08 00:05:55 -0800406 arp_ptr = (unsigned char *)(arp+1);
407 /* save the location of the src hw addr */
408 sha = arp_ptr;
409 arp_ptr += skb->dev->addr_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700410 memcpy(&sip, arp_ptr, 4);
Neil Horman47bbec02006-12-08 00:05:55 -0800411 arp_ptr += 4;
412 /* if we actually cared about dst hw addr, it would get copied here */
413 arp_ptr += skb->dev->addr_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700414 memcpy(&tip, arp_ptr, 4);
415
416 /* Should we ignore arp? */
417 if (tip != htonl(np->local_ip) || LOOPBACK(tip) || MULTICAST(tip))
418 return;
419
420 size = sizeof(struct arphdr) + 2 * (skb->dev->addr_len + 4);
421 send_skb = find_skb(np, size + LL_RESERVED_SPACE(np->dev),
422 LL_RESERVED_SPACE(np->dev));
423
424 if (!send_skb)
425 return;
426
Arnaldo Carvalho de Meloc1d2bbe2007-04-10 20:45:18 -0700427 skb_reset_network_header(send_skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700428 arp = (struct arphdr *) skb_put(send_skb, size);
429 send_skb->dev = skb->dev;
430 send_skb->protocol = htons(ETH_P_ARP);
431
432 /* Fill the device header for the ARP frame */
Stephen Hemminger0c4e8582007-10-09 01:36:32 -0700433 if (dev_hard_header(send_skb, skb->dev, ptype,
434 sha, np->local_mac,
435 send_skb->len) < 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700436 kfree_skb(send_skb);
437 return;
438 }
439
440 /*
441 * Fill out the arp protocol part.
442 *
443 * we only support ethernet device type,
444 * which (according to RFC 1390) should always equal 1 (Ethernet).
445 */
446
447 arp->ar_hrd = htons(np->dev->type);
448 arp->ar_pro = htons(ETH_P_IP);
449 arp->ar_hln = np->dev->addr_len;
450 arp->ar_pln = 4;
451 arp->ar_op = htons(type);
452
453 arp_ptr=(unsigned char *)(arp + 1);
454 memcpy(arp_ptr, np->dev->dev_addr, np->dev->addr_len);
455 arp_ptr += np->dev->addr_len;
456 memcpy(arp_ptr, &tip, 4);
457 arp_ptr += 4;
Neil Horman47bbec02006-12-08 00:05:55 -0800458 memcpy(arp_ptr, sha, np->dev->addr_len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700459 arp_ptr += np->dev->addr_len;
460 memcpy(arp_ptr, &sip, 4);
461
462 netpoll_send_skb(np, send_skb);
463}
464
465int __netpoll_rx(struct sk_buff *skb)
466{
467 int proto, len, ulen;
468 struct iphdr *iph;
469 struct udphdr *uh;
Neil Horman068c6e92006-06-26 00:04:27 -0700470 struct netpoll_info *npi = skb->dev->npinfo;
471 struct netpoll *np = npi->rx_np;
472
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700473 if (!np)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700474 goto out;
475 if (skb->dev->type != ARPHRD_ETHER)
476 goto out;
477
478 /* check if netpoll clients need ARP */
YOSHIFUJI Hideaki724800d2007-03-25 20:13:04 -0700479 if (skb->protocol == htons(ETH_P_ARP) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700480 atomic_read(&trapped)) {
Neil Horman068c6e92006-06-26 00:04:27 -0700481 skb_queue_tail(&npi->arp_tx, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700482 return 1;
483 }
484
485 proto = ntohs(eth_hdr(skb)->h_proto);
486 if (proto != ETH_P_IP)
487 goto out;
488 if (skb->pkt_type == PACKET_OTHERHOST)
489 goto out;
490 if (skb_shared(skb))
491 goto out;
492
493 iph = (struct iphdr *)skb->data;
494 if (!pskb_may_pull(skb, sizeof(struct iphdr)))
495 goto out;
496 if (iph->ihl < 5 || iph->version != 4)
497 goto out;
498 if (!pskb_may_pull(skb, iph->ihl*4))
499 goto out;
500 if (ip_fast_csum((u8 *)iph, iph->ihl) != 0)
501 goto out;
502
503 len = ntohs(iph->tot_len);
504 if (skb->len < len || len < iph->ihl*4)
505 goto out;
506
Aubrey.Li5e7d7fa2007-04-17 12:40:20 -0700507 /*
508 * Our transport medium may have padded the buffer out.
509 * Now We trim to the true length of the frame.
510 */
511 if (pskb_trim_rcsum(skb, len))
512 goto out;
513
Linus Torvalds1da177e2005-04-16 15:20:36 -0700514 if (iph->protocol != IPPROTO_UDP)
515 goto out;
516
517 len -= iph->ihl*4;
518 uh = (struct udphdr *)(((char *)iph) + iph->ihl*4);
519 ulen = ntohs(uh->len);
520
521 if (ulen != len)
522 goto out;
Herbert Xufb286bb2005-11-10 13:01:24 -0800523 if (checksum_udp(skb, uh, ulen, iph->saddr, iph->daddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700524 goto out;
525 if (np->local_ip && np->local_ip != ntohl(iph->daddr))
526 goto out;
527 if (np->remote_ip && np->remote_ip != ntohl(iph->saddr))
528 goto out;
529 if (np->local_port && np->local_port != ntohs(uh->dest))
530 goto out;
531
532 np->rx_hook(np, ntohs(uh->source),
533 (char *)(uh+1),
534 ulen - sizeof(struct udphdr));
535
536 kfree_skb(skb);
537 return 1;
538
539out:
540 if (atomic_read(&trapped)) {
541 kfree_skb(skb);
542 return 1;
543 }
544
545 return 0;
546}
547
Satyam Sharma0bcc1812007-08-10 15:35:05 -0700548void netpoll_print_options(struct netpoll *np)
549{
Joe Perches0795af52007-10-03 17:59:30 -0700550 DECLARE_MAC_BUF(mac);
Satyam Sharma0bcc1812007-08-10 15:35:05 -0700551 printk(KERN_INFO "%s: local port %d\n",
552 np->name, np->local_port);
553 printk(KERN_INFO "%s: local IP %d.%d.%d.%d\n",
554 np->name, HIPQUAD(np->local_ip));
555 printk(KERN_INFO "%s: interface %s\n",
556 np->name, np->dev_name);
557 printk(KERN_INFO "%s: remote port %d\n",
558 np->name, np->remote_port);
559 printk(KERN_INFO "%s: remote IP %d.%d.%d.%d\n",
560 np->name, HIPQUAD(np->remote_ip));
Joe Perches0795af52007-10-03 17:59:30 -0700561 printk(KERN_INFO "%s: remote ethernet address %s\n",
562 np->name, print_mac(mac, np->remote_mac));
Satyam Sharma0bcc1812007-08-10 15:35:05 -0700563}
564
Linus Torvalds1da177e2005-04-16 15:20:36 -0700565int netpoll_parse_options(struct netpoll *np, char *opt)
566{
567 char *cur=opt, *delim;
568
David S. Millerc68b9072006-11-14 20:40:49 -0800569 if (*cur != '@') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700570 if ((delim = strchr(cur, '@')) == NULL)
571 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800572 *delim = 0;
573 np->local_port = simple_strtol(cur, NULL, 10);
574 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700575 }
576 cur++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700577
David S. Millerc68b9072006-11-14 20:40:49 -0800578 if (*cur != '/') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700579 if ((delim = strchr(cur, '/')) == NULL)
580 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800581 *delim = 0;
582 np->local_ip = ntohl(in_aton(cur));
583 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700584 }
585 cur++;
586
David S. Millerc68b9072006-11-14 20:40:49 -0800587 if (*cur != ',') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588 /* parse out dev name */
589 if ((delim = strchr(cur, ',')) == NULL)
590 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800591 *delim = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700592 strlcpy(np->dev_name, cur, sizeof(np->dev_name));
David S. Millerc68b9072006-11-14 20:40:49 -0800593 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700594 }
595 cur++;
596
David S. Millerc68b9072006-11-14 20:40:49 -0800597 if (*cur != '@') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700598 /* dst port */
599 if ((delim = strchr(cur, '@')) == NULL)
600 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800601 *delim = 0;
602 np->remote_port = simple_strtol(cur, NULL, 10);
603 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700604 }
605 cur++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700606
607 /* dst ip */
608 if ((delim = strchr(cur, '/')) == NULL)
609 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800610 *delim = 0;
611 np->remote_ip = ntohl(in_aton(cur));
612 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700613
David S. Millerc68b9072006-11-14 20:40:49 -0800614 if (*cur != 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700615 /* MAC address */
616 if ((delim = strchr(cur, ':')) == NULL)
617 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800618 *delim = 0;
619 np->remote_mac[0] = simple_strtol(cur, NULL, 16);
620 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700621 if ((delim = strchr(cur, ':')) == NULL)
622 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800623 *delim = 0;
624 np->remote_mac[1] = simple_strtol(cur, NULL, 16);
625 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700626 if ((delim = strchr(cur, ':')) == NULL)
627 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800628 *delim = 0;
629 np->remote_mac[2] = simple_strtol(cur, NULL, 16);
630 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700631 if ((delim = strchr(cur, ':')) == NULL)
632 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800633 *delim = 0;
634 np->remote_mac[3] = simple_strtol(cur, NULL, 16);
635 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700636 if ((delim = strchr(cur, ':')) == NULL)
637 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800638 *delim = 0;
639 np->remote_mac[4] = simple_strtol(cur, NULL, 16);
640 cur = delim + 1;
641 np->remote_mac[5] = simple_strtol(cur, NULL, 16);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700642 }
643
Satyam Sharma0bcc1812007-08-10 15:35:05 -0700644 netpoll_print_options(np);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700645
646 return 0;
647
648 parse_failed:
649 printk(KERN_INFO "%s: couldn't parse config at %s!\n",
650 np->name, cur);
651 return -1;
652}
653
654int netpoll_setup(struct netpoll *np)
655{
656 struct net_device *ndev = NULL;
657 struct in_device *in_dev;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700658 struct netpoll_info *npinfo;
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700659 unsigned long flags;
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700660 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700661
662 if (np->dev_name)
Eric W. Biederman881d9662007-09-17 11:56:21 -0700663 ndev = dev_get_by_name(&init_net, np->dev_name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700664 if (!ndev) {
665 printk(KERN_ERR "%s: %s doesn't exist, aborting.\n",
666 np->name, np->dev_name);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700667 return -ENODEV;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700668 }
669
670 np->dev = ndev;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700671 if (!ndev->npinfo) {
672 npinfo = kmalloc(sizeof(*npinfo), GFP_KERNEL);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700673 if (!npinfo) {
674 err = -ENOMEM;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700675 goto release;
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700676 }
Jeff Moyer115c1d62005-06-22 22:05:31 -0700677
Jeff Moyer11513122005-08-11 19:23:04 -0700678 npinfo->rx_flags = 0;
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700679 npinfo->rx_np = NULL;
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700680
Ingo Molnara9f6a0d2005-09-09 13:10:41 -0700681 spin_lock_init(&npinfo->rx_lock);
Neil Horman068c6e92006-06-26 00:04:27 -0700682 skb_queue_head_init(&npinfo->arp_tx);
Stephen Hemmingerb6cd27e2006-10-26 15:46:51 -0700683 skb_queue_head_init(&npinfo->txq);
David Howells4c1ac1b2006-12-05 14:37:56 +0000684 INIT_DELAYED_WORK(&npinfo->tx_work, queue_process);
Stephen Hemmingerb6cd27e2006-10-26 15:46:51 -0700685
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700686 atomic_set(&npinfo->refcnt, 1);
687 } else {
Jeff Moyer115c1d62005-06-22 22:05:31 -0700688 npinfo = ndev->npinfo;
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700689 atomic_inc(&npinfo->refcnt);
690 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700691
692 if (!ndev->poll_controller) {
693 printk(KERN_ERR "%s: %s doesn't support polling, aborting.\n",
694 np->name, np->dev_name);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700695 err = -ENOTSUPP;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700696 goto release;
697 }
698
699 if (!netif_running(ndev)) {
700 unsigned long atmost, atleast;
701
702 printk(KERN_INFO "%s: device %s not up yet, forcing it\n",
703 np->name, np->dev_name);
704
Stephen Hemminger6756ae42006-03-20 22:23:58 -0800705 rtnl_lock();
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700706 err = dev_open(ndev);
707 rtnl_unlock();
708
709 if (err) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700710 printk(KERN_ERR "%s: failed to open %s\n",
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700711 np->name, ndev->name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700712 goto release;
713 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700714
715 atleast = jiffies + HZ/10;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900716 atmost = jiffies + 4*HZ;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700717 while (!netif_carrier_ok(ndev)) {
718 if (time_after(jiffies, atmost)) {
719 printk(KERN_NOTICE
720 "%s: timeout waiting for carrier\n",
721 np->name);
722 break;
723 }
724 cond_resched();
725 }
726
727 /* If carrier appears to come up instantly, we don't
728 * trust it and pause so that we don't pump all our
729 * queued console messages into the bitbucket.
730 */
731
732 if (time_before(jiffies, atleast)) {
733 printk(KERN_NOTICE "%s: carrier detect appears"
734 " untrustworthy, waiting 4 seconds\n",
735 np->name);
736 msleep(4000);
737 }
738 }
739
Kris Katterjohn38602882006-01-17 15:15:38 -0800740 if (is_zero_ether_addr(np->local_mac) && ndev->dev_addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700741 memcpy(np->local_mac, ndev->dev_addr, 6);
742
743 if (!np->local_ip) {
744 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -0700745 in_dev = __in_dev_get_rcu(ndev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700746
747 if (!in_dev || !in_dev->ifa_list) {
748 rcu_read_unlock();
749 printk(KERN_ERR "%s: no IP address for %s, aborting\n",
750 np->name, np->dev_name);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700751 err = -EDESTADDRREQ;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700752 goto release;
753 }
754
755 np->local_ip = ntohl(in_dev->ifa_list->ifa_local);
756 rcu_read_unlock();
757 printk(KERN_INFO "%s: local IP %d.%d.%d.%d\n",
758 np->name, HIPQUAD(np->local_ip));
759 }
760
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700761 if (np->rx_hook) {
762 spin_lock_irqsave(&npinfo->rx_lock, flags);
763 npinfo->rx_flags |= NETPOLL_RX_ENABLED;
764 npinfo->rx_np = np;
765 spin_unlock_irqrestore(&npinfo->rx_lock, flags);
766 }
Ingo Molnar26520762005-08-11 19:26:42 -0700767
768 /* fill up the skb queue */
769 refill_skbs();
770
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700771 /* last thing to do is link it to the net device structure */
Jeff Moyer115c1d62005-06-22 22:05:31 -0700772 ndev->npinfo = npinfo;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700773
Matt Mackall53fb95d2005-08-11 19:27:43 -0700774 /* avoid racing with NAPI reading npinfo */
775 synchronize_rcu();
776
Linus Torvalds1da177e2005-04-16 15:20:36 -0700777 return 0;
778
779 release:
Jeff Moyer115c1d62005-06-22 22:05:31 -0700780 if (!ndev->npinfo)
781 kfree(npinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700782 np->dev = NULL;
783 dev_put(ndev);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700784 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700785}
786
David S. Millerc68b9072006-11-14 20:40:49 -0800787static int __init netpoll_init(void)
788{
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800789 skb_queue_head_init(&skb_pool);
790 return 0;
791}
792core_initcall(netpoll_init);
793
Linus Torvalds1da177e2005-04-16 15:20:36 -0700794void netpoll_cleanup(struct netpoll *np)
795{
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700796 struct netpoll_info *npinfo;
797 unsigned long flags;
798
Jeff Moyer115c1d62005-06-22 22:05:31 -0700799 if (np->dev) {
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700800 npinfo = np->dev->npinfo;
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700801 if (npinfo) {
802 if (npinfo->rx_np == np) {
803 spin_lock_irqsave(&npinfo->rx_lock, flags);
804 npinfo->rx_np = NULL;
805 npinfo->rx_flags &= ~NETPOLL_RX_ENABLED;
806 spin_unlock_irqrestore(&npinfo->rx_lock, flags);
807 }
808
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700809 if (atomic_dec_and_test(&npinfo->refcnt)) {
810 skb_queue_purge(&npinfo->arp_tx);
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900811 skb_queue_purge(&npinfo->txq);
Jarek Poplawski25442ca2007-07-05 17:42:44 -0700812 cancel_rearming_delayed_work(&npinfo->tx_work);
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700813
Jarek Poplawski17200812007-06-28 22:11:47 -0700814 /* clean after last, unfinished work */
Stephen Hemminger0adc9ad2007-11-19 19:15:03 -0800815 __skb_queue_purge(&npinfo->txq);
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700816 kfree(npinfo);
Satyam Sharma1498b3f2007-07-09 15:22:23 -0700817 np->dev->npinfo = NULL;
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700818 }
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700819 }
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700820
Jeff Moyer115c1d62005-06-22 22:05:31 -0700821 dev_put(np->dev);
822 }
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700823
Linus Torvalds1da177e2005-04-16 15:20:36 -0700824 np->dev = NULL;
825}
826
827int netpoll_trap(void)
828{
829 return atomic_read(&trapped);
830}
831
832void netpoll_set_trap(int trap)
833{
834 if (trap)
835 atomic_inc(&trapped);
836 else
837 atomic_dec(&trapped);
838}
839
840EXPORT_SYMBOL(netpoll_set_trap);
841EXPORT_SYMBOL(netpoll_trap);
Satyam Sharma0bcc1812007-08-10 15:35:05 -0700842EXPORT_SYMBOL(netpoll_print_options);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700843EXPORT_SYMBOL(netpoll_parse_options);
844EXPORT_SYMBOL(netpoll_setup);
845EXPORT_SYMBOL(netpoll_cleanup);
846EXPORT_SYMBOL(netpoll_send_udp);
847EXPORT_SYMBOL(netpoll_poll);