blob: 4b7e756181c9ec96eea6b0f5397aec3c87008a5a [file] [log] [blame]
/*
 * Common framework for low-level network console, dump, and debugger code
 *
 * Sep 8 2003  Matt Mackall <mpm@selenic.com>
 *
 * based on the netconsole code from:
 *
 * Copyright (C) 2001  Ingo Molnar <mingo@redhat.com>
 * Copyright (C) 2002  Red Hat, Inc.
 */
11
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#include <linux/netdevice.h>
13#include <linux/etherdevice.h>
14#include <linux/string.h>
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020015#include <linux/if_arp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <linux/inetdevice.h>
17#include <linux/inet.h>
18#include <linux/interrupt.h>
19#include <linux/netpoll.h>
20#include <linux/sched.h>
21#include <linux/delay.h>
22#include <linux/rcupdate.h>
23#include <linux/workqueue.h>
24#include <net/tcp.h>
25#include <net/udp.h>
26#include <asm/unaligned.h>
27
28/*
29 * We maintain a small pool of fully-sized skbs, to make sure the
30 * message gets out even in extreme OOM situations.
31 */
32
33#define MAX_UDP_CHUNK 1460
34#define MAX_SKBS 32
35#define MAX_QUEUE_DEPTH (MAX_SKBS / 2)
36
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -080037static struct sk_buff_head skb_pool;
Linus Torvalds1da177e2005-04-16 15:20:36 -070038
39static atomic_t trapped;
40
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -070041#define USEC_PER_POLL 50
David S. Millerd9452e92008-03-04 12:28:49 -080042#define NETPOLL_RX_ENABLED 1
43#define NETPOLL_RX_DROP 2
Linus Torvalds1da177e2005-04-16 15:20:36 -070044
45#define MAX_SKB_SIZE \
46 (MAX_UDP_CHUNK + sizeof(struct udphdr) + \
47 sizeof(struct iphdr) + sizeof(struct ethhdr))
48
49static void zap_completion_queue(void);
Neil Horman068c6e92006-06-26 00:04:27 -070050static void arp_reply(struct sk_buff *skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -070051
David Howellsc4028952006-11-22 14:57:56 +000052static void queue_process(struct work_struct *work)
Linus Torvalds1da177e2005-04-16 15:20:36 -070053{
David Howells4c1ac1b2006-12-05 14:37:56 +000054 struct netpoll_info *npinfo =
55 container_of(work, struct netpoll_info, tx_work.work);
Linus Torvalds1da177e2005-04-16 15:20:36 -070056 struct sk_buff *skb;
Ingo Molnar36405432006-12-12 17:20:42 +010057 unsigned long flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -070058
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070059 while ((skb = skb_dequeue(&npinfo->txq))) {
60 struct net_device *dev = skb->dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -070061
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070062 if (!netif_device_present(dev) || !netif_running(dev)) {
63 __kfree_skb(skb);
64 continue;
65 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070066
Ingo Molnar36405432006-12-12 17:20:42 +010067 local_irq_save(flags);
68 netif_tx_lock(dev);
Peter P Waskiewicz Jrf25f4e42007-07-06 13:36:20 -070069 if ((netif_queue_stopped(dev) ||
Pavel Emelyanov668f8952007-10-21 17:01:56 -070070 netif_subqueue_stopped(dev, skb)) ||
Peter P Waskiewicz Jrf25f4e42007-07-06 13:36:20 -070071 dev->hard_start_xmit(skb, dev) != NETDEV_TX_OK) {
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070072 skb_queue_head(&npinfo->txq, skb);
Ingo Molnar36405432006-12-12 17:20:42 +010073 netif_tx_unlock(dev);
74 local_irq_restore(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -070075
Jarek Poplawski25442ca2007-07-05 17:42:44 -070076 schedule_delayed_work(&npinfo->tx_work, HZ/10);
Stephen Hemminger6c43ff12006-10-26 15:46:53 -070077 return;
78 }
Ingo Molnar36405432006-12-12 17:20:42 +010079 netif_tx_unlock(dev);
80 local_irq_restore(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -070081 }
82}
83
Al Virob51655b2006-11-14 21:40:42 -080084static __sum16 checksum_udp(struct sk_buff *skb, struct udphdr *uh,
85 unsigned short ulen, __be32 saddr, __be32 daddr)
Linus Torvalds1da177e2005-04-16 15:20:36 -070086{
Al Virod6f5493c2006-11-14 21:26:08 -080087 __wsum psum;
Herbert Xufb286bb2005-11-10 13:01:24 -080088
Herbert Xu60476372007-04-09 11:59:39 -070089 if (uh->check == 0 || skb_csum_unnecessary(skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -070090 return 0;
91
Herbert Xufb286bb2005-11-10 13:01:24 -080092 psum = csum_tcpudp_nofold(saddr, daddr, ulen, IPPROTO_UDP, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -070093
Patrick McHardy84fa7932006-08-29 16:44:56 -070094 if (skb->ip_summed == CHECKSUM_COMPLETE &&
Al Virod3bc23e2006-11-14 21:24:49 -080095 !csum_fold(csum_add(psum, skb->csum)))
Herbert Xufb286bb2005-11-10 13:01:24 -080096 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070097
Herbert Xufb286bb2005-11-10 13:01:24 -080098 skb->csum = psum;
99
100 return __skb_checksum_complete(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700101}
102
103/*
104 * Check whether delayed processing was scheduled for our NIC. If so,
105 * we attempt to grab the poll lock and use ->poll() to pump the card.
106 * If this fails, either we've recursed in ->poll() or it's already
107 * running on another CPU.
108 *
109 * Note: we don't mask interrupts with this lock because we're using
110 * trylock here and interrupts are already disabled in the softirq
111 * case. Further, we test the poll_owner to avoid recursion on UP
112 * systems where the lock doesn't exist.
113 *
114 * In cases where there is bi-directional communications, reading only
115 * one message at a time can lead to packets being dropped by the
116 * network adapter, forcing superfluous retries and possibly timeouts.
117 * Thus, we set our budget to greater than 1.
118 */
David S. Miller0a7606c2007-10-29 21:28:47 -0700119static int poll_one_napi(struct netpoll_info *npinfo,
120 struct napi_struct *napi, int budget)
121{
122 int work;
123
124 /* net_rx_action's ->poll() invocations and our's are
125 * synchronized by this test which is only made while
126 * holding the napi->poll_lock.
127 */
128 if (!test_bit(NAPI_STATE_SCHED, &napi->state))
129 return budget;
130
David S. Millerd9452e92008-03-04 12:28:49 -0800131 npinfo->rx_flags |= NETPOLL_RX_DROP;
David S. Miller0a7606c2007-10-29 21:28:47 -0700132 atomic_inc(&trapped);
133
134 work = napi->poll(napi, budget);
135
136 atomic_dec(&trapped);
David S. Millerd9452e92008-03-04 12:28:49 -0800137 npinfo->rx_flags &= ~NETPOLL_RX_DROP;
David S. Miller0a7606c2007-10-29 21:28:47 -0700138
139 return budget - work;
140}
141
Stephen Hemminger51069302007-11-19 19:18:11 -0800142static void poll_napi(struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700143{
Stephen Hemmingerbea33482007-10-03 16:41:36 -0700144 struct napi_struct *napi;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700145 int budget = 16;
146
Stephen Hemminger51069302007-11-19 19:18:11 -0800147 list_for_each_entry(napi, &dev->napi_list, dev_list) {
David S. Miller0a7606c2007-10-29 21:28:47 -0700148 if (napi->poll_owner != smp_processor_id() &&
Stephen Hemmingerbea33482007-10-03 16:41:36 -0700149 spin_trylock(&napi->poll_lock)) {
Stephen Hemminger51069302007-11-19 19:18:11 -0800150 budget = poll_one_napi(dev->npinfo, napi, budget);
Stephen Hemmingerbea33482007-10-03 16:41:36 -0700151 spin_unlock(&napi->poll_lock);
David S. Miller0a7606c2007-10-29 21:28:47 -0700152
153 if (!budget)
154 break;
Stephen Hemmingerbea33482007-10-03 16:41:36 -0700155 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700156 }
157}
158
Neil Horman068c6e92006-06-26 00:04:27 -0700159static void service_arp_queue(struct netpoll_info *npi)
160{
Stephen Hemminger51069302007-11-19 19:18:11 -0800161 if (npi) {
162 struct sk_buff *skb;
Neil Horman068c6e92006-06-26 00:04:27 -0700163
Stephen Hemminger51069302007-11-19 19:18:11 -0800164 while ((skb = skb_dequeue(&npi->arp_tx)))
165 arp_reply(skb);
Neil Horman068c6e92006-06-26 00:04:27 -0700166 }
Neil Horman068c6e92006-06-26 00:04:27 -0700167}
168
Linus Torvalds1da177e2005-04-16 15:20:36 -0700169void netpoll_poll(struct netpoll *np)
170{
Stephen Hemminger51069302007-11-19 19:18:11 -0800171 struct net_device *dev = np->dev;
172
173 if (!dev || !netif_running(dev) || !dev->poll_controller)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700174 return;
175
176 /* Process pending work on NIC */
Stephen Hemminger51069302007-11-19 19:18:11 -0800177 dev->poll_controller(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700178
Stephen Hemminger51069302007-11-19 19:18:11 -0800179 poll_napi(dev);
180
181 service_arp_queue(dev->npinfo);
Neil Horman068c6e92006-06-26 00:04:27 -0700182
Linus Torvalds1da177e2005-04-16 15:20:36 -0700183 zap_completion_queue();
184}
185
186static void refill_skbs(void)
187{
188 struct sk_buff *skb;
189 unsigned long flags;
190
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800191 spin_lock_irqsave(&skb_pool.lock, flags);
192 while (skb_pool.qlen < MAX_SKBS) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700193 skb = alloc_skb(MAX_SKB_SIZE, GFP_ATOMIC);
194 if (!skb)
195 break;
196
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800197 __skb_queue_tail(&skb_pool, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700198 }
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800199 spin_unlock_irqrestore(&skb_pool.lock, flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200}
201
202static void zap_completion_queue(void)
203{
204 unsigned long flags;
205 struct softnet_data *sd = &get_cpu_var(softnet_data);
206
207 if (sd->completion_queue) {
208 struct sk_buff *clist;
209
210 local_irq_save(flags);
211 clist = sd->completion_queue;
212 sd->completion_queue = NULL;
213 local_irq_restore(flags);
214
215 while (clist != NULL) {
216 struct sk_buff *skb = clist;
217 clist = clist->next;
David S. Millerc68b9072006-11-14 20:40:49 -0800218 if (skb->destructor)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700219 dev_kfree_skb_any(skb); /* put this one back */
220 else
221 __kfree_skb(skb);
222 }
223 }
224
225 put_cpu_var(softnet_data);
226}
227
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800228static struct sk_buff *find_skb(struct netpoll *np, int len, int reserve)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229{
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800230 int count = 0;
231 struct sk_buff *skb;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700232
233 zap_completion_queue();
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800234 refill_skbs();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700235repeat:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700236
237 skb = alloc_skb(len, GFP_ATOMIC);
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800238 if (!skb)
239 skb = skb_dequeue(&skb_pool);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700240
241 if (!skb) {
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800242 if (++count < 10) {
243 netpoll_poll(np);
244 goto repeat;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245 }
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800246 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247 }
248
249 atomic_set(&skb->users, 1);
250 skb_reserve(skb, reserve);
251 return skb;
252}
253
Stephen Hemmingerbea33482007-10-03 16:41:36 -0700254static int netpoll_owner_active(struct net_device *dev)
255{
256 struct napi_struct *napi;
257
258 list_for_each_entry(napi, &dev->napi_list, dev_list) {
259 if (napi->poll_owner == smp_processor_id())
260 return 1;
261 }
262 return 0;
263}
264
Linus Torvalds1da177e2005-04-16 15:20:36 -0700265static void netpoll_send_skb(struct netpoll *np, struct sk_buff *skb)
266{
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700267 int status = NETDEV_TX_BUSY;
268 unsigned long tries;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900269 struct net_device *dev = np->dev;
270 struct netpoll_info *npinfo = np->dev->npinfo;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700271
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900272 if (!npinfo || !netif_running(dev) || !netif_device_present(dev)) {
273 __kfree_skb(skb);
274 return;
275 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700277 /* don't get messages out of order, and no recursion */
Stephen Hemmingerbea33482007-10-03 16:41:36 -0700278 if (skb_queue_len(&npinfo->txq) == 0 && !netpoll_owner_active(dev)) {
Andrew Mortona49f99f2006-12-11 17:24:46 -0800279 unsigned long flags;
280
281 local_irq_save(flags);
Stephen Hemminger0db3dc72007-06-27 00:39:42 -0700282 /* try until next clock tick */
283 for (tries = jiffies_to_usecs(1)/USEC_PER_POLL;
284 tries > 0; --tries) {
285 if (netif_tx_trylock(dev)) {
Peter P Waskiewicz Jrf25f4e42007-07-06 13:36:20 -0700286 if (!netif_queue_stopped(dev) &&
Pavel Emelyanov668f8952007-10-21 17:01:56 -0700287 !netif_subqueue_stopped(dev, skb))
Andrew Mortone37b8d92006-12-09 14:01:49 -0800288 status = dev->hard_start_xmit(skb, dev);
Stephen Hemminger0db3dc72007-06-27 00:39:42 -0700289 netif_tx_unlock(dev);
Matt Mackallf0d34592005-08-11 19:25:11 -0700290
Andrew Mortone37b8d92006-12-09 14:01:49 -0800291 if (status == NETDEV_TX_OK)
292 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293
Andrew Mortone37b8d92006-12-09 14:01:49 -0800294 }
Stephen Hemminger0db3dc72007-06-27 00:39:42 -0700295
296 /* tickle device maybe there is some cleanup */
297 netpoll_poll(np);
298
299 udelay(USEC_PER_POLL);
Matt Mackall0db1d6f2005-08-11 19:25:54 -0700300 }
Andrew Mortona49f99f2006-12-11 17:24:46 -0800301 local_irq_restore(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700302 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700303
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700304 if (status != NETDEV_TX_OK) {
Stephen Hemminger5de4a472006-10-26 15:46:55 -0700305 skb_queue_tail(&npinfo->txq, skb);
David Howells4c1ac1b2006-12-05 14:37:56 +0000306 schedule_delayed_work(&npinfo->tx_work,0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700307 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700308}
309
310void netpoll_send_udp(struct netpoll *np, const char *msg, int len)
311{
312 int total_len, eth_len, ip_len, udp_len;
313 struct sk_buff *skb;
314 struct udphdr *udph;
315 struct iphdr *iph;
316 struct ethhdr *eth;
317
318 udp_len = len + sizeof(*udph);
319 ip_len = eth_len = udp_len + sizeof(*iph);
320 total_len = eth_len + ETH_HLEN + NET_IP_ALIGN;
321
322 skb = find_skb(np, total_len, total_len - len);
323 if (!skb)
324 return;
325
Arnaldo Carvalho de Melo27d7ff42007-03-31 11:55:19 -0300326 skb_copy_to_linear_data(skb, msg, len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700327 skb->len += len;
328
Arnaldo Carvalho de Melo4bedb452007-03-13 14:28:48 -0300329 skb_push(skb, sizeof(*udph));
330 skb_reset_transport_header(skb);
331 udph = udp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700332 udph->source = htons(np->local_port);
333 udph->dest = htons(np->remote_port);
334 udph->len = htons(udp_len);
335 udph->check = 0;
Chris Lalancette8e365ee2006-11-07 14:56:19 -0800336 udph->check = csum_tcpudp_magic(htonl(np->local_ip),
337 htonl(np->remote_ip),
338 udp_len, IPPROTO_UDP,
339 csum_partial((unsigned char *)udph, udp_len, 0));
340 if (udph->check == 0)
Al Viro5e57dff2006-11-20 18:08:13 -0800341 udph->check = CSUM_MANGLED_0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700342
Arnaldo Carvalho de Meloe2d1bca2007-04-10 20:46:21 -0700343 skb_push(skb, sizeof(*iph));
344 skb_reset_network_header(skb);
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700345 iph = ip_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700346
347 /* iph->version = 4; iph->ihl = 5; */
348 put_unaligned(0x45, (unsigned char *)iph);
349 iph->tos = 0;
350 put_unaligned(htons(ip_len), &(iph->tot_len));
351 iph->id = 0;
352 iph->frag_off = 0;
353 iph->ttl = 64;
354 iph->protocol = IPPROTO_UDP;
355 iph->check = 0;
356 put_unaligned(htonl(np->local_ip), &(iph->saddr));
357 put_unaligned(htonl(np->remote_ip), &(iph->daddr));
358 iph->check = ip_fast_csum((unsigned char *)iph, iph->ihl);
359
360 eth = (struct ethhdr *) skb_push(skb, ETH_HLEN);
Arnaldo Carvalho de Melo459a98e2007-03-19 15:30:44 -0700361 skb_reset_mac_header(skb);
Stephen Hemminger206daaf2006-10-19 23:58:23 -0700362 skb->protocol = eth->h_proto = htons(ETH_P_IP);
Stephen Hemminger09538642007-11-19 19:23:29 -0800363 memcpy(eth->h_source, np->dev->dev_addr, ETH_ALEN);
364 memcpy(eth->h_dest, np->remote_mac, ETH_ALEN);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700365
366 skb->dev = np->dev;
367
368 netpoll_send_skb(np, skb);
369}
370
371static void arp_reply(struct sk_buff *skb)
372{
Jeff Moyer115c1d62005-06-22 22:05:31 -0700373 struct netpoll_info *npinfo = skb->dev->npinfo;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700374 struct arphdr *arp;
375 unsigned char *arp_ptr;
376 int size, type = ARPOP_REPLY, ptype = ETH_P_ARP;
Al Viro252e3342006-11-14 20:48:11 -0800377 __be32 sip, tip;
Neil Horman47bbec02006-12-08 00:05:55 -0800378 unsigned char *sha;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700379 struct sk_buff *send_skb;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700380 struct netpoll *np = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700381
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700382 if (npinfo->rx_np && npinfo->rx_np->dev == skb->dev)
383 np = npinfo->rx_np;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700384 if (!np)
385 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700386
387 /* No arp on this interface */
388 if (skb->dev->flags & IFF_NOARP)
389 return;
390
391 if (!pskb_may_pull(skb, (sizeof(struct arphdr) +
392 (2 * skb->dev->addr_len) +
393 (2 * sizeof(u32)))))
394 return;
395
Arnaldo Carvalho de Meloc1d2bbe2007-04-10 20:45:18 -0700396 skb_reset_network_header(skb);
Arnaldo Carvalho de Melobadff6d2007-03-13 13:06:52 -0300397 skb_reset_transport_header(skb);
Arnaldo Carvalho de Melod0a92be2007-03-12 20:56:31 -0300398 arp = arp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700399
400 if ((arp->ar_hrd != htons(ARPHRD_ETHER) &&
401 arp->ar_hrd != htons(ARPHRD_IEEE802)) ||
402 arp->ar_pro != htons(ETH_P_IP) ||
403 arp->ar_op != htons(ARPOP_REQUEST))
404 return;
405
Neil Horman47bbec02006-12-08 00:05:55 -0800406 arp_ptr = (unsigned char *)(arp+1);
407 /* save the location of the src hw addr */
408 sha = arp_ptr;
409 arp_ptr += skb->dev->addr_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700410 memcpy(&sip, arp_ptr, 4);
Neil Horman47bbec02006-12-08 00:05:55 -0800411 arp_ptr += 4;
412 /* if we actually cared about dst hw addr, it would get copied here */
413 arp_ptr += skb->dev->addr_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700414 memcpy(&tip, arp_ptr, 4);
415
416 /* Should we ignore arp? */
Joe Perches21cf2252007-12-16 13:44:00 -0800417 if (tip != htonl(np->local_ip) ||
418 ipv4_is_loopback(tip) || ipv4_is_multicast(tip))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700419 return;
420
421 size = sizeof(struct arphdr) + 2 * (skb->dev->addr_len + 4);
422 send_skb = find_skb(np, size + LL_RESERVED_SPACE(np->dev),
423 LL_RESERVED_SPACE(np->dev));
424
425 if (!send_skb)
426 return;
427
Arnaldo Carvalho de Meloc1d2bbe2007-04-10 20:45:18 -0700428 skb_reset_network_header(send_skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700429 arp = (struct arphdr *) skb_put(send_skb, size);
430 send_skb->dev = skb->dev;
431 send_skb->protocol = htons(ETH_P_ARP);
432
433 /* Fill the device header for the ARP frame */
Stephen Hemminger0c4e8582007-10-09 01:36:32 -0700434 if (dev_hard_header(send_skb, skb->dev, ptype,
Stephen Hemminger09538642007-11-19 19:23:29 -0800435 sha, np->dev->dev_addr,
Stephen Hemminger0c4e8582007-10-09 01:36:32 -0700436 send_skb->len) < 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700437 kfree_skb(send_skb);
438 return;
439 }
440
441 /*
442 * Fill out the arp protocol part.
443 *
444 * we only support ethernet device type,
445 * which (according to RFC 1390) should always equal 1 (Ethernet).
446 */
447
448 arp->ar_hrd = htons(np->dev->type);
449 arp->ar_pro = htons(ETH_P_IP);
450 arp->ar_hln = np->dev->addr_len;
451 arp->ar_pln = 4;
452 arp->ar_op = htons(type);
453
454 arp_ptr=(unsigned char *)(arp + 1);
455 memcpy(arp_ptr, np->dev->dev_addr, np->dev->addr_len);
456 arp_ptr += np->dev->addr_len;
457 memcpy(arp_ptr, &tip, 4);
458 arp_ptr += 4;
Neil Horman47bbec02006-12-08 00:05:55 -0800459 memcpy(arp_ptr, sha, np->dev->addr_len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700460 arp_ptr += np->dev->addr_len;
461 memcpy(arp_ptr, &sip, 4);
462
463 netpoll_send_skb(np, send_skb);
464}
465
466int __netpoll_rx(struct sk_buff *skb)
467{
468 int proto, len, ulen;
469 struct iphdr *iph;
470 struct udphdr *uh;
Neil Horman068c6e92006-06-26 00:04:27 -0700471 struct netpoll_info *npi = skb->dev->npinfo;
472 struct netpoll *np = npi->rx_np;
473
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700474 if (!np)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700475 goto out;
476 if (skb->dev->type != ARPHRD_ETHER)
477 goto out;
478
David S. Millerd9452e92008-03-04 12:28:49 -0800479 /* check if netpoll clients need ARP */
YOSHIFUJI Hideaki724800d2007-03-25 20:13:04 -0700480 if (skb->protocol == htons(ETH_P_ARP) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700481 atomic_read(&trapped)) {
Neil Horman068c6e92006-06-26 00:04:27 -0700482 skb_queue_tail(&npi->arp_tx, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700483 return 1;
484 }
485
486 proto = ntohs(eth_hdr(skb)->h_proto);
487 if (proto != ETH_P_IP)
488 goto out;
489 if (skb->pkt_type == PACKET_OTHERHOST)
490 goto out;
491 if (skb_shared(skb))
492 goto out;
493
494 iph = (struct iphdr *)skb->data;
495 if (!pskb_may_pull(skb, sizeof(struct iphdr)))
496 goto out;
497 if (iph->ihl < 5 || iph->version != 4)
498 goto out;
499 if (!pskb_may_pull(skb, iph->ihl*4))
500 goto out;
501 if (ip_fast_csum((u8 *)iph, iph->ihl) != 0)
502 goto out;
503
504 len = ntohs(iph->tot_len);
505 if (skb->len < len || len < iph->ihl*4)
506 goto out;
507
Aubrey.Li5e7d7fa2007-04-17 12:40:20 -0700508 /*
509 * Our transport medium may have padded the buffer out.
510 * Now We trim to the true length of the frame.
511 */
512 if (pskb_trim_rcsum(skb, len))
513 goto out;
514
Linus Torvalds1da177e2005-04-16 15:20:36 -0700515 if (iph->protocol != IPPROTO_UDP)
516 goto out;
517
518 len -= iph->ihl*4;
519 uh = (struct udphdr *)(((char *)iph) + iph->ihl*4);
520 ulen = ntohs(uh->len);
521
522 if (ulen != len)
523 goto out;
Herbert Xufb286bb2005-11-10 13:01:24 -0800524 if (checksum_udp(skb, uh, ulen, iph->saddr, iph->daddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700525 goto out;
526 if (np->local_ip && np->local_ip != ntohl(iph->daddr))
527 goto out;
528 if (np->remote_ip && np->remote_ip != ntohl(iph->saddr))
529 goto out;
530 if (np->local_port && np->local_port != ntohs(uh->dest))
531 goto out;
532
533 np->rx_hook(np, ntohs(uh->source),
534 (char *)(uh+1),
535 ulen - sizeof(struct udphdr));
536
537 kfree_skb(skb);
538 return 1;
539
540out:
541 if (atomic_read(&trapped)) {
542 kfree_skb(skb);
543 return 1;
544 }
545
546 return 0;
547}
548
Satyam Sharma0bcc1812007-08-10 15:35:05 -0700549void netpoll_print_options(struct netpoll *np)
550{
Joe Perches0795af52007-10-03 17:59:30 -0700551 DECLARE_MAC_BUF(mac);
Satyam Sharma0bcc1812007-08-10 15:35:05 -0700552 printk(KERN_INFO "%s: local port %d\n",
553 np->name, np->local_port);
554 printk(KERN_INFO "%s: local IP %d.%d.%d.%d\n",
555 np->name, HIPQUAD(np->local_ip));
556 printk(KERN_INFO "%s: interface %s\n",
557 np->name, np->dev_name);
558 printk(KERN_INFO "%s: remote port %d\n",
559 np->name, np->remote_port);
560 printk(KERN_INFO "%s: remote IP %d.%d.%d.%d\n",
561 np->name, HIPQUAD(np->remote_ip));
Joe Perches0795af52007-10-03 17:59:30 -0700562 printk(KERN_INFO "%s: remote ethernet address %s\n",
563 np->name, print_mac(mac, np->remote_mac));
Satyam Sharma0bcc1812007-08-10 15:35:05 -0700564}
565
Linus Torvalds1da177e2005-04-16 15:20:36 -0700566int netpoll_parse_options(struct netpoll *np, char *opt)
567{
568 char *cur=opt, *delim;
569
David S. Millerc68b9072006-11-14 20:40:49 -0800570 if (*cur != '@') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700571 if ((delim = strchr(cur, '@')) == NULL)
572 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800573 *delim = 0;
574 np->local_port = simple_strtol(cur, NULL, 10);
575 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700576 }
577 cur++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700578
David S. Millerc68b9072006-11-14 20:40:49 -0800579 if (*cur != '/') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700580 if ((delim = strchr(cur, '/')) == NULL)
581 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800582 *delim = 0;
583 np->local_ip = ntohl(in_aton(cur));
584 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700585 }
586 cur++;
587
David S. Millerc68b9072006-11-14 20:40:49 -0800588 if (*cur != ',') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700589 /* parse out dev name */
590 if ((delim = strchr(cur, ',')) == NULL)
591 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800592 *delim = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700593 strlcpy(np->dev_name, cur, sizeof(np->dev_name));
David S. Millerc68b9072006-11-14 20:40:49 -0800594 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700595 }
596 cur++;
597
David S. Millerc68b9072006-11-14 20:40:49 -0800598 if (*cur != '@') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700599 /* dst port */
600 if ((delim = strchr(cur, '@')) == NULL)
601 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800602 *delim = 0;
603 np->remote_port = simple_strtol(cur, NULL, 10);
604 cur = delim;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700605 }
606 cur++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700607
608 /* dst ip */
609 if ((delim = strchr(cur, '/')) == NULL)
610 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800611 *delim = 0;
612 np->remote_ip = ntohl(in_aton(cur));
613 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700614
David S. Millerc68b9072006-11-14 20:40:49 -0800615 if (*cur != 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700616 /* MAC address */
617 if ((delim = strchr(cur, ':')) == NULL)
618 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800619 *delim = 0;
620 np->remote_mac[0] = simple_strtol(cur, NULL, 16);
621 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700622 if ((delim = strchr(cur, ':')) == NULL)
623 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800624 *delim = 0;
625 np->remote_mac[1] = simple_strtol(cur, NULL, 16);
626 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700627 if ((delim = strchr(cur, ':')) == NULL)
628 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800629 *delim = 0;
630 np->remote_mac[2] = simple_strtol(cur, NULL, 16);
631 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700632 if ((delim = strchr(cur, ':')) == NULL)
633 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800634 *delim = 0;
635 np->remote_mac[3] = simple_strtol(cur, NULL, 16);
636 cur = delim + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700637 if ((delim = strchr(cur, ':')) == NULL)
638 goto parse_failed;
David S. Millerc68b9072006-11-14 20:40:49 -0800639 *delim = 0;
640 np->remote_mac[4] = simple_strtol(cur, NULL, 16);
641 cur = delim + 1;
642 np->remote_mac[5] = simple_strtol(cur, NULL, 16);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700643 }
644
Satyam Sharma0bcc1812007-08-10 15:35:05 -0700645 netpoll_print_options(np);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700646
647 return 0;
648
649 parse_failed:
650 printk(KERN_INFO "%s: couldn't parse config at %s!\n",
651 np->name, cur);
652 return -1;
653}
654
655int netpoll_setup(struct netpoll *np)
656{
657 struct net_device *ndev = NULL;
658 struct in_device *in_dev;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700659 struct netpoll_info *npinfo;
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700660 unsigned long flags;
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700661 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700662
663 if (np->dev_name)
Eric W. Biederman881d9662007-09-17 11:56:21 -0700664 ndev = dev_get_by_name(&init_net, np->dev_name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700665 if (!ndev) {
666 printk(KERN_ERR "%s: %s doesn't exist, aborting.\n",
667 np->name, np->dev_name);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700668 return -ENODEV;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700669 }
670
671 np->dev = ndev;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700672 if (!ndev->npinfo) {
673 npinfo = kmalloc(sizeof(*npinfo), GFP_KERNEL);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700674 if (!npinfo) {
675 err = -ENOMEM;
Jeff Moyer115c1d62005-06-22 22:05:31 -0700676 goto release;
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700677 }
Jeff Moyer115c1d62005-06-22 22:05:31 -0700678
David S. Millerd9452e92008-03-04 12:28:49 -0800679 npinfo->rx_flags = 0;
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700680 npinfo->rx_np = NULL;
Stephen Hemminger2bdfe0b2006-10-26 15:46:54 -0700681
Ingo Molnara9f6a0d2005-09-09 13:10:41 -0700682 spin_lock_init(&npinfo->rx_lock);
Neil Horman068c6e92006-06-26 00:04:27 -0700683 skb_queue_head_init(&npinfo->arp_tx);
Stephen Hemmingerb6cd27e2006-10-26 15:46:51 -0700684 skb_queue_head_init(&npinfo->txq);
David Howells4c1ac1b2006-12-05 14:37:56 +0000685 INIT_DELAYED_WORK(&npinfo->tx_work, queue_process);
Stephen Hemmingerb6cd27e2006-10-26 15:46:51 -0700686
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700687 atomic_set(&npinfo->refcnt, 1);
688 } else {
Jeff Moyer115c1d62005-06-22 22:05:31 -0700689 npinfo = ndev->npinfo;
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700690 atomic_inc(&npinfo->refcnt);
691 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700692
693 if (!ndev->poll_controller) {
694 printk(KERN_ERR "%s: %s doesn't support polling, aborting.\n",
695 np->name, np->dev_name);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700696 err = -ENOTSUPP;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700697 goto release;
698 }
699
700 if (!netif_running(ndev)) {
701 unsigned long atmost, atleast;
702
703 printk(KERN_INFO "%s: device %s not up yet, forcing it\n",
704 np->name, np->dev_name);
705
Stephen Hemminger6756ae42006-03-20 22:23:58 -0800706 rtnl_lock();
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700707 err = dev_open(ndev);
708 rtnl_unlock();
709
710 if (err) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700711 printk(KERN_ERR "%s: failed to open %s\n",
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700712 np->name, ndev->name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700713 goto release;
714 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700715
716 atleast = jiffies + HZ/10;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900717 atmost = jiffies + 4*HZ;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700718 while (!netif_carrier_ok(ndev)) {
719 if (time_after(jiffies, atmost)) {
720 printk(KERN_NOTICE
721 "%s: timeout waiting for carrier\n",
722 np->name);
723 break;
724 }
725 cond_resched();
726 }
727
728 /* If carrier appears to come up instantly, we don't
729 * trust it and pause so that we don't pump all our
730 * queued console messages into the bitbucket.
731 */
732
733 if (time_before(jiffies, atleast)) {
734 printk(KERN_NOTICE "%s: carrier detect appears"
735 " untrustworthy, waiting 4 seconds\n",
736 np->name);
737 msleep(4000);
738 }
739 }
740
Linus Torvalds1da177e2005-04-16 15:20:36 -0700741 if (!np->local_ip) {
742 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -0700743 in_dev = __in_dev_get_rcu(ndev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700744
745 if (!in_dev || !in_dev->ifa_list) {
746 rcu_read_unlock();
747 printk(KERN_ERR "%s: no IP address for %s, aborting\n",
748 np->name, np->dev_name);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700749 err = -EDESTADDRREQ;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700750 goto release;
751 }
752
753 np->local_ip = ntohl(in_dev->ifa_list->ifa_local);
754 rcu_read_unlock();
755 printk(KERN_INFO "%s: local IP %d.%d.%d.%d\n",
756 np->name, HIPQUAD(np->local_ip));
757 }
758
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700759 if (np->rx_hook) {
760 spin_lock_irqsave(&npinfo->rx_lock, flags);
David S. Millerd9452e92008-03-04 12:28:49 -0800761 npinfo->rx_flags |= NETPOLL_RX_ENABLED;
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700762 npinfo->rx_np = np;
763 spin_unlock_irqrestore(&npinfo->rx_lock, flags);
764 }
Ingo Molnar26520762005-08-11 19:26:42 -0700765
766 /* fill up the skb queue */
767 refill_skbs();
768
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700769 /* last thing to do is link it to the net device structure */
Jeff Moyer115c1d62005-06-22 22:05:31 -0700770 ndev->npinfo = npinfo;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700771
Matt Mackall53fb95d2005-08-11 19:27:43 -0700772 /* avoid racing with NAPI reading npinfo */
773 synchronize_rcu();
774
Linus Torvalds1da177e2005-04-16 15:20:36 -0700775 return 0;
776
777 release:
Jeff Moyer115c1d62005-06-22 22:05:31 -0700778 if (!ndev->npinfo)
779 kfree(npinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700780 np->dev = NULL;
781 dev_put(ndev);
Stephen Hemmingerb41848b2006-10-26 15:46:52 -0700782 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700783}
784
David S. Millerc68b9072006-11-14 20:40:49 -0800785static int __init netpoll_init(void)
786{
Stephen Hemmingera1bcfac2006-11-14 10:43:58 -0800787 skb_queue_head_init(&skb_pool);
788 return 0;
789}
790core_initcall(netpoll_init);
791
Linus Torvalds1da177e2005-04-16 15:20:36 -0700792void netpoll_cleanup(struct netpoll *np)
793{
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700794 struct netpoll_info *npinfo;
795 unsigned long flags;
796
Jeff Moyer115c1d62005-06-22 22:05:31 -0700797 if (np->dev) {
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700798 npinfo = np->dev->npinfo;
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700799 if (npinfo) {
800 if (npinfo->rx_np == np) {
801 spin_lock_irqsave(&npinfo->rx_lock, flags);
802 npinfo->rx_np = NULL;
David S. Millerd9452e92008-03-04 12:28:49 -0800803 npinfo->rx_flags &= ~NETPOLL_RX_ENABLED;
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700804 spin_unlock_irqrestore(&npinfo->rx_lock, flags);
805 }
806
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700807 if (atomic_dec_and_test(&npinfo->refcnt)) {
808 skb_queue_purge(&npinfo->arp_tx);
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900809 skb_queue_purge(&npinfo->txq);
Jarek Poplawski25442ca2007-07-05 17:42:44 -0700810 cancel_rearming_delayed_work(&npinfo->tx_work);
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700811
Jarek Poplawski17200812007-06-28 22:11:47 -0700812 /* clean after last, unfinished work */
Stephen Hemminger0adc9ad2007-11-19 19:15:03 -0800813 __skb_queue_purge(&npinfo->txq);
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700814 kfree(npinfo);
Satyam Sharma1498b3f2007-07-09 15:22:23 -0700815 np->dev->npinfo = NULL;
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700816 }
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700817 }
Stephen Hemminger93ec2c72006-10-26 15:46:50 -0700818
Jeff Moyer115c1d62005-06-22 22:05:31 -0700819 dev_put(np->dev);
820 }
Jeff Moyerfbeec2e2005-06-22 22:05:59 -0700821
Linus Torvalds1da177e2005-04-16 15:20:36 -0700822 np->dev = NULL;
823}
824
825int netpoll_trap(void)
826{
827 return atomic_read(&trapped);
828}
829
830void netpoll_set_trap(int trap)
831{
832 if (trap)
833 atomic_inc(&trapped);
834 else
835 atomic_dec(&trapped);
836}
837
838EXPORT_SYMBOL(netpoll_set_trap);
839EXPORT_SYMBOL(netpoll_trap);
Satyam Sharma0bcc1812007-08-10 15:35:05 -0700840EXPORT_SYMBOL(netpoll_print_options);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700841EXPORT_SYMBOL(netpoll_parse_options);
842EXPORT_SYMBOL(netpoll_setup);
843EXPORT_SYMBOL(netpoll_cleanup);
844EXPORT_SYMBOL(netpoll_send_udp);
845EXPORT_SYMBOL(netpoll_poll);