blob: 08b9519a24f430a7750d91080f2b8f979f290cbc [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * INET An implementation of the TCP/IP protocol suite for the LINUX
3 * operating system. INET is implemented using the BSD Socket
4 * interface as the means of communication with the user level.
5 *
6 * The IP to API glue.
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09007 *
Linus Torvalds1da177e2005-04-16 15:20:36 -07008 * Authors: see ip.c
9 *
10 * Fixes:
11 * Many : Split from ip.c , see ip.c for history.
12 * Martin Mares : TOS setting fixed.
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +090013 * Alan Cox : Fixed a couple of oopses in Martin's
Linus Torvalds1da177e2005-04-16 15:20:36 -070014 * TOS tweaks.
15 * Mike McLagan : Routing by source
16 */
17
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/module.h>
19#include <linux/types.h>
20#include <linux/mm.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <linux/skbuff.h>
22#include <linux/ip.h>
23#include <linux/icmp.h>
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020024#include <linux/inetdevice.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070025#include <linux/netdevice.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090026#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070027#include <net/sock.h>
28#include <net/ip.h>
29#include <net/icmp.h>
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -080030#include <net/tcp_states.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070031#include <linux/udp.h>
32#include <linux/igmp.h>
33#include <linux/netfilter.h>
34#include <linux/route.h>
35#include <linux/mroute.h>
36#include <net/route.h>
37#include <net/xfrm.h>
David L Stevensdae50292008-04-27 01:06:07 -070038#include <net/compat.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070039#if defined(CONFIG_IPV6) || defined(CONFIG_IPV6_MODULE)
40#include <net/transp_v6.h>
41#endif
42
43#include <linux/errqueue.h>
44#include <asm/uaccess.h>
45
/*
 * Bits stored in inet->cmsg_flags.  Each bit enables one ancillary
 * message on receive; the bit positions follow the order in which
 * ip_cmsg_recv() emits those messages.
 */
#define IP_CMSG_PKTINFO		(1 << 0)
#define IP_CMSG_TTL		(1 << 1)
#define IP_CMSG_TOS		(1 << 2)
#define IP_CMSG_RECVOPTS	(1 << 3)
#define IP_CMSG_RETOPTS		(1 << 4)
#define IP_CMSG_PASSSEC		(1 << 5)
#define IP_CMSG_ORIGDSTADDR	(1 << 6)
Linus Torvalds1da177e2005-04-16 15:20:36 -070053
54/*
55 * SOL_IP control messages.
56 */
57
58static void ip_cmsg_recv_pktinfo(struct msghdr *msg, struct sk_buff *skb)
59{
60 struct in_pktinfo info;
Eric Dumazet511c3f92009-06-02 05:14:27 +000061 struct rtable *rt = skb_rtable(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -070062
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -070063 info.ipi_addr.s_addr = ip_hdr(skb)->daddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -070064 if (rt) {
65 info.ipi_ifindex = rt->rt_iif;
66 info.ipi_spec_dst.s_addr = rt->rt_spec_dst;
67 } else {
68 info.ipi_ifindex = 0;
69 info.ipi_spec_dst.s_addr = 0;
70 }
71
72 put_cmsg(msg, SOL_IP, IP_PKTINFO, sizeof(info), &info);
73}
74
75static void ip_cmsg_recv_ttl(struct msghdr *msg, struct sk_buff *skb)
76{
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -070077 int ttl = ip_hdr(skb)->ttl;
Linus Torvalds1da177e2005-04-16 15:20:36 -070078 put_cmsg(msg, SOL_IP, IP_TTL, sizeof(int), &ttl);
79}
80
81static void ip_cmsg_recv_tos(struct msghdr *msg, struct sk_buff *skb)
82{
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -070083 put_cmsg(msg, SOL_IP, IP_TOS, 1, &ip_hdr(skb)->tos);
Linus Torvalds1da177e2005-04-16 15:20:36 -070084}
85
86static void ip_cmsg_recv_opts(struct msghdr *msg, struct sk_buff *skb)
87{
88 if (IPCB(skb)->opt.optlen == 0)
89 return;
90
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -070091 put_cmsg(msg, SOL_IP, IP_RECVOPTS, IPCB(skb)->opt.optlen,
92 ip_hdr(skb) + 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -070093}
94
95
96static void ip_cmsg_recv_retopts(struct msghdr *msg, struct sk_buff *skb)
97{
98 unsigned char optbuf[sizeof(struct ip_options) + 40];
Jianjun Kong09cb1052008-11-03 00:27:11 -080099 struct ip_options * opt = (struct ip_options *)optbuf;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100
101 if (IPCB(skb)->opt.optlen == 0)
102 return;
103
104 if (ip_options_echo(opt, skb)) {
105 msg->msg_flags |= MSG_CTRUNC;
106 return;
107 }
108 ip_options_undo(opt);
109
110 put_cmsg(msg, SOL_IP, IP_RETOPTS, opt->optlen, opt->__data);
111}
112
Catherine Zhang2c7946a2006-03-20 22:41:23 -0800113static void ip_cmsg_recv_security(struct msghdr *msg, struct sk_buff *skb)
114{
115 char *secdata;
Catherine Zhangdc49c1f2006-08-02 14:12:06 -0700116 u32 seclen, secid;
Catherine Zhang2c7946a2006-03-20 22:41:23 -0800117 int err;
118
Catherine Zhangdc49c1f2006-08-02 14:12:06 -0700119 err = security_socket_getpeersec_dgram(NULL, skb, &secid);
120 if (err)
121 return;
122
123 err = security_secid_to_secctx(secid, &secdata, &seclen);
Catherine Zhang2c7946a2006-03-20 22:41:23 -0800124 if (err)
125 return;
126
127 put_cmsg(msg, SOL_IP, SCM_SECURITY, seclen, secdata);
Catherine Zhangdc49c1f2006-08-02 14:12:06 -0700128 security_release_secctx(secdata, seclen);
Catherine Zhang2c7946a2006-03-20 22:41:23 -0800129}
130
Harvey Harrison21d1a162008-11-20 01:54:27 -0800131static void ip_cmsg_recv_dstaddr(struct msghdr *msg, struct sk_buff *skb)
Balazs Scheidlere8b2dfe2008-11-16 19:32:39 -0800132{
133 struct sockaddr_in sin;
134 struct iphdr *iph = ip_hdr(skb);
Harvey Harrison21d1a162008-11-20 01:54:27 -0800135 __be16 *ports = (__be16 *)skb_transport_header(skb);
Balazs Scheidlere8b2dfe2008-11-16 19:32:39 -0800136
137 if (skb_transport_offset(skb) + 4 > skb->len)
138 return;
139
140 /* All current transport protocols have the port numbers in the
141 * first four bytes of the transport header and this function is
142 * written with this assumption in mind.
143 */
144
145 sin.sin_family = AF_INET;
146 sin.sin_addr.s_addr = iph->daddr;
147 sin.sin_port = ports[1];
148 memset(sin.sin_zero, 0, sizeof(sin.sin_zero));
149
150 put_cmsg(msg, SOL_IP, IP_ORIGDSTADDR, sizeof(sin), &sin);
151}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700152
153void ip_cmsg_recv(struct msghdr *msg, struct sk_buff *skb)
154{
155 struct inet_sock *inet = inet_sk(skb->sk);
156 unsigned flags = inet->cmsg_flags;
157
158 /* Ordered by supposed usage frequency */
159 if (flags & 1)
160 ip_cmsg_recv_pktinfo(msg, skb);
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700161 if ((flags >>= 1) == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700162 return;
163
164 if (flags & 1)
165 ip_cmsg_recv_ttl(msg, skb);
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700166 if ((flags >>= 1) == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167 return;
168
169 if (flags & 1)
170 ip_cmsg_recv_tos(msg, skb);
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700171 if ((flags >>= 1) == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700172 return;
173
174 if (flags & 1)
175 ip_cmsg_recv_opts(msg, skb);
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700176 if ((flags >>= 1) == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700177 return;
178
179 if (flags & 1)
180 ip_cmsg_recv_retopts(msg, skb);
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700181 if ((flags >>= 1) == 0)
Catherine Zhang2c7946a2006-03-20 22:41:23 -0800182 return;
183
184 if (flags & 1)
185 ip_cmsg_recv_security(msg, skb);
Balazs Scheidlere8b2dfe2008-11-16 19:32:39 -0800186
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700187 if ((flags >>= 1) == 0)
Balazs Scheidlere8b2dfe2008-11-16 19:32:39 -0800188 return;
189 if (flags & 1)
190 ip_cmsg_recv_dstaddr(msg, skb);
191
Linus Torvalds1da177e2005-04-16 15:20:36 -0700192}
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700193EXPORT_SYMBOL(ip_cmsg_recv);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700194
Denis V. Lunev7a6adb92008-03-24 15:30:27 -0700195int ip_cmsg_send(struct net *net, struct msghdr *msg, struct ipcm_cookie *ipc)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700196{
197 int err;
198 struct cmsghdr *cmsg;
199
200 for (cmsg = CMSG_FIRSTHDR(msg); cmsg; cmsg = CMSG_NXTHDR(msg, cmsg)) {
201 if (!CMSG_OK(msg, cmsg))
202 return -EINVAL;
203 if (cmsg->cmsg_level != SOL_IP)
204 continue;
205 switch (cmsg->cmsg_type) {
206 case IP_RETOPTS:
207 err = cmsg->cmsg_len - CMSG_ALIGN(sizeof(struct cmsghdr));
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700208 err = ip_options_get(net, &ipc->opt, CMSG_DATA(cmsg),
209 err < 40 ? err : 40);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210 if (err)
211 return err;
212 break;
213 case IP_PKTINFO:
214 {
215 struct in_pktinfo *info;
216 if (cmsg->cmsg_len != CMSG_LEN(sizeof(struct in_pktinfo)))
217 return -EINVAL;
218 info = (struct in_pktinfo *)CMSG_DATA(cmsg);
219 ipc->oif = info->ipi_ifindex;
220 ipc->addr = info->ipi_spec_dst.s_addr;
221 break;
222 }
223 default:
224 return -EINVAL;
225 }
226 }
227 return 0;
228}
229
230
/* Special input handler for packets caught by the router alert option.
   They are selected only by protocol field, and then processed like
   local ones; but only if someone wants them! Otherwise, a router
   not running rsvpd will kill RSVP.

   What to do with them is a user level problem.
   I have no idea how it will masquerade or NAT them (it is a joke, joke :-)),
   but the receiver should be clever enough, e.g., to forward mtrace requests
   sent to a multicast group so that they reach the destination designated
   router.
 */
241struct ip_ra_chain *ip_ra_chain;
Eric Dumazet66018502010-06-07 03:12:08 +0000242static DEFINE_SPINLOCK(ip_ra_lock);
243
244static void ip_ra_free_rcu(struct rcu_head *head)
245{
246 kfree(container_of(head, struct ip_ra_chain, rcu));
247}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700249int ip_ra_control(struct sock *sk, unsigned char on,
250 void (*destructor)(struct sock *))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251{
252 struct ip_ra_chain *ra, *new_ra, **rap;
253
Eric Dumazetc720c7e2009-10-15 06:30:45 +0000254 if (sk->sk_type != SOCK_RAW || inet_sk(sk)->inet_num == IPPROTO_RAW)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255 return -EINVAL;
256
257 new_ra = on ? kmalloc(sizeof(*new_ra), GFP_KERNEL) : NULL;
258
Eric Dumazet66018502010-06-07 03:12:08 +0000259 spin_lock_bh(&ip_ra_lock);
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700260 for (rap = &ip_ra_chain; (ra = *rap) != NULL; rap = &ra->next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261 if (ra->sk == sk) {
262 if (on) {
Eric Dumazet66018502010-06-07 03:12:08 +0000263 spin_unlock_bh(&ip_ra_lock);
Jesper Juhla51482b2005-11-08 09:41:34 -0800264 kfree(new_ra);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700265 return -EADDRINUSE;
266 }
Eric Dumazet66018502010-06-07 03:12:08 +0000267 rcu_assign_pointer(*rap, ra->next);
268 spin_unlock_bh(&ip_ra_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269
270 if (ra->destructor)
271 ra->destructor(sk);
272 sock_put(sk);
Eric Dumazet66018502010-06-07 03:12:08 +0000273 call_rcu(&ra->rcu, ip_ra_free_rcu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700274 return 0;
275 }
276 }
277 if (new_ra == NULL) {
Eric Dumazet66018502010-06-07 03:12:08 +0000278 spin_unlock_bh(&ip_ra_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700279 return -ENOBUFS;
280 }
281 new_ra->sk = sk;
282 new_ra->destructor = destructor;
283
284 new_ra->next = ra;
Eric Dumazet66018502010-06-07 03:12:08 +0000285 rcu_assign_pointer(*rap, new_ra);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286 sock_hold(sk);
Eric Dumazet66018502010-06-07 03:12:08 +0000287 spin_unlock_bh(&ip_ra_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288
289 return 0;
290}
291
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900292void ip_icmp_error(struct sock *sk, struct sk_buff *skb, int err,
Al Viro35986b32006-09-27 18:34:21 -0700293 __be16 port, u32 info, u8 *payload)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700295 struct sock_exterr_skb *serr;
296
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297 skb = skb_clone(skb, GFP_ATOMIC);
298 if (!skb)
299 return;
300
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900301 serr = SKB_EXT_ERR(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700302 serr->ee.ee_errno = err;
303 serr->ee.ee_origin = SO_EE_ORIGIN_ICMP;
Arnaldo Carvalho de Melo88c76642007-03-13 14:43:18 -0300304 serr->ee.ee_type = icmp_hdr(skb)->type;
305 serr->ee.ee_code = icmp_hdr(skb)->code;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700306 serr->ee.ee_pad = 0;
307 serr->ee.ee_info = info;
308 serr->ee.ee_data = 0;
Arnaldo Carvalho de Melo88c76642007-03-13 14:43:18 -0300309 serr->addr_offset = (u8 *)&(((struct iphdr *)(icmp_hdr(skb) + 1))->daddr) -
Arnaldo Carvalho de Melod56f90a2007-04-10 20:50:43 -0700310 skb_network_header(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700311 serr->port = port;
312
Arnaldo Carvalho de Melobd823932007-03-13 17:10:43 -0300313 if (skb_pull(skb, payload - skb->data) != NULL) {
314 skb_reset_transport_header(skb);
315 if (sock_queue_err_skb(sk, skb) == 0)
316 return;
317 }
318 kfree_skb(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700319}
320
Al Viro05790162006-09-27 18:33:40 -0700321void ip_local_error(struct sock *sk, int err, __be32 daddr, __be16 port, u32 info)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700322{
323 struct inet_sock *inet = inet_sk(sk);
324 struct sock_exterr_skb *serr;
325 struct iphdr *iph;
326 struct sk_buff *skb;
327
328 if (!inet->recverr)
329 return;
330
331 skb = alloc_skb(sizeof(struct iphdr), GFP_ATOMIC);
332 if (!skb)
333 return;
334
Arnaldo Carvalho de Melo2ca9e6f2007-03-10 19:15:25 -0300335 skb_put(skb, sizeof(struct iphdr));
336 skb_reset_network_header(skb);
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700337 iph = ip_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700338 iph->daddr = daddr;
339
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900340 serr = SKB_EXT_ERR(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341 serr->ee.ee_errno = err;
342 serr->ee.ee_origin = SO_EE_ORIGIN_LOCAL;
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900343 serr->ee.ee_type = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344 serr->ee.ee_code = 0;
345 serr->ee.ee_pad = 0;
346 serr->ee.ee_info = info;
347 serr->ee.ee_data = 0;
Arnaldo Carvalho de Melod56f90a2007-04-10 20:50:43 -0700348 serr->addr_offset = (u8 *)&iph->daddr - skb_network_header(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349 serr->port = port;
350
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -0700351 __skb_pull(skb, skb_tail_pointer(skb) - skb->data);
Arnaldo Carvalho de Melobd823932007-03-13 17:10:43 -0300352 skb_reset_transport_header(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700353
354 if (sock_queue_err_skb(sk, skb))
355 kfree_skb(skb);
356}
357
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900358/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700359 * Handle MSG_ERRQUEUE
360 */
361int ip_recv_error(struct sock *sk, struct msghdr *msg, int len)
362{
363 struct sock_exterr_skb *serr;
364 struct sk_buff *skb, *skb2;
365 struct sockaddr_in *sin;
366 struct {
367 struct sock_extended_err ee;
368 struct sockaddr_in offender;
369 } errhdr;
370 int err;
371 int copied;
372
373 err = -EAGAIN;
374 skb = skb_dequeue(&sk->sk_error_queue);
375 if (skb == NULL)
376 goto out;
377
378 copied = skb->len;
379 if (copied > len) {
380 msg->msg_flags |= MSG_TRUNC;
381 copied = len;
382 }
383 err = skb_copy_datagram_iovec(skb, 0, msg->msg_iov, copied);
384 if (err)
385 goto out_free_skb;
386
387 sock_recv_timestamp(msg, sk, skb);
388
389 serr = SKB_EXT_ERR(skb);
390
391 sin = (struct sockaddr_in *)msg->msg_name;
392 if (sin) {
393 sin->sin_family = AF_INET;
Arnaldo Carvalho de Melod56f90a2007-04-10 20:50:43 -0700394 sin->sin_addr.s_addr = *(__be32 *)(skb_network_header(skb) +
395 serr->addr_offset);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700396 sin->sin_port = serr->port;
397 memset(&sin->sin_zero, 0, sizeof(sin->sin_zero));
398 }
399
400 memcpy(&errhdr.ee, &serr->ee, sizeof(struct sock_extended_err));
401 sin = &errhdr.offender;
402 sin->sin_family = AF_UNSPEC;
403 if (serr->ee.ee_origin == SO_EE_ORIGIN_ICMP) {
404 struct inet_sock *inet = inet_sk(sk);
405
406 sin->sin_family = AF_INET;
Arnaldo Carvalho de Meloeddc9ec2007-04-20 22:47:35 -0700407 sin->sin_addr.s_addr = ip_hdr(skb)->saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700408 sin->sin_port = 0;
409 memset(&sin->sin_zero, 0, sizeof(sin->sin_zero));
410 if (inet->cmsg_flags)
411 ip_cmsg_recv(msg, skb);
412 }
413
414 put_cmsg(msg, SOL_IP, IP_RECVERR, sizeof(errhdr), &errhdr);
415
416 /* Now we could try to dump offended packet options */
417
418 msg->msg_flags |= MSG_ERRQUEUE;
419 err = copied;
420
421 /* Reset and regenerate socket error */
Herbert Xue0f9f852005-06-18 22:56:18 -0700422 spin_lock_bh(&sk->sk_error_queue.lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700423 sk->sk_err = 0;
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700424 skb2 = skb_peek(&sk->sk_error_queue);
425 if (skb2 != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700426 sk->sk_err = SKB_EXT_ERR(skb2)->ee.ee_errno;
Herbert Xue0f9f852005-06-18 22:56:18 -0700427 spin_unlock_bh(&sk->sk_error_queue.lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700428 sk->sk_error_report(sk);
429 } else
Herbert Xue0f9f852005-06-18 22:56:18 -0700430 spin_unlock_bh(&sk->sk_error_queue.lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700431
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900432out_free_skb:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700433 kfree_skb(skb);
434out:
435 return err;
436}
437
438
439/*
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700440 * Socket option code for IP. This is the end of the line after any
441 * TCP,UDP etc options on an IP socket.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700442 */
443
Dmitry Mishin3fdadf72006-03-20 22:45:21 -0800444static int do_ip_setsockopt(struct sock *sk, int level,
David S. Millerb7058842009-09-30 16:12:20 -0700445 int optname, char __user *optval, unsigned int optlen)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700446{
447 struct inet_sock *inet = inet_sk(sk);
Jianjun Kong09cb1052008-11-03 00:27:11 -0800448 int val = 0, err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700449
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900450 if (((1<<optname) & ((1<<IP_PKTINFO) | (1<<IP_RECVTTL) |
Stephen Hemminger132adf52007-03-08 20:44:43 -0800451 (1<<IP_RECVOPTS) | (1<<IP_RECVTOS) |
452 (1<<IP_RETOPTS) | (1<<IP_TOS) |
453 (1<<IP_TTL) | (1<<IP_HDRINCL) |
454 (1<<IP_MTU_DISCOVER) | (1<<IP_RECVERR) |
455 (1<<IP_ROUTER_ALERT) | (1<<IP_FREEBIND) |
Stephen Hemmingerd218d112010-01-11 16:28:01 -0800456 (1<<IP_PASSSEC) | (1<<IP_TRANSPARENT) |
457 (1<<IP_MINTTL))) ||
Stephen Hemminger132adf52007-03-08 20:44:43 -0800458 optname == IP_MULTICAST_TTL ||
Nivedita Singhvif771bef2009-05-28 07:00:46 +0000459 optname == IP_MULTICAST_ALL ||
Balazs Scheidlere8b2dfe2008-11-16 19:32:39 -0800460 optname == IP_MULTICAST_LOOP ||
461 optname == IP_RECVORIGDSTADDR) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700462 if (optlen >= sizeof(int)) {
463 if (get_user(val, (int __user *) optval))
464 return -EFAULT;
465 } else if (optlen >= sizeof(char)) {
466 unsigned char ucval;
467
468 if (get_user(ucval, (unsigned char __user *) optval))
469 return -EFAULT;
470 val = (int) ucval;
471 }
472 }
473
474 /* If optlen==0, it is equivalent to val == 0 */
475
Pavel Emelyanov6a9fb942007-11-05 21:32:31 -0800476 if (ip_mroute_opt(optname))
Jianjun Kong09cb1052008-11-03 00:27:11 -0800477 return ip_mroute_setsockopt(sk, optname, optval, optlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700478
479 err = 0;
480 lock_sock(sk);
481
482 switch (optname) {
Stephen Hemminger132adf52007-03-08 20:44:43 -0800483 case IP_OPTIONS:
484 {
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700485 struct ip_options *opt = NULL;
roel kluin65a1c4f2009-10-23 05:59:21 +0000486 if (optlen > 40)
Stephen Hemminger132adf52007-03-08 20:44:43 -0800487 goto e_inval;
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900488 err = ip_options_get_from_user(sock_net(sk), &opt,
Denis V. Lunevcb846632008-03-24 15:31:00 -0700489 optval, optlen);
Stephen Hemminger132adf52007-03-08 20:44:43 -0800490 if (err)
491 break;
492 if (inet->is_icsk) {
493 struct inet_connection_sock *icsk = inet_csk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700494#if defined(CONFIG_IPV6) || defined(CONFIG_IPV6_MODULE)
Stephen Hemminger132adf52007-03-08 20:44:43 -0800495 if (sk->sk_family == PF_INET ||
496 (!((1 << sk->sk_state) &
497 (TCPF_LISTEN | TCPF_CLOSE)) &&
Eric Dumazetc720c7e2009-10-15 06:30:45 +0000498 inet->inet_daddr != LOOPBACK4_IPV6)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700499#endif
Stephen Hemminger132adf52007-03-08 20:44:43 -0800500 if (inet->opt)
501 icsk->icsk_ext_hdr_len -= inet->opt->optlen;
502 if (opt)
503 icsk->icsk_ext_hdr_len += opt->optlen;
504 icsk->icsk_sync_mss(sk, icsk->icsk_pmtu_cookie);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700505#if defined(CONFIG_IPV6) || defined(CONFIG_IPV6_MODULE)
Stephen Hemminger132adf52007-03-08 20:44:43 -0800506 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700507#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508 }
Stephen Hemminger132adf52007-03-08 20:44:43 -0800509 opt = xchg(&inet->opt, opt);
510 kfree(opt);
511 break;
512 }
513 case IP_PKTINFO:
514 if (val)
515 inet->cmsg_flags |= IP_CMSG_PKTINFO;
516 else
517 inet->cmsg_flags &= ~IP_CMSG_PKTINFO;
518 break;
519 case IP_RECVTTL:
520 if (val)
521 inet->cmsg_flags |= IP_CMSG_TTL;
522 else
523 inet->cmsg_flags &= ~IP_CMSG_TTL;
524 break;
525 case IP_RECVTOS:
526 if (val)
527 inet->cmsg_flags |= IP_CMSG_TOS;
528 else
529 inet->cmsg_flags &= ~IP_CMSG_TOS;
530 break;
531 case IP_RECVOPTS:
532 if (val)
533 inet->cmsg_flags |= IP_CMSG_RECVOPTS;
534 else
535 inet->cmsg_flags &= ~IP_CMSG_RECVOPTS;
536 break;
537 case IP_RETOPTS:
538 if (val)
539 inet->cmsg_flags |= IP_CMSG_RETOPTS;
540 else
541 inet->cmsg_flags &= ~IP_CMSG_RETOPTS;
542 break;
543 case IP_PASSSEC:
544 if (val)
545 inet->cmsg_flags |= IP_CMSG_PASSSEC;
546 else
547 inet->cmsg_flags &= ~IP_CMSG_PASSSEC;
548 break;
Balazs Scheidlere8b2dfe2008-11-16 19:32:39 -0800549 case IP_RECVORIGDSTADDR:
550 if (val)
551 inet->cmsg_flags |= IP_CMSG_ORIGDSTADDR;
552 else
553 inet->cmsg_flags &= ~IP_CMSG_ORIGDSTADDR;
554 break;
Stephen Hemminger132adf52007-03-08 20:44:43 -0800555 case IP_TOS: /* This sets both TOS and Precedence */
556 if (sk->sk_type == SOCK_STREAM) {
557 val &= ~3;
558 val |= inet->tos & 3;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700559 }
Stephen Hemminger132adf52007-03-08 20:44:43 -0800560 if (inet->tos != val) {
561 inet->tos = val;
562 sk->sk_priority = rt_tos2priority(val);
563 sk_dst_reset(sk);
564 }
565 break;
566 case IP_TTL:
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700567 if (optlen < 1)
Stephen Hemminger132adf52007-03-08 20:44:43 -0800568 goto e_inval;
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700569 if (val != -1 && (val < 0 || val > 255))
Stephen Hemminger132adf52007-03-08 20:44:43 -0800570 goto e_inval;
571 inet->uc_ttl = val;
572 break;
573 case IP_HDRINCL:
574 if (sk->sk_type != SOCK_RAW) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700575 err = -ENOPROTOOPT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700576 break;
Stephen Hemminger132adf52007-03-08 20:44:43 -0800577 }
578 inet->hdrincl = val ? 1 : 0;
579 break;
580 case IP_MTU_DISCOVER:
John Dykstra0eae7502009-10-19 21:53:53 -0700581 if (val < IP_PMTUDISC_DONT || val > IP_PMTUDISC_PROBE)
Stephen Hemminger132adf52007-03-08 20:44:43 -0800582 goto e_inval;
583 inet->pmtudisc = val;
584 break;
585 case IP_RECVERR:
586 inet->recverr = !!val;
587 if (!val)
588 skb_queue_purge(&sk->sk_error_queue);
589 break;
590 case IP_MULTICAST_TTL:
591 if (sk->sk_type == SOCK_STREAM)
592 goto e_inval;
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700593 if (optlen < 1)
Stephen Hemminger132adf52007-03-08 20:44:43 -0800594 goto e_inval;
Jianjun Kong09cb1052008-11-03 00:27:11 -0800595 if (val == -1)
Stephen Hemminger132adf52007-03-08 20:44:43 -0800596 val = 1;
597 if (val < 0 || val > 255)
598 goto e_inval;
599 inet->mc_ttl = val;
600 break;
601 case IP_MULTICAST_LOOP:
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700602 if (optlen < 1)
Stephen Hemminger132adf52007-03-08 20:44:43 -0800603 goto e_inval;
604 inet->mc_loop = !!val;
605 break;
606 case IP_MULTICAST_IF:
607 {
608 struct ip_mreqn mreq;
609 struct net_device *dev = NULL;
610
611 if (sk->sk_type == SOCK_STREAM)
612 goto e_inval;
613 /*
614 * Check the arguments are allowable
615 */
616
Shan Wei09159212009-09-22 15:41:10 +0000617 if (optlen < sizeof(struct in_addr))
618 goto e_inval;
619
Stephen Hemminger132adf52007-03-08 20:44:43 -0800620 err = -EFAULT;
621 if (optlen >= sizeof(struct ip_mreqn)) {
Jianjun Kong09cb1052008-11-03 00:27:11 -0800622 if (copy_from_user(&mreq, optval, sizeof(mreq)))
Stephen Hemminger132adf52007-03-08 20:44:43 -0800623 break;
624 } else {
625 memset(&mreq, 0, sizeof(mreq));
626 if (optlen >= sizeof(struct in_addr) &&
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700627 copy_from_user(&mreq.imr_address, optval,
628 sizeof(struct in_addr)))
Stephen Hemminger132adf52007-03-08 20:44:43 -0800629 break;
630 }
631
632 if (!mreq.imr_ifindex) {
Al Viroe6f1ceb2008-03-17 22:44:53 -0700633 if (mreq.imr_address.s_addr == htonl(INADDR_ANY)) {
Stephen Hemminger132adf52007-03-08 20:44:43 -0800634 inet->mc_index = 0;
635 inet->mc_addr = 0;
636 err = 0;
637 break;
638 }
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900639 dev = ip_dev_find(sock_net(sk), mreq.imr_address.s_addr);
Eric Dumazet55b80502009-10-19 06:41:58 +0000640 if (dev)
Stephen Hemminger132adf52007-03-08 20:44:43 -0800641 mreq.imr_ifindex = dev->ifindex;
Stephen Hemminger132adf52007-03-08 20:44:43 -0800642 } else
Eric Dumazet55b80502009-10-19 06:41:58 +0000643 dev = dev_get_by_index(sock_net(sk), mreq.imr_ifindex);
Stephen Hemminger132adf52007-03-08 20:44:43 -0800644
645
646 err = -EADDRNOTAVAIL;
647 if (!dev)
648 break;
Eric Dumazet55b80502009-10-19 06:41:58 +0000649 dev_put(dev);
Stephen Hemminger132adf52007-03-08 20:44:43 -0800650
651 err = -EINVAL;
652 if (sk->sk_bound_dev_if &&
653 mreq.imr_ifindex != sk->sk_bound_dev_if)
654 break;
655
656 inet->mc_index = mreq.imr_ifindex;
657 inet->mc_addr = mreq.imr_address.s_addr;
658 err = 0;
659 break;
660 }
661
662 case IP_ADD_MEMBERSHIP:
663 case IP_DROP_MEMBERSHIP:
664 {
665 struct ip_mreqn mreq;
666
Flavio Leitnera96fb492007-08-24 22:16:39 -0700667 err = -EPROTO;
668 if (inet_sk(sk)->is_icsk)
669 break;
670
Stephen Hemminger132adf52007-03-08 20:44:43 -0800671 if (optlen < sizeof(struct ip_mreq))
672 goto e_inval;
673 err = -EFAULT;
674 if (optlen >= sizeof(struct ip_mreqn)) {
Jianjun Kong09cb1052008-11-03 00:27:11 -0800675 if (copy_from_user(&mreq, optval, sizeof(mreq)))
Stephen Hemminger132adf52007-03-08 20:44:43 -0800676 break;
677 } else {
678 memset(&mreq, 0, sizeof(mreq));
Jianjun Kong09cb1052008-11-03 00:27:11 -0800679 if (copy_from_user(&mreq, optval, sizeof(struct ip_mreq)))
Stephen Hemminger132adf52007-03-08 20:44:43 -0800680 break;
681 }
682
683 if (optname == IP_ADD_MEMBERSHIP)
684 err = ip_mc_join_group(sk, &mreq);
685 else
686 err = ip_mc_leave_group(sk, &mreq);
687 break;
688 }
689 case IP_MSFILTER:
690 {
Stephen Hemminger132adf52007-03-08 20:44:43 -0800691 struct ip_msfilter *msf;
692
693 if (optlen < IP_MSFILTER_SIZE(0))
694 goto e_inval;
695 if (optlen > sysctl_optmem_max) {
696 err = -ENOBUFS;
697 break;
698 }
699 msf = kmalloc(optlen, GFP_KERNEL);
Stephen Hemmingercfcabdc2007-10-09 01:59:42 -0700700 if (!msf) {
Stephen Hemminger132adf52007-03-08 20:44:43 -0800701 err = -ENOBUFS;
702 break;
703 }
704 err = -EFAULT;
705 if (copy_from_user(msf, optval, optlen)) {
706 kfree(msf);
707 break;
708 }
709 /* numsrc >= (1G-4) overflow in 32 bits */
710 if (msf->imsf_numsrc >= 0x3ffffffcU ||
711 msf->imsf_numsrc > sysctl_igmp_max_msf) {
712 kfree(msf);
713 err = -ENOBUFS;
714 break;
715 }
716 if (IP_MSFILTER_SIZE(msf->imsf_numsrc) > optlen) {
717 kfree(msf);
718 err = -EINVAL;
719 break;
720 }
721 err = ip_mc_msfilter(sk, msf, 0);
722 kfree(msf);
723 break;
724 }
725 case IP_BLOCK_SOURCE:
726 case IP_UNBLOCK_SOURCE:
727 case IP_ADD_SOURCE_MEMBERSHIP:
728 case IP_DROP_SOURCE_MEMBERSHIP:
729 {
730 struct ip_mreq_source mreqs;
731 int omode, add;
732
733 if (optlen != sizeof(struct ip_mreq_source))
734 goto e_inval;
735 if (copy_from_user(&mreqs, optval, sizeof(mreqs))) {
736 err = -EFAULT;
737 break;
738 }
739 if (optname == IP_BLOCK_SOURCE) {
740 omode = MCAST_EXCLUDE;
741 add = 1;
742 } else if (optname == IP_UNBLOCK_SOURCE) {
743 omode = MCAST_EXCLUDE;
744 add = 0;
745 } else if (optname == IP_ADD_SOURCE_MEMBERSHIP) {
746 struct ip_mreqn mreq;
747
748 mreq.imr_multiaddr.s_addr = mreqs.imr_multiaddr;
749 mreq.imr_address.s_addr = mreqs.imr_interface;
750 mreq.imr_ifindex = 0;
751 err = ip_mc_join_group(sk, &mreq);
752 if (err && err != -EADDRINUSE)
753 break;
754 omode = MCAST_INCLUDE;
755 add = 1;
756 } else /* IP_DROP_SOURCE_MEMBERSHIP */ {
757 omode = MCAST_INCLUDE;
758 add = 0;
759 }
760 err = ip_mc_source(add, omode, sk, &mreqs, 0);
761 break;
762 }
763 case MCAST_JOIN_GROUP:
764 case MCAST_LEAVE_GROUP:
765 {
766 struct group_req greq;
767 struct sockaddr_in *psin;
768 struct ip_mreqn mreq;
769
770 if (optlen < sizeof(struct group_req))
771 goto e_inval;
772 err = -EFAULT;
773 if (copy_from_user(&greq, optval, sizeof(greq)))
774 break;
775 psin = (struct sockaddr_in *)&greq.gr_group;
776 if (psin->sin_family != AF_INET)
777 goto e_inval;
778 memset(&mreq, 0, sizeof(mreq));
779 mreq.imr_multiaddr = psin->sin_addr;
780 mreq.imr_ifindex = greq.gr_interface;
781
782 if (optname == MCAST_JOIN_GROUP)
783 err = ip_mc_join_group(sk, &mreq);
784 else
785 err = ip_mc_leave_group(sk, &mreq);
786 break;
787 }
788 case MCAST_JOIN_SOURCE_GROUP:
789 case MCAST_LEAVE_SOURCE_GROUP:
790 case MCAST_BLOCK_SOURCE:
791 case MCAST_UNBLOCK_SOURCE:
792 {
793 struct group_source_req greqs;
794 struct ip_mreq_source mreqs;
795 struct sockaddr_in *psin;
796 int omode, add;
797
798 if (optlen != sizeof(struct group_source_req))
799 goto e_inval;
800 if (copy_from_user(&greqs, optval, sizeof(greqs))) {
801 err = -EFAULT;
802 break;
803 }
804 if (greqs.gsr_group.ss_family != AF_INET ||
805 greqs.gsr_source.ss_family != AF_INET) {
806 err = -EADDRNOTAVAIL;
807 break;
808 }
809 psin = (struct sockaddr_in *)&greqs.gsr_group;
810 mreqs.imr_multiaddr = psin->sin_addr.s_addr;
811 psin = (struct sockaddr_in *)&greqs.gsr_source;
812 mreqs.imr_sourceaddr = psin->sin_addr.s_addr;
813 mreqs.imr_interface = 0; /* use index for mc_source */
814
815 if (optname == MCAST_BLOCK_SOURCE) {
816 omode = MCAST_EXCLUDE;
817 add = 1;
818 } else if (optname == MCAST_UNBLOCK_SOURCE) {
819 omode = MCAST_EXCLUDE;
820 add = 0;
821 } else if (optname == MCAST_JOIN_SOURCE_GROUP) {
822 struct ip_mreqn mreq;
823
824 psin = (struct sockaddr_in *)&greqs.gsr_group;
825 mreq.imr_multiaddr = psin->sin_addr;
826 mreq.imr_address.s_addr = 0;
827 mreq.imr_ifindex = greqs.gsr_interface;
828 err = ip_mc_join_group(sk, &mreq);
829 if (err && err != -EADDRINUSE)
830 break;
831 greqs.gsr_interface = mreq.imr_ifindex;
832 omode = MCAST_INCLUDE;
833 add = 1;
834 } else /* MCAST_LEAVE_SOURCE_GROUP */ {
835 omode = MCAST_INCLUDE;
836 add = 0;
837 }
838 err = ip_mc_source(add, omode, sk, &mreqs,
839 greqs.gsr_interface);
840 break;
841 }
842 case MCAST_MSFILTER:
843 {
Stephen Hemminger132adf52007-03-08 20:44:43 -0800844 struct sockaddr_in *psin;
845 struct ip_msfilter *msf = NULL;
846 struct group_filter *gsf = NULL;
847 int msize, i, ifindex;
848
849 if (optlen < GROUP_FILTER_SIZE(0))
850 goto e_inval;
851 if (optlen > sysctl_optmem_max) {
852 err = -ENOBUFS;
853 break;
854 }
Jianjun Kong09cb1052008-11-03 00:27:11 -0800855 gsf = kmalloc(optlen, GFP_KERNEL);
Stephen Hemmingercfcabdc2007-10-09 01:59:42 -0700856 if (!gsf) {
Stephen Hemminger132adf52007-03-08 20:44:43 -0800857 err = -ENOBUFS;
858 break;
859 }
860 err = -EFAULT;
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700861 if (copy_from_user(gsf, optval, optlen))
Stephen Hemminger132adf52007-03-08 20:44:43 -0800862 goto mc_msf_out;
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700863
Stephen Hemminger132adf52007-03-08 20:44:43 -0800864 /* numsrc >= (4G-140)/128 overflow in 32 bits */
865 if (gsf->gf_numsrc >= 0x1ffffff ||
866 gsf->gf_numsrc > sysctl_igmp_max_msf) {
867 err = -ENOBUFS;
868 goto mc_msf_out;
869 }
870 if (GROUP_FILTER_SIZE(gsf->gf_numsrc) > optlen) {
871 err = -EINVAL;
872 goto mc_msf_out;
873 }
874 msize = IP_MSFILTER_SIZE(gsf->gf_numsrc);
Jianjun Kong09cb1052008-11-03 00:27:11 -0800875 msf = kmalloc(msize, GFP_KERNEL);
Stephen Hemmingercfcabdc2007-10-09 01:59:42 -0700876 if (!msf) {
Stephen Hemminger132adf52007-03-08 20:44:43 -0800877 err = -ENOBUFS;
878 goto mc_msf_out;
879 }
880 ifindex = gsf->gf_interface;
881 psin = (struct sockaddr_in *)&gsf->gf_group;
882 if (psin->sin_family != AF_INET) {
883 err = -EADDRNOTAVAIL;
884 goto mc_msf_out;
885 }
886 msf->imsf_multiaddr = psin->sin_addr.s_addr;
887 msf->imsf_interface = 0;
888 msf->imsf_fmode = gsf->gf_fmode;
889 msf->imsf_numsrc = gsf->gf_numsrc;
890 err = -EADDRNOTAVAIL;
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700891 for (i = 0; i < gsf->gf_numsrc; ++i) {
Stephen Hemminger132adf52007-03-08 20:44:43 -0800892 psin = (struct sockaddr_in *)&gsf->gf_slist[i];
893
894 if (psin->sin_family != AF_INET)
895 goto mc_msf_out;
896 msf->imsf_slist[i] = psin->sin_addr.s_addr;
897 }
898 kfree(gsf);
899 gsf = NULL;
900
901 err = ip_mc_msfilter(sk, msf, ifindex);
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700902mc_msf_out:
Stephen Hemminger132adf52007-03-08 20:44:43 -0800903 kfree(msf);
904 kfree(gsf);
905 break;
906 }
Nivedita Singhvif771bef2009-05-28 07:00:46 +0000907 case IP_MULTICAST_ALL:
908 if (optlen < 1)
909 goto e_inval;
910 if (val != 0 && val != 1)
911 goto e_inval;
912 inet->mc_all = val;
913 break;
Stephen Hemminger132adf52007-03-08 20:44:43 -0800914 case IP_ROUTER_ALERT:
915 err = ip_ra_control(sk, val ? 1 : 0, NULL);
916 break;
917
918 case IP_FREEBIND:
Eric Dumazet4d52cfb2009-06-02 00:42:16 -0700919 if (optlen < 1)
Stephen Hemminger132adf52007-03-08 20:44:43 -0800920 goto e_inval;
921 inet->freebind = !!val;
922 break;
923
924 case IP_IPSEC_POLICY:
925 case IP_XFRM_POLICY:
926 err = -EPERM;
927 if (!capable(CAP_NET_ADMIN))
928 break;
929 err = xfrm_user_policy(sk, optname, optval, optlen);
930 break;
931
KOVACS Krisztianf5715ae2008-10-01 07:30:02 -0700932 case IP_TRANSPARENT:
933 if (!capable(CAP_NET_ADMIN)) {
934 err = -EPERM;
935 break;
936 }
937 if (optlen < 1)
938 goto e_inval;
939 inet->transparent = !!val;
940 break;
941
Stephen Hemmingerd218d112010-01-11 16:28:01 -0800942 case IP_MINTTL:
943 if (optlen < 1)
944 goto e_inval;
945 if (val < 0 || val > 255)
946 goto e_inval;
947 inet->min_ttl = val;
948 break;
949
Stephen Hemminger132adf52007-03-08 20:44:43 -0800950 default:
951 err = -ENOPROTOOPT;
952 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700953 }
954 release_sock(sk);
955 return err;
956
957e_inval:
958 release_sock(sk);
959 return -EINVAL;
960}
961
Eric Dumazetf84af322010-04-28 15:31:51 -0700962/**
963 * ip_queue_rcv_skb - Queue an skb into sock receive queue
964 * @sk: socket
965 * @skb: buffer
966 *
967 * Queues an skb into socket receive queue. If IP_CMSG_PKTINFO option
968 * is not set, we drop skb dst entry now, while dst cache line is hot.
969 */
970int ip_queue_rcv_skb(struct sock *sk, struct sk_buff *skb)
971{
972 if (!(inet_sk(sk)->cmsg_flags & IP_CMSG_PKTINFO))
973 skb_dst_drop(skb);
974 return sock_queue_rcv_skb(sk, skb);
975}
976EXPORT_SYMBOL(ip_queue_rcv_skb);
977
Dmitry Mishin3fdadf72006-03-20 22:45:21 -0800978int ip_setsockopt(struct sock *sk, int level,
David S. Millerb7058842009-09-30 16:12:20 -0700979 int optname, char __user *optval, unsigned int optlen)
Dmitry Mishin3fdadf72006-03-20 22:45:21 -0800980{
981 int err;
982
983 if (level != SOL_IP)
984 return -ENOPROTOOPT;
985
986 err = do_ip_setsockopt(sk, level, optname, optval, optlen);
987#ifdef CONFIG_NETFILTER
988 /* we need to exclude all possible ENOPROTOOPTs except default case */
989 if (err == -ENOPROTOOPT && optname != IP_HDRINCL &&
Pavel Emelyanov6a9fb942007-11-05 21:32:31 -0800990 optname != IP_IPSEC_POLICY &&
991 optname != IP_XFRM_POLICY &&
992 !ip_mroute_opt(optname)) {
Dmitry Mishin3fdadf72006-03-20 22:45:21 -0800993 lock_sock(sk);
994 err = nf_setsockopt(sk, PF_INET, optname, optval, optlen);
995 release_sock(sk);
996 }
997#endif
998 return err;
999}
Eric Dumazet4d52cfb2009-06-02 00:42:16 -07001000EXPORT_SYMBOL(ip_setsockopt);
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001001
1002#ifdef CONFIG_COMPAT
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001003int compat_ip_setsockopt(struct sock *sk, int level, int optname,
David S. Millerb7058842009-09-30 16:12:20 -07001004 char __user *optval, unsigned int optlen)
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001005{
1006 int err;
1007
1008 if (level != SOL_IP)
1009 return -ENOPROTOOPT;
1010
David L Stevensdae50292008-04-27 01:06:07 -07001011 if (optname >= MCAST_JOIN_GROUP && optname <= MCAST_MSFILTER)
1012 return compat_mc_setsockopt(sk, level, optname, optval, optlen,
1013 ip_setsockopt);
1014
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001015 err = do_ip_setsockopt(sk, level, optname, optval, optlen);
1016#ifdef CONFIG_NETFILTER
1017 /* we need to exclude all possible ENOPROTOOPTs except default case */
1018 if (err == -ENOPROTOOPT && optname != IP_HDRINCL &&
Pavel Emelyanov6a9fb942007-11-05 21:32:31 -08001019 optname != IP_IPSEC_POLICY &&
1020 optname != IP_XFRM_POLICY &&
1021 !ip_mroute_opt(optname)) {
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001022 lock_sock(sk);
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001023 err = compat_nf_setsockopt(sk, PF_INET, optname,
1024 optval, optlen);
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001025 release_sock(sk);
1026 }
1027#endif
1028 return err;
1029}
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001030EXPORT_SYMBOL(compat_ip_setsockopt);
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001031#endif
1032
Linus Torvalds1da177e2005-04-16 15:20:36 -07001033/*
Eric Dumazet4d52cfb2009-06-02 00:42:16 -07001034 * Get the options. Note for future reference. The GET of IP options gets
1035 * the _received_ ones. The set sets the _sent_ ones.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001036 */
1037
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001038static int do_ip_getsockopt(struct sock *sk, int level, int optname,
Stephen Hemminger132adf52007-03-08 20:44:43 -08001039 char __user *optval, int __user *optlen)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001040{
1041 struct inet_sock *inet = inet_sk(sk);
1042 int val;
1043 int len;
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001044
Stephen Hemminger132adf52007-03-08 20:44:43 -08001045 if (level != SOL_IP)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001046 return -EOPNOTSUPP;
1047
Pavel Emelyanov6a9fb942007-11-05 21:32:31 -08001048 if (ip_mroute_opt(optname))
Jianjun Kong09cb1052008-11-03 00:27:11 -08001049 return ip_mroute_getsockopt(sk, optname, optval, optlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001050
Jianjun Kong09cb1052008-11-03 00:27:11 -08001051 if (get_user(len, optlen))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001052 return -EFAULT;
Stephen Hemminger132adf52007-03-08 20:44:43 -08001053 if (len < 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001054 return -EINVAL;
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001055
Linus Torvalds1da177e2005-04-16 15:20:36 -07001056 lock_sock(sk);
1057
Stephen Hemminger132adf52007-03-08 20:44:43 -08001058 switch (optname) {
1059 case IP_OPTIONS:
1060 {
1061 unsigned char optbuf[sizeof(struct ip_options)+40];
Jianjun Kong09cb1052008-11-03 00:27:11 -08001062 struct ip_options * opt = (struct ip_options *)optbuf;
Stephen Hemminger132adf52007-03-08 20:44:43 -08001063 opt->optlen = 0;
1064 if (inet->opt)
1065 memcpy(optbuf, inet->opt,
1066 sizeof(struct ip_options)+
1067 inet->opt->optlen);
1068 release_sock(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001069
Stephen Hemminger132adf52007-03-08 20:44:43 -08001070 if (opt->optlen == 0)
1071 return put_user(0, optlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001072
Stephen Hemminger132adf52007-03-08 20:44:43 -08001073 ip_options_undo(opt);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001074
Stephen Hemminger132adf52007-03-08 20:44:43 -08001075 len = min_t(unsigned int, len, opt->optlen);
1076 if (put_user(len, optlen))
1077 return -EFAULT;
1078 if (copy_to_user(optval, opt->__data, len))
1079 return -EFAULT;
1080 return 0;
1081 }
1082 case IP_PKTINFO:
1083 val = (inet->cmsg_flags & IP_CMSG_PKTINFO) != 0;
1084 break;
1085 case IP_RECVTTL:
1086 val = (inet->cmsg_flags & IP_CMSG_TTL) != 0;
1087 break;
1088 case IP_RECVTOS:
1089 val = (inet->cmsg_flags & IP_CMSG_TOS) != 0;
1090 break;
1091 case IP_RECVOPTS:
1092 val = (inet->cmsg_flags & IP_CMSG_RECVOPTS) != 0;
1093 break;
1094 case IP_RETOPTS:
1095 val = (inet->cmsg_flags & IP_CMSG_RETOPTS) != 0;
1096 break;
1097 case IP_PASSSEC:
1098 val = (inet->cmsg_flags & IP_CMSG_PASSSEC) != 0;
1099 break;
Balazs Scheidlere8b2dfe2008-11-16 19:32:39 -08001100 case IP_RECVORIGDSTADDR:
1101 val = (inet->cmsg_flags & IP_CMSG_ORIGDSTADDR) != 0;
1102 break;
Stephen Hemminger132adf52007-03-08 20:44:43 -08001103 case IP_TOS:
1104 val = inet->tos;
1105 break;
1106 case IP_TTL:
1107 val = (inet->uc_ttl == -1 ?
1108 sysctl_ip_default_ttl :
1109 inet->uc_ttl);
1110 break;
1111 case IP_HDRINCL:
1112 val = inet->hdrincl;
1113 break;
1114 case IP_MTU_DISCOVER:
1115 val = inet->pmtudisc;
1116 break;
1117 case IP_MTU:
1118 {
1119 struct dst_entry *dst;
1120 val = 0;
1121 dst = sk_dst_get(sk);
1122 if (dst) {
1123 val = dst_mtu(dst);
1124 dst_release(dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001125 }
Stephen Hemminger132adf52007-03-08 20:44:43 -08001126 if (!val) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001127 release_sock(sk);
Stephen Hemminger132adf52007-03-08 20:44:43 -08001128 return -ENOTCONN;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001129 }
Stephen Hemminger132adf52007-03-08 20:44:43 -08001130 break;
1131 }
1132 case IP_RECVERR:
1133 val = inet->recverr;
1134 break;
1135 case IP_MULTICAST_TTL:
1136 val = inet->mc_ttl;
1137 break;
1138 case IP_MULTICAST_LOOP:
1139 val = inet->mc_loop;
1140 break;
1141 case IP_MULTICAST_IF:
1142 {
1143 struct in_addr addr;
1144 len = min_t(unsigned int, len, sizeof(struct in_addr));
1145 addr.s_addr = inet->mc_addr;
1146 release_sock(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001147
Stephen Hemminger132adf52007-03-08 20:44:43 -08001148 if (put_user(len, optlen))
1149 return -EFAULT;
1150 if (copy_to_user(optval, &addr, len))
1151 return -EFAULT;
1152 return 0;
1153 }
1154 case IP_MSFILTER:
1155 {
1156 struct ip_msfilter msf;
1157 int err;
1158
1159 if (len < IP_MSFILTER_SIZE(0)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001160 release_sock(sk);
Stephen Hemminger132adf52007-03-08 20:44:43 -08001161 return -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001162 }
Stephen Hemminger132adf52007-03-08 20:44:43 -08001163 if (copy_from_user(&msf, optval, IP_MSFILTER_SIZE(0))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001164 release_sock(sk);
Stephen Hemminger132adf52007-03-08 20:44:43 -08001165 return -EFAULT;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001166 }
Stephen Hemminger132adf52007-03-08 20:44:43 -08001167 err = ip_mc_msfget(sk, &msf,
1168 (struct ip_msfilter __user *)optval, optlen);
1169 release_sock(sk);
1170 return err;
1171 }
1172 case MCAST_MSFILTER:
1173 {
1174 struct group_filter gsf;
1175 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001176
Stephen Hemminger132adf52007-03-08 20:44:43 -08001177 if (len < GROUP_FILTER_SIZE(0)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001178 release_sock(sk);
Stephen Hemminger132adf52007-03-08 20:44:43 -08001179 return -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001180 }
Stephen Hemminger132adf52007-03-08 20:44:43 -08001181 if (copy_from_user(&gsf, optval, GROUP_FILTER_SIZE(0))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001182 release_sock(sk);
Stephen Hemminger132adf52007-03-08 20:44:43 -08001183 return -EFAULT;
1184 }
1185 err = ip_mc_gsfget(sk, &gsf,
Eric Dumazet4d52cfb2009-06-02 00:42:16 -07001186 (struct group_filter __user *)optval,
1187 optlen);
Stephen Hemminger132adf52007-03-08 20:44:43 -08001188 release_sock(sk);
1189 return err;
1190 }
Nivedita Singhvif771bef2009-05-28 07:00:46 +00001191 case IP_MULTICAST_ALL:
1192 val = inet->mc_all;
1193 break;
Stephen Hemminger132adf52007-03-08 20:44:43 -08001194 case IP_PKTOPTIONS:
1195 {
1196 struct msghdr msg;
1197
1198 release_sock(sk);
1199
1200 if (sk->sk_type != SOCK_STREAM)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001201 return -ENOPROTOOPT;
Stephen Hemminger132adf52007-03-08 20:44:43 -08001202
1203 msg.msg_control = optval;
1204 msg.msg_controllen = len;
1205 msg.msg_flags = 0;
1206
1207 if (inet->cmsg_flags & IP_CMSG_PKTINFO) {
1208 struct in_pktinfo info;
1209
Eric Dumazetc720c7e2009-10-15 06:30:45 +00001210 info.ipi_addr.s_addr = inet->inet_rcv_saddr;
1211 info.ipi_spec_dst.s_addr = inet->inet_rcv_saddr;
Stephen Hemminger132adf52007-03-08 20:44:43 -08001212 info.ipi_ifindex = inet->mc_index;
1213 put_cmsg(&msg, SOL_IP, IP_PKTINFO, sizeof(info), &info);
1214 }
1215 if (inet->cmsg_flags & IP_CMSG_TTL) {
1216 int hlim = inet->mc_ttl;
1217 put_cmsg(&msg, SOL_IP, IP_TTL, sizeof(hlim), &hlim);
1218 }
1219 len -= msg.msg_controllen;
1220 return put_user(len, optlen);
1221 }
1222 case IP_FREEBIND:
1223 val = inet->freebind;
1224 break;
KOVACS Krisztianf5715ae2008-10-01 07:30:02 -07001225 case IP_TRANSPARENT:
1226 val = inet->transparent;
1227 break;
Stephen Hemmingerd218d112010-01-11 16:28:01 -08001228 case IP_MINTTL:
1229 val = inet->min_ttl;
1230 break;
Stephen Hemminger132adf52007-03-08 20:44:43 -08001231 default:
1232 release_sock(sk);
1233 return -ENOPROTOOPT;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001234 }
1235 release_sock(sk);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001236
Eric Dumazet4d52cfb2009-06-02 00:42:16 -07001237 if (len < sizeof(int) && len > 0 && val >= 0 && val <= 255) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001238 unsigned char ucval = (unsigned char)val;
1239 len = 1;
Stephen Hemminger132adf52007-03-08 20:44:43 -08001240 if (put_user(len, optlen))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001241 return -EFAULT;
Jianjun Kong09cb1052008-11-03 00:27:11 -08001242 if (copy_to_user(optval, &ucval, 1))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001243 return -EFAULT;
1244 } else {
1245 len = min_t(unsigned int, sizeof(int), len);
Stephen Hemminger132adf52007-03-08 20:44:43 -08001246 if (put_user(len, optlen))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001247 return -EFAULT;
Jianjun Kong09cb1052008-11-03 00:27:11 -08001248 if (copy_to_user(optval, &val, len))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001249 return -EFAULT;
1250 }
1251 return 0;
1252}
1253
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001254int ip_getsockopt(struct sock *sk, int level,
Stephen Hemminger132adf52007-03-08 20:44:43 -08001255 int optname, char __user *optval, int __user *optlen)
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001256{
1257 int err;
1258
1259 err = do_ip_getsockopt(sk, level, optname, optval, optlen);
1260#ifdef CONFIG_NETFILTER
1261 /* we need to exclude all possible ENOPROTOOPTs except default case */
Pavel Emelyanov6a9fb942007-11-05 21:32:31 -08001262 if (err == -ENOPROTOOPT && optname != IP_PKTOPTIONS &&
1263 !ip_mroute_opt(optname)) {
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001264 int len;
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001265
Jianjun Kong09cb1052008-11-03 00:27:11 -08001266 if (get_user(len, optlen))
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001267 return -EFAULT;
1268
1269 lock_sock(sk);
1270 err = nf_getsockopt(sk, PF_INET, optname, optval,
1271 &len);
1272 release_sock(sk);
1273 if (err >= 0)
1274 err = put_user(len, optlen);
1275 return err;
1276 }
1277#endif
1278 return err;
1279}
Eric Dumazet4d52cfb2009-06-02 00:42:16 -07001280EXPORT_SYMBOL(ip_getsockopt);
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001281
1282#ifdef CONFIG_COMPAT
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001283int compat_ip_getsockopt(struct sock *sk, int level, int optname,
1284 char __user *optval, int __user *optlen)
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001285{
David L Stevens42908c62008-04-29 03:23:22 -07001286 int err;
1287
1288 if (optname == MCAST_MSFILTER)
1289 return compat_mc_getsockopt(sk, level, optname, optval, optlen,
1290 ip_getsockopt);
1291
1292 err = do_ip_getsockopt(sk, level, optname, optval, optlen);
1293
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001294#ifdef CONFIG_NETFILTER
1295 /* we need to exclude all possible ENOPROTOOPTs except default case */
Pavel Emelyanov6a9fb942007-11-05 21:32:31 -08001296 if (err == -ENOPROTOOPT && optname != IP_PKTOPTIONS &&
1297 !ip_mroute_opt(optname)) {
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001298 int len;
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001299
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001300 if (get_user(len, optlen))
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001301 return -EFAULT;
1302
1303 lock_sock(sk);
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001304 err = compat_nf_getsockopt(sk, PF_INET, optname, optval, &len);
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001305 release_sock(sk);
1306 if (err >= 0)
1307 err = put_user(len, optlen);
1308 return err;
1309 }
1310#endif
1311 return err;
1312}
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001313EXPORT_SYMBOL(compat_ip_getsockopt);
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001314#endif