blob: c0bea7bfaa8a713ebc55c5663327e635a97a4b60 [file] [log] [blame]
/*
 *	Internet Control Message Protocol (ICMPv6)
 *	Linux INET6 implementation
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *
 *	$Id: icmp.c,v 1.38 2002/02/08 03:57:19 davem Exp $
 *
 *	Based on net/ipv4/icmp.c
 *
 *	RFC 1885
 *
 *	This program is free software; you can redistribute it and/or
 *	modify it under the terms of the GNU General Public License
 *	as published by the Free Software Foundation; either version
 *	2 of the License, or (at your option) any later version.
 */
19
/*
 *	Changes:
 *
 *	Andi Kleen		:	exception handling
 *	Andi Kleen		:	add rate limits; never reply to an ICMP
 *					error; add more length checks and
 *					other fixes.
 *	yoshfuji		:	ensure a parameter problem is sent for
 *					fragments.
 *	YOSHIFUJI Hideaki @USAGI:	added sysctl for icmp rate limit.
 *	Randy Dunlap and
 *	YOSHIFUJI Hideaki @USAGI:	Per-interface statistics support
 *	Kazunori MIYAZAWA @USAGI:	change output process to use
 *					ip6_append_data
 */
33
34#include <linux/module.h>
35#include <linux/errno.h>
36#include <linux/types.h>
37#include <linux/socket.h>
38#include <linux/in.h>
39#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070040#include <linux/sockios.h>
41#include <linux/net.h>
42#include <linux/skbuff.h>
43#include <linux/init.h>
Yasuyuki Kozakai763ecff2006-02-15 15:24:15 -080044#include <linux/netfilter.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070045
46#ifdef CONFIG_SYSCTL
47#include <linux/sysctl.h>
48#endif
49
50#include <linux/inet.h>
51#include <linux/netdevice.h>
52#include <linux/icmpv6.h>
53
54#include <net/ip.h>
55#include <net/sock.h>
56
57#include <net/ipv6.h>
58#include <net/ip6_checksum.h>
59#include <net/protocol.h>
60#include <net/raw.h>
61#include <net/rawv6.h>
62#include <net/transp_v6.h>
63#include <net/ip6_route.h>
64#include <net/addrconf.h>
65#include <net/icmp.h>
Herbert Xu8b7817f2007-12-12 10:44:43 -080066#include <net/xfrm.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070067
68#include <asm/uaccess.h>
69#include <asm/system.h>
70
Eric Dumazetba899662005-08-26 12:05:31 -070071DEFINE_SNMP_STAT(struct icmpv6_mib, icmpv6_statistics) __read_mostly;
YOSHIFUJI Hideaki71590392007-02-22 22:05:40 +090072EXPORT_SYMBOL(icmpv6_statistics);
David L Stevens14878f72007-09-16 16:52:35 -070073DEFINE_SNMP_STAT(struct icmpv6msg_mib, icmpv6msg_statistics) __read_mostly;
74EXPORT_SYMBOL(icmpv6msg_statistics);
Linus Torvalds1da177e2005-04-16 15:20:36 -070075
76/*
77 * The ICMP socket(s). This is the most convenient way to flow control
78 * our ICMP output as well as maintain a clean interface throughout
79 * all layers. All Socketless IP sends will soon be gone.
80 *
81 * On SMP we have one ICMP socket per-cpu.
82 */
83static DEFINE_PER_CPU(struct socket *, __icmpv6_socket) = NULL;
84#define icmpv6_socket __get_cpu_var(__icmpv6_socket)
85
Herbert Xue5bbef22007-10-15 12:50:28 -070086static int icmpv6_rcv(struct sk_buff *skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -070087
88static struct inet6_protocol icmpv6_protocol = {
89 .handler = icmpv6_rcv,
Herbert Xu8b7817f2007-12-12 10:44:43 -080090 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
Linus Torvalds1da177e2005-04-16 15:20:36 -070091};
92
93static __inline__ int icmpv6_xmit_lock(void)
94{
95 local_bh_disable();
96
97 if (unlikely(!spin_trylock(&icmpv6_socket->sk->sk_lock.slock))) {
98 /* This can happen if the output path (f.e. SIT or
99 * ip6ip6 tunnel) signals dst_link_failure() for an
100 * outgoing ICMP6 packet.
101 */
102 local_bh_enable();
103 return 1;
104 }
105 return 0;
106}
107
108static __inline__ void icmpv6_xmit_unlock(void)
109{
110 spin_unlock_bh(&icmpv6_socket->sk->sk_lock.slock);
111}
112
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900113/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114 * Slightly more convenient version of icmpv6_send.
115 */
116void icmpv6_param_prob(struct sk_buff *skb, int code, int pos)
117{
118 icmpv6_send(skb, ICMPV6_PARAMPROB, code, pos, skb->dev);
119 kfree_skb(skb);
120}
121
122/*
123 * Figure out, may we reply to this packet with icmp error.
124 *
125 * We do not reply, if:
126 * - it was icmp error message.
127 * - it is truncated, so that it is known, that protocol is ICMPV6
128 * (i.e. in the middle of some exthdr)
129 *
130 * --ANK (980726)
131 */
132
133static int is_ineligible(struct sk_buff *skb)
134{
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700135 int ptr = (u8 *)(ipv6_hdr(skb) + 1) - skb->data;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700136 int len = skb->len - ptr;
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700137 __u8 nexthdr = ipv6_hdr(skb)->nexthdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700138
139 if (len < 0)
140 return 1;
141
Herbert Xu0d3d0772005-04-24 20:16:19 -0700142 ptr = ipv6_skip_exthdr(skb, ptr, &nexthdr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700143 if (ptr < 0)
144 return 0;
145 if (nexthdr == IPPROTO_ICMPV6) {
146 u8 _type, *tp;
147 tp = skb_header_pointer(skb,
148 ptr+offsetof(struct icmp6hdr, icmp6_type),
149 sizeof(_type), &_type);
150 if (tp == NULL ||
151 !(*tp & ICMPV6_INFOMSG_MASK))
152 return 1;
153 }
154 return 0;
155}
156
Brian Haleyab32ea52006-09-22 14:15:41 -0700157static int sysctl_icmpv6_time __read_mostly = 1*HZ;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700158
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900159/*
160 * Check the ICMP output rate limit
Linus Torvalds1da177e2005-04-16 15:20:36 -0700161 */
162static inline int icmpv6_xrlim_allow(struct sock *sk, int type,
163 struct flowi *fl)
164{
165 struct dst_entry *dst;
166 int res = 0;
167
168 /* Informational messages are not limited. */
169 if (type & ICMPV6_INFOMSG_MASK)
170 return 1;
171
172 /* Do not limit pmtu discovery, it would break it. */
173 if (type == ICMPV6_PKT_TOOBIG)
174 return 1;
175
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900176 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700177 * Look up the output route.
178 * XXX: perhaps the expire for routing entries cloned by
179 * this lookup should be more aggressive (not longer than timeout).
180 */
181 dst = ip6_route_output(sk, fl);
182 if (dst->error) {
YOSHIFUJI Hideakia11d2062006-11-04 20:11:37 +0900183 IP6_INC_STATS(ip6_dst_idev(dst),
184 IPSTATS_MIB_OUTNOROUTES);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700185 } else if (dst->dev && (dst->dev->flags&IFF_LOOPBACK)) {
186 res = 1;
187 } else {
188 struct rt6_info *rt = (struct rt6_info *)dst;
189 int tmo = sysctl_icmpv6_time;
190
191 /* Give more bandwidth to wider prefixes. */
192 if (rt->rt6i_dst.plen < 128)
193 tmo >>= ((128 - rt->rt6i_dst.plen)>>5);
194
195 res = xrlim_allow(dst, tmo);
196 }
197 dst_release(dst);
198 return res;
199}
200
201/*
202 * an inline helper for the "simple" if statement below
203 * checks if parameter problem report is caused by an
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900204 * unrecognized IPv6 option that has the Option Type
Linus Torvalds1da177e2005-04-16 15:20:36 -0700205 * highest-order two bits set to 10
206 */
207
208static __inline__ int opt_unrec(struct sk_buff *skb, __u32 offset)
209{
210 u8 _optval, *op;
211
Arnaldo Carvalho de Melobbe735e2007-03-10 22:16:10 -0300212 offset += skb_network_offset(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700213 op = skb_header_pointer(skb, offset, sizeof(_optval), &_optval);
214 if (op == NULL)
215 return 1;
216 return (*op & 0xC0) == 0x80;
217}
218
219static int icmpv6_push_pending_frames(struct sock *sk, struct flowi *fl, struct icmp6hdr *thdr, int len)
220{
221 struct sk_buff *skb;
222 struct icmp6hdr *icmp6h;
223 int err = 0;
224
225 if ((skb = skb_peek(&sk->sk_write_queue)) == NULL)
226 goto out;
227
Arnaldo Carvalho de Melocc70ab22007-03-13 14:03:22 -0300228 icmp6h = icmp6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229 memcpy(icmp6h, thdr, sizeof(struct icmp6hdr));
230 icmp6h->icmp6_cksum = 0;
231
232 if (skb_queue_len(&sk->sk_write_queue) == 1) {
233 skb->csum = csum_partial((char *)icmp6h,
234 sizeof(struct icmp6hdr), skb->csum);
235 icmp6h->icmp6_cksum = csum_ipv6_magic(&fl->fl6_src,
236 &fl->fl6_dst,
237 len, fl->proto,
238 skb->csum);
239 } else {
Al Viro868c86b2006-11-14 21:35:48 -0800240 __wsum tmp_csum = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241
242 skb_queue_walk(&sk->sk_write_queue, skb) {
243 tmp_csum = csum_add(tmp_csum, skb->csum);
244 }
245
246 tmp_csum = csum_partial((char *)icmp6h,
247 sizeof(struct icmp6hdr), tmp_csum);
Al Viro868c86b2006-11-14 21:35:48 -0800248 icmp6h->icmp6_cksum = csum_ipv6_magic(&fl->fl6_src,
249 &fl->fl6_dst,
250 len, fl->proto,
251 tmp_csum);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700252 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253 ip6_push_pending_frames(sk);
254out:
255 return err;
256}
257
/* Cookie passed through ip6_append_data() to icmpv6_getfrag(). */
struct icmpv6_msg {
	struct sk_buff	*skb;		/* packet whose bytes are copied out */
	int		offset;		/* start of the copied data in skb */
	uint8_t		type;		/* ICMPv6 type of the message being built */
};
263
264static int icmpv6_getfrag(void *from, char *to, int offset, int len, int odd, struct sk_buff *skb)
265{
266 struct icmpv6_msg *msg = (struct icmpv6_msg *) from;
267 struct sk_buff *org_skb = msg->skb;
Al Viro5f92a732006-11-14 21:36:54 -0800268 __wsum csum = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269
270 csum = skb_copy_and_csum_bits(org_skb, msg->offset + offset,
271 to, len, csum);
272 skb->csum = csum_block_add(skb->csum, csum, odd);
Yasuyuki Kozakai763ecff2006-02-15 15:24:15 -0800273 if (!(msg->type & ICMPV6_INFOMSG_MASK))
274 nf_ct_attach(skb, org_skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700275 return 0;
276}
277
#if defined(CONFIG_IPV6_MIP6) || defined(CONFIG_IPV6_MIP6_MODULE)
/*
 *	If @skb carries a Home Address destination option (opt->dsthao is
 *	set and the TLV is found), exchange the IPv6 source address with
 *	the address stored in that option.  Otherwise @skb is left untouched.
 */
static void mip6_addr_swap(struct sk_buff *skb)
{
	struct ipv6hdr *iph = ipv6_hdr(skb);
	struct inet6_skb_parm *opt = IP6CB(skb);
	struct ipv6_destopt_hao *hao;
	struct in6_addr tmp;
	int off;

	if (!opt->dsthao)
		return;

	off = ipv6_find_tlv(skb, opt->dsthao, IPV6_TLV_HAO);
	if (unlikely(off < 0))
		return;

	hao = (struct ipv6_destopt_hao *)(skb_network_header(skb) + off);

	ipv6_addr_copy(&tmp, &iph->saddr);
	ipv6_addr_copy(&iph->saddr, &hao->addr);
	ipv6_addr_copy(&hao->addr, &tmp);
}
#else
/* Mobile IPv6 not configured: nothing to swap. */
static inline void mip6_addr_swap(struct sk_buff *skb) {}
#endif
301
Linus Torvalds1da177e2005-04-16 15:20:36 -0700302/*
303 * Send an ICMP message in response to a packet in error
304 */
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900305void icmpv6_send(struct sk_buff *skb, int type, int code, __u32 info,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700306 struct net_device *dev)
307{
308 struct inet6_dev *idev = NULL;
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700309 struct ipv6hdr *hdr = ipv6_hdr(skb);
YOSHIFUJI Hideaki84427d52005-06-13 14:59:44 -0700310 struct sock *sk;
311 struct ipv6_pinfo *np;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312 struct in6_addr *saddr = NULL;
313 struct dst_entry *dst;
Herbert Xu8b7817f2007-12-12 10:44:43 -0800314 struct dst_entry *dst2;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315 struct icmp6hdr tmp_hdr;
316 struct flowi fl;
Herbert Xu8b7817f2007-12-12 10:44:43 -0800317 struct flowi fl2;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700318 struct icmpv6_msg msg;
319 int iif = 0;
320 int addr_type = 0;
321 int len;
YOSHIFUJI Hideaki41a1f8e2005-09-08 10:19:03 +0900322 int hlimit, tclass;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323 int err = 0;
324
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -0700325 if ((u8 *)hdr < skb->head ||
326 (skb->network_header + sizeof(*hdr)) > skb->tail)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700327 return;
328
329 /*
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900330 * Make sure we respect the rules
Linus Torvalds1da177e2005-04-16 15:20:36 -0700331 * i.e. RFC 1885 2.4(e)
332 * Rule (e.1) is enforced by not using icmpv6_send
333 * in any code that processes icmp errors.
334 */
335 addr_type = ipv6_addr_type(&hdr->daddr);
336
337 if (ipv6_chk_addr(&hdr->daddr, skb->dev, 0))
338 saddr = &hdr->daddr;
339
340 /*
341 * Dest addr check
342 */
343
344 if ((addr_type & IPV6_ADDR_MULTICAST || skb->pkt_type != PACKET_HOST)) {
345 if (type != ICMPV6_PKT_TOOBIG &&
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900346 !(type == ICMPV6_PARAMPROB &&
347 code == ICMPV6_UNK_OPTION &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700348 (opt_unrec(skb, info))))
349 return;
350
351 saddr = NULL;
352 }
353
354 addr_type = ipv6_addr_type(&hdr->saddr);
355
356 /*
357 * Source addr check
358 */
359
360 if (addr_type & IPV6_ADDR_LINKLOCAL)
361 iif = skb->dev->ifindex;
362
363 /*
YOSHIFUJI Hideaki8de33512005-12-21 22:57:06 +0900364 * Must not send error if the source does not uniquely
365 * identify a single node (RFC2463 Section 2.4).
366 * We check unspecified / multicast addresses here,
367 * and anycast addresses will be checked later.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700368 */
369 if ((addr_type == IPV6_ADDR_ANY) || (addr_type & IPV6_ADDR_MULTICAST)) {
Patrick McHardy64ce2072005-08-09 20:50:53 -0700370 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: addr_any/mcast source\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700371 return;
372 }
373
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900374 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700375 * Never answer to a ICMP packet.
376 */
377 if (is_ineligible(skb)) {
Patrick McHardy64ce2072005-08-09 20:50:53 -0700378 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: no reply to icmp error\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700379 return;
380 }
381
Masahide NAKAMURA79383232006-08-23 19:27:25 -0700382 mip6_addr_swap(skb);
383
Linus Torvalds1da177e2005-04-16 15:20:36 -0700384 memset(&fl, 0, sizeof(fl));
385 fl.proto = IPPROTO_ICMPV6;
386 ipv6_addr_copy(&fl.fl6_dst, &hdr->saddr);
387 if (saddr)
388 ipv6_addr_copy(&fl.fl6_src, saddr);
389 fl.oif = iif;
390 fl.fl_icmp_type = type;
391 fl.fl_icmp_code = code;
Venkat Yekkiralabeb8d132006-08-04 23:12:42 -0700392 security_skb_classify_flow(skb, &fl);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700393
394 if (icmpv6_xmit_lock())
395 return;
396
YOSHIFUJI Hideaki84427d52005-06-13 14:59:44 -0700397 sk = icmpv6_socket->sk;
398 np = inet6_sk(sk);
399
Linus Torvalds1da177e2005-04-16 15:20:36 -0700400 if (!icmpv6_xrlim_allow(sk, type, &fl))
401 goto out;
402
403 tmp_hdr.icmp6_type = type;
404 tmp_hdr.icmp6_code = code;
405 tmp_hdr.icmp6_cksum = 0;
406 tmp_hdr.icmp6_pointer = htonl(info);
407
408 if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst))
409 fl.oif = np->mcast_oif;
410
411 err = ip6_dst_lookup(sk, &dst, &fl);
412 if (err)
413 goto out;
YOSHIFUJI Hideaki8de33512005-12-21 22:57:06 +0900414
415 /*
416 * We won't send icmp if the destination is known
417 * anycast.
418 */
419 if (((struct rt6_info *)dst)->rt6i_flags & RTF_ANYCAST) {
420 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: acast source\n");
421 goto out_dst_release;
422 }
423
Herbert Xu8b7817f2007-12-12 10:44:43 -0800424 /* No need to clone since we're just using its address. */
425 dst2 = dst;
426
427 err = xfrm_lookup(&dst, &fl, sk, 0);
428 switch (err) {
429 case 0:
430 if (dst != dst2)
431 goto route_done;
432 break;
433 case -EPERM:
434 dst = NULL;
435 break;
436 default:
437 goto out;
438 }
439
440 if (xfrm_decode_session_reverse(skb, &fl2, AF_INET6))
Patrick McHardye1044112005-09-08 15:11:55 -0700441 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700442
Herbert Xu8b7817f2007-12-12 10:44:43 -0800443 if (ip6_dst_lookup(sk, &dst2, &fl))
444 goto out;
445
446 err = xfrm_lookup(&dst2, &fl, sk, XFRM_LOOKUP_ICMP);
447 if (err == -ENOENT) {
448 if (!dst)
449 goto out;
450 goto route_done;
451 }
452
453 dst_release(dst);
454 dst = dst2;
455
456 if (err)
457 goto out;
458
459route_done:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700460 if (ipv6_addr_is_multicast(&fl.fl6_dst))
461 hlimit = np->mcast_hops;
462 else
463 hlimit = np->hop_limit;
464 if (hlimit < 0)
465 hlimit = dst_metric(dst, RTAX_HOPLIMIT);
466 if (hlimit < 0)
467 hlimit = ipv6_get_hoplimit(dst->dev);
468
YOSHIFUJI Hideakie012d512006-09-13 20:01:28 -0700469 tclass = np->tclass;
YOSHIFUJI Hideaki41a1f8e2005-09-08 10:19:03 +0900470 if (tclass < 0)
471 tclass = 0;
472
Linus Torvalds1da177e2005-04-16 15:20:36 -0700473 msg.skb = skb;
Arnaldo Carvalho de Melobbe735e2007-03-10 22:16:10 -0300474 msg.offset = skb_network_offset(skb);
Yasuyuki Kozakai763ecff2006-02-15 15:24:15 -0800475 msg.type = type;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700476
477 len = skb->len - msg.offset;
478 len = min_t(unsigned int, len, IPV6_MIN_MTU - sizeof(struct ipv6hdr) -sizeof(struct icmp6hdr));
479 if (len < 0) {
Patrick McHardy64ce2072005-08-09 20:50:53 -0700480 LIMIT_NETDEBUG(KERN_DEBUG "icmp: len problem\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700481 goto out_dst_release;
482 }
483
484 idev = in6_dev_get(skb->dev);
485
486 err = ip6_append_data(sk, icmpv6_getfrag, &msg,
487 len + sizeof(struct icmp6hdr),
488 sizeof(struct icmp6hdr),
YOSHIFUJI Hideaki41a1f8e2005-09-08 10:19:03 +0900489 hlimit, tclass, NULL, &fl, (struct rt6_info*)dst,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490 MSG_DONTWAIT);
491 if (err) {
492 ip6_flush_pending_frames(sk);
493 goto out_put;
494 }
495 err = icmpv6_push_pending_frames(sk, &fl, &tmp_hdr, len + sizeof(struct icmp6hdr));
496
Linus Torvalds1da177e2005-04-16 15:20:36 -0700497out_put:
498 if (likely(idev != NULL))
499 in6_dev_put(idev);
500out_dst_release:
501 dst_release(dst);
502out:
503 icmpv6_xmit_unlock();
504}
505
YOSHIFUJI Hideaki71590392007-02-22 22:05:40 +0900506EXPORT_SYMBOL(icmpv6_send);
507
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508static void icmpv6_echo_reply(struct sk_buff *skb)
509{
YOSHIFUJI Hideaki84427d52005-06-13 14:59:44 -0700510 struct sock *sk;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700511 struct inet6_dev *idev;
YOSHIFUJI Hideaki84427d52005-06-13 14:59:44 -0700512 struct ipv6_pinfo *np;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700513 struct in6_addr *saddr = NULL;
Arnaldo Carvalho de Melocc70ab22007-03-13 14:03:22 -0300514 struct icmp6hdr *icmph = icmp6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700515 struct icmp6hdr tmp_hdr;
516 struct flowi fl;
517 struct icmpv6_msg msg;
518 struct dst_entry *dst;
519 int err = 0;
520 int hlimit;
YOSHIFUJI Hideaki41a1f8e2005-09-08 10:19:03 +0900521 int tclass;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700522
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700523 saddr = &ipv6_hdr(skb)->daddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700524
525 if (!ipv6_unicast_destination(skb))
526 saddr = NULL;
527
528 memcpy(&tmp_hdr, icmph, sizeof(tmp_hdr));
529 tmp_hdr.icmp6_type = ICMPV6_ECHO_REPLY;
530
531 memset(&fl, 0, sizeof(fl));
532 fl.proto = IPPROTO_ICMPV6;
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700533 ipv6_addr_copy(&fl.fl6_dst, &ipv6_hdr(skb)->saddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700534 if (saddr)
535 ipv6_addr_copy(&fl.fl6_src, saddr);
536 fl.oif = skb->dev->ifindex;
537 fl.fl_icmp_type = ICMPV6_ECHO_REPLY;
Venkat Yekkiralabeb8d132006-08-04 23:12:42 -0700538 security_skb_classify_flow(skb, &fl);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700539
540 if (icmpv6_xmit_lock())
541 return;
542
YOSHIFUJI Hideaki84427d52005-06-13 14:59:44 -0700543 sk = icmpv6_socket->sk;
544 np = inet6_sk(sk);
545
Linus Torvalds1da177e2005-04-16 15:20:36 -0700546 if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst))
547 fl.oif = np->mcast_oif;
548
549 err = ip6_dst_lookup(sk, &dst, &fl);
550 if (err)
551 goto out;
552 if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0)
Patrick McHardye1044112005-09-08 15:11:55 -0700553 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700554
555 if (ipv6_addr_is_multicast(&fl.fl6_dst))
556 hlimit = np->mcast_hops;
557 else
558 hlimit = np->hop_limit;
559 if (hlimit < 0)
560 hlimit = dst_metric(dst, RTAX_HOPLIMIT);
561 if (hlimit < 0)
562 hlimit = ipv6_get_hoplimit(dst->dev);
563
YOSHIFUJI Hideakie012d512006-09-13 20:01:28 -0700564 tclass = np->tclass;
YOSHIFUJI Hideaki41a1f8e2005-09-08 10:19:03 +0900565 if (tclass < 0)
566 tclass = 0;
567
Linus Torvalds1da177e2005-04-16 15:20:36 -0700568 idev = in6_dev_get(skb->dev);
569
570 msg.skb = skb;
571 msg.offset = 0;
Yasuyuki Kozakai763ecff2006-02-15 15:24:15 -0800572 msg.type = ICMPV6_ECHO_REPLY;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700573
574 err = ip6_append_data(sk, icmpv6_getfrag, &msg, skb->len + sizeof(struct icmp6hdr),
YOSHIFUJI Hideaki41a1f8e2005-09-08 10:19:03 +0900575 sizeof(struct icmp6hdr), hlimit, tclass, NULL, &fl,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700576 (struct rt6_info*)dst, MSG_DONTWAIT);
577
578 if (err) {
579 ip6_flush_pending_frames(sk);
580 goto out_put;
581 }
582 err = icmpv6_push_pending_frames(sk, &fl, &tmp_hdr, skb->len + sizeof(struct icmp6hdr));
583
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900584out_put:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700585 if (likely(idev != NULL))
586 in6_dev_put(idev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700587 dst_release(dst);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900588out:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700589 icmpv6_xmit_unlock();
590}
591
Al Viro04ce6902006-11-08 00:21:01 -0800592static void icmpv6_notify(struct sk_buff *skb, int type, int code, __be32 info)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700593{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700594 struct inet6_protocol *ipprot;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700595 int inner_offset;
596 int hash;
597 u8 nexthdr;
598
599 if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))
600 return;
601
602 nexthdr = ((struct ipv6hdr *)skb->data)->nexthdr;
603 if (ipv6_ext_hdr(nexthdr)) {
604 /* now skip over extension headers */
Herbert Xu0d3d0772005-04-24 20:16:19 -0700605 inner_offset = ipv6_skip_exthdr(skb, sizeof(struct ipv6hdr), &nexthdr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700606 if (inner_offset<0)
607 return;
608 } else {
609 inner_offset = sizeof(struct ipv6hdr);
610 }
611
612 /* Checkin header including 8 bytes of inner protocol header. */
613 if (!pskb_may_pull(skb, inner_offset+8))
614 return;
615
Linus Torvalds1da177e2005-04-16 15:20:36 -0700616 /* BUGGG_FUTURE: we should try to parse exthdrs in this packet.
617 Without this we will not able f.e. to make source routed
618 pmtu discovery.
619 Corresponding argument (opt) to notifiers is already added.
620 --ANK (980726)
621 */
622
623 hash = nexthdr & (MAX_INET_PROTOS - 1);
624
625 rcu_read_lock();
626 ipprot = rcu_dereference(inet6_protos[hash]);
627 if (ipprot && ipprot->err_handler)
628 ipprot->err_handler(skb, NULL, type, code, inner_offset, info);
629 rcu_read_unlock();
630
Pavel Emelyanov69d6da02007-11-19 22:35:57 -0800631 raw6_icmp_error(skb, nexthdr, type, code, inner_offset, info);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700632}
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900633
Linus Torvalds1da177e2005-04-16 15:20:36 -0700634/*
635 * Handle icmp messages
636 */
637
Herbert Xue5bbef22007-10-15 12:50:28 -0700638static int icmpv6_rcv(struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700639{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700640 struct net_device *dev = skb->dev;
641 struct inet6_dev *idev = __in6_dev_get(dev);
642 struct in6_addr *saddr, *daddr;
643 struct ipv6hdr *orig_hdr;
644 struct icmp6hdr *hdr;
645 int type;
646
Herbert Xu8b7817f2007-12-12 10:44:43 -0800647 if (xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb) &&
648 skb->sp->xvec[skb->sp->len - 1]->props.flags & XFRM_STATE_ICMP) {
649 int nh;
650
651 if (!pskb_may_pull(skb, sizeof(*hdr) + sizeof(*orig_hdr)))
652 goto drop_no_count;
653
654 nh = skb_network_offset(skb);
655 skb_set_network_header(skb, sizeof(*hdr));
656
657 if (!xfrm6_policy_check_reverse(NULL, XFRM_POLICY_IN, skb))
658 goto drop_no_count;
659
660 skb_set_network_header(skb, nh);
661 }
662
Linus Torvalds1da177e2005-04-16 15:20:36 -0700663 ICMP6_INC_STATS_BH(idev, ICMP6_MIB_INMSGS);
664
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700665 saddr = &ipv6_hdr(skb)->saddr;
666 daddr = &ipv6_hdr(skb)->daddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700667
668 /* Perform checksum. */
Herbert Xufb286bb2005-11-10 13:01:24 -0800669 switch (skb->ip_summed) {
Patrick McHardy84fa7932006-08-29 16:44:56 -0700670 case CHECKSUM_COMPLETE:
Herbert Xufb286bb2005-11-10 13:01:24 -0800671 if (!csum_ipv6_magic(saddr, daddr, skb->len, IPPROTO_ICMPV6,
672 skb->csum))
673 break;
674 /* fall through */
675 case CHECKSUM_NONE:
Al Viro868c86b2006-11-14 21:35:48 -0800676 skb->csum = ~csum_unfold(csum_ipv6_magic(saddr, daddr, skb->len,
677 IPPROTO_ICMPV6, 0));
Herbert Xufb286bb2005-11-10 13:01:24 -0800678 if (__skb_checksum_complete(skb)) {
Joe Perches46b86a22006-01-13 14:29:07 -0800679 LIMIT_NETDEBUG(KERN_DEBUG "ICMPv6 checksum failed [" NIP6_FMT " > " NIP6_FMT "]\n",
Patrick McHardy64ce2072005-08-09 20:50:53 -0700680 NIP6(*saddr), NIP6(*daddr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700681 goto discard_it;
682 }
683 }
684
Herbert Xu8b7817f2007-12-12 10:44:43 -0800685 __skb_pull(skb, sizeof(*hdr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700686
Arnaldo Carvalho de Melocc70ab22007-03-13 14:03:22 -0300687 hdr = icmp6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700688
689 type = hdr->icmp6_type;
690
David L Stevens14878f72007-09-16 16:52:35 -0700691 ICMP6MSGIN_INC_STATS_BH(idev, type);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700692
693 switch (type) {
694 case ICMPV6_ECHO_REQUEST:
695 icmpv6_echo_reply(skb);
696 break;
697
698 case ICMPV6_ECHO_REPLY:
699 /* we couldn't care less */
700 break;
701
702 case ICMPV6_PKT_TOOBIG:
703 /* BUGGG_FUTURE: if packet contains rthdr, we cannot update
704 standard destination cache. Seems, only "advanced"
705 destination cache will allow to solve this problem
706 --ANK (980726)
707 */
708 if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))
709 goto discard_it;
Arnaldo Carvalho de Melocc70ab22007-03-13 14:03:22 -0300710 hdr = icmp6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700711 orig_hdr = (struct ipv6hdr *) (hdr + 1);
712 rt6_pmtu_discovery(&orig_hdr->daddr, &orig_hdr->saddr, dev,
713 ntohl(hdr->icmp6_mtu));
714
715 /*
716 * Drop through to notify
717 */
718
719 case ICMPV6_DEST_UNREACH:
720 case ICMPV6_TIME_EXCEED:
721 case ICMPV6_PARAMPROB:
722 icmpv6_notify(skb, type, hdr->icmp6_code, hdr->icmp6_mtu);
723 break;
724
725 case NDISC_ROUTER_SOLICITATION:
726 case NDISC_ROUTER_ADVERTISEMENT:
727 case NDISC_NEIGHBOUR_SOLICITATION:
728 case NDISC_NEIGHBOUR_ADVERTISEMENT:
729 case NDISC_REDIRECT:
730 ndisc_rcv(skb);
731 break;
732
733 case ICMPV6_MGM_QUERY:
734 igmp6_event_query(skb);
735 break;
736
737 case ICMPV6_MGM_REPORT:
738 igmp6_event_report(skb);
739 break;
740
741 case ICMPV6_MGM_REDUCTION:
742 case ICMPV6_NI_QUERY:
743 case ICMPV6_NI_REPLY:
744 case ICMPV6_MLD2_REPORT:
745 case ICMPV6_DHAAD_REQUEST:
746 case ICMPV6_DHAAD_REPLY:
747 case ICMPV6_MOBILE_PREFIX_SOL:
748 case ICMPV6_MOBILE_PREFIX_ADV:
749 break;
750
751 default:
Patrick McHardy64ce2072005-08-09 20:50:53 -0700752 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6: msg of unknown type\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700753
754 /* informational */
755 if (type & ICMPV6_INFOMSG_MASK)
756 break;
757
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900758 /*
759 * error of unknown type.
760 * must pass to upper level
Linus Torvalds1da177e2005-04-16 15:20:36 -0700761 */
762
763 icmpv6_notify(skb, type, hdr->icmp6_code, hdr->icmp6_mtu);
Stephen Hemminger3ff50b72007-04-20 17:09:22 -0700764 }
765
Linus Torvalds1da177e2005-04-16 15:20:36 -0700766 kfree_skb(skb);
767 return 0;
768
769discard_it:
770 ICMP6_INC_STATS_BH(idev, ICMP6_MIB_INERRORS);
Herbert Xu8b7817f2007-12-12 10:44:43 -0800771drop_no_count:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700772 kfree_skb(skb);
773 return 0;
774}
775
Ingo Molnar640c41c2006-08-15 00:06:56 -0700776/*
777 * Special lock-class for __icmpv6_socket:
778 */
779static struct lock_class_key icmpv6_socket_sk_dst_lock_key;
780
Linus Torvalds1da177e2005-04-16 15:20:36 -0700781int __init icmpv6_init(struct net_proto_family *ops)
782{
783 struct sock *sk;
784 int err, i, j;
785
KAMEZAWA Hiroyuki6f912042006-04-10 22:52:50 -0700786 for_each_possible_cpu(i) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700787 err = sock_create_kern(PF_INET6, SOCK_RAW, IPPROTO_ICMPV6,
788 &per_cpu(__icmpv6_socket, i));
789 if (err < 0) {
790 printk(KERN_ERR
791 "Failed to initialize the ICMP6 control socket "
792 "(err %d).\n",
793 err);
794 goto fail;
795 }
796
797 sk = per_cpu(__icmpv6_socket, i)->sk;
798 sk->sk_allocation = GFP_ATOMIC;
Ingo Molnar640c41c2006-08-15 00:06:56 -0700799 /*
800 * Split off their lock-class, because sk->sk_dst_lock
801 * gets used from softirqs, which is safe for
802 * __icmpv6_socket (because those never get directly used
803 * via userspace syscalls), but unsafe for normal sockets.
804 */
805 lockdep_set_class(&sk->sk_dst_lock,
806 &icmpv6_socket_sk_dst_lock_key);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700807
808 /* Enough space for 2 64K ICMP packets, including
809 * sk_buff struct overhead.
810 */
811 sk->sk_sndbuf =
812 (2 * ((64 * 1024) + sizeof(struct sk_buff)));
813
814 sk->sk_prot->unhash(sk);
815 }
816
817
818 if (inet6_add_protocol(&icmpv6_protocol, IPPROTO_ICMPV6) < 0) {
819 printk(KERN_ERR "Failed to register ICMP6 protocol\n");
820 err = -EAGAIN;
821 goto fail;
822 }
823
824 return 0;
825
826 fail:
827 for (j = 0; j < i; j++) {
828 if (!cpu_possible(j))
829 continue;
830 sock_release(per_cpu(__icmpv6_socket, j));
831 }
832
833 return err;
834}
835
836void icmpv6_cleanup(void)
837{
838 int i;
839
KAMEZAWA Hiroyuki6f912042006-04-10 22:52:50 -0700840 for_each_possible_cpu(i) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700841 sock_release(per_cpu(__icmpv6_socket, i));
842 }
843 inet6_del_protocol(&icmpv6_protocol, IPPROTO_ICMPV6);
844}
845
/*
 *	errno / fatal flag for each Destination Unreachable code, indexed
 *	by the ICMPv6 code (0 .. ICMPV6_PORT_UNREACH).
 */
static const struct icmp6_err {
	int err;
	int fatal;
} tab_unreach[] = {
	{ .err = ENETUNREACH,	.fatal = 0 },	/* NOROUTE */
	{ .err = EACCES,	.fatal = 1 },	/* ADM_PROHIBITED */
	{ .err = EHOSTUNREACH,	.fatal = 0 },	/* Was NOT_NEIGHBOUR, now reserved */
	{ .err = EHOSTUNREACH,	.fatal = 0 },	/* ADDR_UNREACH */
	{ .err = ECONNREFUSED,	.fatal = 1 },	/* PORT_UNREACH */
};
871
872int icmpv6_err_convert(int type, int code, int *err)
873{
874 int fatal = 0;
875
876 *err = EPROTO;
877
878 switch (type) {
879 case ICMPV6_DEST_UNREACH:
880 fatal = 1;
881 if (code <= ICMPV6_PORT_UNREACH) {
882 *err = tab_unreach[code].err;
883 fatal = tab_unreach[code].fatal;
884 }
885 break;
886
887 case ICMPV6_PKT_TOOBIG:
888 *err = EMSGSIZE;
889 break;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900890
Linus Torvalds1da177e2005-04-16 15:20:36 -0700891 case ICMPV6_PARAMPROB:
892 *err = EPROTO;
893 fatal = 1;
894 break;
895
896 case ICMPV6_TIME_EXCEED:
897 *err = EHOSTUNREACH;
898 break;
Stephen Hemminger3ff50b72007-04-20 17:09:22 -0700899 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700900
901 return fatal;
902}
903
YOSHIFUJI Hideaki71590392007-02-22 22:05:40 +0900904EXPORT_SYMBOL(icmpv6_err_convert);
905
#ifdef CONFIG_SYSCTL
/*
 *	sysctl table for ICMPv6: a single integer entry, "ratelimit",
 *	backed by sysctl_icmpv6_time.  The zero ctl_name entry terminates
 *	the table.
 */
ctl_table ipv6_icmp_table[] = {
	{
		.ctl_name	= NET_IPV6_ICMP_RATELIMIT,
		.procname	= "ratelimit",
		.data		= &sysctl_icmpv6_time,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= &proc_dointvec
	},
	{ .ctl_name = 0 },
};
#endif
919