blob: 510aa747a404a13ad4bb81b404bf96b9f44c0035 [file] [log] [blame]
/*
 *	Neighbour Discovery for IPv6
 *	Linux INET6 implementation
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *	Mike Shaver		<shaver@ingenia.com>
 *
 *	This program is free software; you can redistribute it and/or
 *	modify it under the terms of the GNU General Public License
 *	as published by the Free Software Foundation; either version
 *	2 of the License, or (at your option) any later version.
 */
14
/*
 *	Changes:
 *
 *	Pierre Ynard			:	export userland ND options
 *						through netlink (RDNSS support)
 *	Lars Fenneberg			:	fixed MTU setting on receipt
 *						of an RA.
 *	Janos Farkas			:	kmalloc failure checks
 *	Alexey Kuznetsov		:	state machine reworked
 *						and moved to net/core.
 *	Pekka Savola			:	RFC2461 validation
 *	YOSHIFUJI Hideaki @USAGI	:	Verify ND options properly
 */
28
/*
 * Compile-time verbosity of the ND_PRINTKn() helpers: a message logged
 * through ND_PRINTKn() is compiled in only when ND_DEBUG >= n (level 0
 * is always compiled in).
 *
 * Set to 3 to get tracing...
 */
#define ND_DEBUG 1

/* Enabled form: printk() guarded by net_ratelimit(). */
#define ND_PRINTK(fmt, args...) do { if (net_ratelimit()) { printk(fmt, ## args); } } while(0)
/* Disabled form: expands to an empty statement; arguments are dropped. */
#define ND_NOPRINTK(x...) do { ; } while(0)

#define ND_PRINTK0 ND_PRINTK

#if ND_DEBUG >= 1
#define ND_PRINTK1 ND_PRINTK
#else
#define ND_PRINTK1 ND_NOPRINTK
#endif

#if ND_DEBUG >= 2
#define ND_PRINTK2 ND_PRINTK
#else
#define ND_PRINTK2 ND_NOPRINTK
#endif

#if ND_DEBUG >= 3
#define ND_PRINTK3 ND_PRINTK
#else
#define ND_PRINTK3 ND_NOPRINTK
#endif
50
51#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070052#include <linux/errno.h>
53#include <linux/types.h>
54#include <linux/socket.h>
55#include <linux/sockios.h>
56#include <linux/sched.h>
57#include <linux/net.h>
58#include <linux/in6.h>
59#include <linux/route.h>
60#include <linux/init.h>
61#include <linux/rcupdate.h>
62#ifdef CONFIG_SYSCTL
63#include <linux/sysctl.h>
64#endif
65
Thomas Graf18237302006-08-04 23:04:54 -070066#include <linux/if_addr.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070067#include <linux/if_arp.h>
68#include <linux/ipv6.h>
69#include <linux/icmpv6.h>
70#include <linux/jhash.h>
71
72#include <net/sock.h>
73#include <net/snmp.h>
74
75#include <net/ipv6.h>
76#include <net/protocol.h>
77#include <net/ndisc.h>
78#include <net/ip6_route.h>
79#include <net/addrconf.h>
80#include <net/icmp.h>
81
Pierre Ynard31910572007-10-10 21:22:05 -070082#include <net/netlink.h>
83#include <linux/rtnetlink.h>
84
Linus Torvalds1da177e2005-04-16 15:20:36 -070085#include <net/flow.h>
86#include <net/ip6_checksum.h>
87#include <linux/proc_fs.h>
88
89#include <linux/netfilter.h>
90#include <linux/netfilter_ipv6.h>
91
Linus Torvalds1da177e2005-04-16 15:20:36 -070092static u32 ndisc_hash(const void *pkey, const struct net_device *dev);
93static int ndisc_constructor(struct neighbour *neigh);
94static void ndisc_solicit(struct neighbour *neigh, struct sk_buff *skb);
95static void ndisc_error_report(struct neighbour *neigh, struct sk_buff *skb);
96static int pndisc_constructor(struct pneigh_entry *n);
97static void pndisc_destructor(struct pneigh_entry *n);
98static void pndisc_redo(struct sk_buff *skb);
99
100static struct neigh_ops ndisc_generic_ops = {
101 .family = AF_INET6,
102 .solicit = ndisc_solicit,
103 .error_report = ndisc_error_report,
104 .output = neigh_resolve_output,
105 .connected_output = neigh_connected_output,
106 .hh_output = dev_queue_xmit,
107 .queue_xmit = dev_queue_xmit,
108};
109
110static struct neigh_ops ndisc_hh_ops = {
111 .family = AF_INET6,
112 .solicit = ndisc_solicit,
113 .error_report = ndisc_error_report,
114 .output = neigh_resolve_output,
115 .connected_output = neigh_resolve_output,
116 .hh_output = dev_queue_xmit,
117 .queue_xmit = dev_queue_xmit,
118};
119
120
121static struct neigh_ops ndisc_direct_ops = {
122 .family = AF_INET6,
123 .output = dev_queue_xmit,
124 .connected_output = dev_queue_xmit,
125 .hh_output = dev_queue_xmit,
126 .queue_xmit = dev_queue_xmit,
127};
128
129struct neigh_table nd_tbl = {
130 .family = AF_INET6,
131 .entry_size = sizeof(struct neighbour) + sizeof(struct in6_addr),
132 .key_len = sizeof(struct in6_addr),
133 .hash = ndisc_hash,
134 .constructor = ndisc_constructor,
135 .pconstructor = pndisc_constructor,
136 .pdestructor = pndisc_destructor,
137 .proxy_redo = pndisc_redo,
138 .id = "ndisc_cache",
139 .parms = {
140 .tbl = &nd_tbl,
141 .base_reachable_time = 30 * HZ,
142 .retrans_time = 1 * HZ,
143 .gc_staletime = 60 * HZ,
144 .reachable_time = 30 * HZ,
145 .delay_probe_time = 5 * HZ,
146 .queue_len = 3,
147 .ucast_probes = 3,
148 .mcast_probes = 3,
149 .anycast_delay = 1 * HZ,
150 .proxy_delay = (8 * HZ) / 10,
151 .proxy_qlen = 64,
152 },
153 .gc_interval = 30 * HZ,
154 .gc_thresh1 = 128,
155 .gc_thresh2 = 512,
156 .gc_thresh3 = 1024,
157};
158
159/* ND options */
160struct ndisc_options {
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -0800161 struct nd_opt_hdr *nd_opt_array[__ND_OPT_ARRAY_MAX];
162#ifdef CONFIG_IPV6_ROUTE_INFO
163 struct nd_opt_hdr *nd_opts_ri;
164 struct nd_opt_hdr *nd_opts_ri_end;
165#endif
Pierre Ynard31910572007-10-10 21:22:05 -0700166 struct nd_opt_hdr *nd_useropts;
167 struct nd_opt_hdr *nd_useropts_end;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168};
169
/* Named accessors for the slots of ndisc_options.nd_opt_array[]. */
#define nd_opts_src_lladdr	nd_opt_array[ND_OPT_SOURCE_LL_ADDR]
#define nd_opts_tgt_lladdr	nd_opt_array[ND_OPT_TARGET_LL_ADDR]
#define nd_opts_pi		nd_opt_array[ND_OPT_PREFIX_INFO]
#define nd_opts_pi_end		nd_opt_array[__ND_OPT_PREFIX_INFO_END]
#define nd_opts_rh		nd_opt_array[ND_OPT_REDIRECT_HDR]
#define nd_opts_mtu		nd_opt_array[ND_OPT_MTU]

/*
 * Bytes occupied by an option carrying @len bytes of payload: two
 * bytes are added for the type/length header and the sum is rounded
 * up to a multiple of 8.
 */
#define NDISC_OPT_SPACE(len) (((len)+2+7)&~7)
178
/*
 * Number of padding bytes that sit between the option header
 * (type/length) and the link-layer address inside an address option.
 *
 * Only IP-over-InfiniBand needs padding at present (2 bytes); every
 * other device type gets 0.  Should RFC 3831 IPv6-over-Fibre Channel
 * ever be implemented, it may need a pad of 2 as well.
 */
static int ndisc_addr_option_pad(unsigned short type)
{
	if (type == ARPHRD_INFINIBAND)
		return 2;

	return 0;
}
192
193static inline int ndisc_opt_addr_space(struct net_device *dev)
194{
195 return NDISC_OPT_SPACE(dev->addr_len + ndisc_addr_option_pad(dev->type));
196}
197
198static u8 *ndisc_fill_addr_option(u8 *opt, int type, void *data, int data_len,
199 unsigned short addr_type)
200{
201 int space = NDISC_OPT_SPACE(data_len);
202 int pad = ndisc_addr_option_pad(addr_type);
203
204 opt[0] = type;
205 opt[1] = space>>3;
206
207 memset(opt + 2, 0, pad);
208 opt += pad;
209 space -= pad;
210
211 memcpy(opt+2, data, data_len);
212 data_len += 2;
213 opt += data_len;
214 if ((space -= data_len) > 0)
215 memset(opt, 0, space);
216 return opt + space;
217}
218
219static struct nd_opt_hdr *ndisc_next_option(struct nd_opt_hdr *cur,
220 struct nd_opt_hdr *end)
221{
222 int type;
223 if (!cur || !end || cur >= end)
224 return NULL;
225 type = cur->nd_opt_type;
226 do {
227 cur = ((void *)cur) + (cur->nd_opt_len << 3);
228 } while(cur < end && cur->nd_opt_type != type);
229 return (cur <= end && cur->nd_opt_type == type ? cur : NULL);
230}
231
Pierre Ynard31910572007-10-10 21:22:05 -0700232static inline int ndisc_is_useropt(struct nd_opt_hdr *opt)
233{
234 return (opt->nd_opt_type == ND_OPT_RDNSS);
235}
236
237static struct nd_opt_hdr *ndisc_next_useropt(struct nd_opt_hdr *cur,
238 struct nd_opt_hdr *end)
239{
240 if (!cur || !end || cur >= end)
241 return NULL;
242 do {
243 cur = ((void *)cur) + (cur->nd_opt_len << 3);
244 } while(cur < end && !ndisc_is_useropt(cur));
245 return (cur <= end && ndisc_is_useropt(cur) ? cur : NULL);
246}
247
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248static struct ndisc_options *ndisc_parse_options(u8 *opt, int opt_len,
249 struct ndisc_options *ndopts)
250{
251 struct nd_opt_hdr *nd_opt = (struct nd_opt_hdr *)opt;
252
253 if (!nd_opt || opt_len < 0 || !ndopts)
254 return NULL;
255 memset(ndopts, 0, sizeof(*ndopts));
256 while (opt_len) {
257 int l;
258 if (opt_len < sizeof(struct nd_opt_hdr))
259 return NULL;
260 l = nd_opt->nd_opt_len << 3;
261 if (opt_len < l || l == 0)
262 return NULL;
263 switch (nd_opt->nd_opt_type) {
264 case ND_OPT_SOURCE_LL_ADDR:
265 case ND_OPT_TARGET_LL_ADDR:
266 case ND_OPT_MTU:
267 case ND_OPT_REDIRECT_HDR:
268 if (ndopts->nd_opt_array[nd_opt->nd_opt_type]) {
269 ND_PRINTK2(KERN_WARNING
270 "%s(): duplicated ND6 option found: type=%d\n",
Harvey Harrison0dc47872008-03-05 20:47:47 -0800271 __func__,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272 nd_opt->nd_opt_type);
273 } else {
274 ndopts->nd_opt_array[nd_opt->nd_opt_type] = nd_opt;
275 }
276 break;
277 case ND_OPT_PREFIX_INFO:
278 ndopts->nd_opts_pi_end = nd_opt;
Stephen Hemmingercfcabdc2007-10-09 01:59:42 -0700279 if (!ndopts->nd_opt_array[nd_opt->nd_opt_type])
Linus Torvalds1da177e2005-04-16 15:20:36 -0700280 ndopts->nd_opt_array[nd_opt->nd_opt_type] = nd_opt;
281 break;
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -0800282#ifdef CONFIG_IPV6_ROUTE_INFO
283 case ND_OPT_ROUTE_INFO:
284 ndopts->nd_opts_ri_end = nd_opt;
285 if (!ndopts->nd_opts_ri)
286 ndopts->nd_opts_ri = nd_opt;
287 break;
288#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700289 default:
Pierre Ynard31910572007-10-10 21:22:05 -0700290 if (ndisc_is_useropt(nd_opt)) {
291 ndopts->nd_useropts_end = nd_opt;
292 if (!ndopts->nd_useropts)
293 ndopts->nd_useropts = nd_opt;
294 } else {
295 /*
296 * Unknown options must be silently ignored,
297 * to accommodate future extension to the
298 * protocol.
299 */
300 ND_PRINTK2(KERN_NOTICE
301 "%s(): ignored unsupported option; type=%d, len=%d\n",
Harvey Harrison0dc47872008-03-05 20:47:47 -0800302 __func__,
Pierre Ynard31910572007-10-10 21:22:05 -0700303 nd_opt->nd_opt_type, nd_opt->nd_opt_len);
304 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700305 }
306 opt_len -= l;
307 nd_opt = ((void *)nd_opt) + l;
308 }
309 return ndopts;
310}
311
312static inline u8 *ndisc_opt_addr_data(struct nd_opt_hdr *p,
313 struct net_device *dev)
314{
315 u8 *lladdr = (u8 *)(p + 1);
316 int lladdrlen = p->nd_opt_len << 3;
317 int prepad = ndisc_addr_option_pad(dev->type);
318 if (lladdrlen != NDISC_OPT_SPACE(dev->addr_len + prepad))
319 return NULL;
320 return (lladdr + prepad);
321}
322
323int ndisc_mc_map(struct in6_addr *addr, char *buf, struct net_device *dev, int dir)
324{
325 switch (dev->type) {
326 case ARPHRD_ETHER:
327 case ARPHRD_IEEE802: /* Not sure. Check it later. --ANK */
328 case ARPHRD_FDDI:
329 ipv6_eth_mc_map(addr, buf);
330 return 0;
331 case ARPHRD_IEEE802_TR:
332 ipv6_tr_mc_map(addr,buf);
333 return 0;
334 case ARPHRD_ARCNET:
335 ipv6_arcnet_mc_map(addr, buf);
336 return 0;
337 case ARPHRD_INFINIBAND:
Rolf Manderscheida9e527e2007-12-10 13:38:41 -0700338 ipv6_ib_mc_map(addr, dev->broadcast, buf);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339 return 0;
340 default:
341 if (dir) {
342 memcpy(buf, dev->broadcast, dev->addr_len);
343 return 0;
344 }
345 }
346 return -EINVAL;
347}
348
YOSHIFUJI Hideaki71590392007-02-22 22:05:40 +0900349EXPORT_SYMBOL(ndisc_mc_map);
350
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351static u32 ndisc_hash(const void *pkey, const struct net_device *dev)
352{
353 const u32 *p32 = pkey;
354 u32 addr_hash, i;
355
356 addr_hash = 0;
357 for (i = 0; i < (sizeof(struct in6_addr) / sizeof(u32)); i++)
358 addr_hash ^= *p32++;
359
360 return jhash_2words(addr_hash, dev->ifindex, nd_tbl.hash_rnd);
361}
362
363static int ndisc_constructor(struct neighbour *neigh)
364{
365 struct in6_addr *addr = (struct in6_addr*)&neigh->primary_key;
366 struct net_device *dev = neigh->dev;
367 struct inet6_dev *in6_dev;
368 struct neigh_parms *parms;
369 int is_multicast = ipv6_addr_is_multicast(addr);
370
371 rcu_read_lock();
372 in6_dev = in6_dev_get(dev);
373 if (in6_dev == NULL) {
374 rcu_read_unlock();
375 return -EINVAL;
376 }
377
378 parms = in6_dev->nd_parms;
379 __neigh_parms_put(neigh->parms);
380 neigh->parms = neigh_parms_clone(parms);
381 rcu_read_unlock();
382
383 neigh->type = is_multicast ? RTN_MULTICAST : RTN_UNICAST;
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700384 if (!dev->header_ops) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700385 neigh->nud_state = NUD_NOARP;
386 neigh->ops = &ndisc_direct_ops;
387 neigh->output = neigh->ops->queue_xmit;
388 } else {
389 if (is_multicast) {
390 neigh->nud_state = NUD_NOARP;
391 ndisc_mc_map(addr, neigh->ha, dev, 1);
392 } else if (dev->flags&(IFF_NOARP|IFF_LOOPBACK)) {
393 neigh->nud_state = NUD_NOARP;
394 memcpy(neigh->ha, dev->dev_addr, dev->addr_len);
395 if (dev->flags&IFF_LOOPBACK)
396 neigh->type = RTN_LOCAL;
397 } else if (dev->flags&IFF_POINTOPOINT) {
398 neigh->nud_state = NUD_NOARP;
399 memcpy(neigh->ha, dev->broadcast, dev->addr_len);
400 }
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700401 if (dev->header_ops->cache)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700402 neigh->ops = &ndisc_hh_ops;
403 else
404 neigh->ops = &ndisc_generic_ops;
405 if (neigh->nud_state&NUD_VALID)
406 neigh->output = neigh->ops->connected_output;
407 else
408 neigh->output = neigh->ops->output;
409 }
410 in6_dev_put(in6_dev);
411 return 0;
412}
413
414static int pndisc_constructor(struct pneigh_entry *n)
415{
416 struct in6_addr *addr = (struct in6_addr*)&n->key;
417 struct in6_addr maddr;
418 struct net_device *dev = n->dev;
419
420 if (dev == NULL || __in6_dev_get(dev) == NULL)
421 return -EINVAL;
422 addrconf_addr_solict_mult(addr, &maddr);
423 ipv6_dev_mc_inc(dev, &maddr);
424 return 0;
425}
426
427static void pndisc_destructor(struct pneigh_entry *n)
428{
429 struct in6_addr *addr = (struct in6_addr*)&n->key;
430 struct in6_addr maddr;
431 struct net_device *dev = n->dev;
432
433 if (dev == NULL || __in6_dev_get(dev) == NULL)
434 return;
435 addrconf_addr_solict_mult(addr, &maddr);
436 ipv6_dev_mc_dec(dev, &maddr);
437}
438
439/*
440 * Send a Neighbour Advertisement
441 */
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900442static void __ndisc_send(struct net_device *dev,
443 struct neighbour *neigh,
444 struct in6_addr *daddr, struct in6_addr *saddr,
445 struct icmp6hdr *icmp6h, struct in6_addr *target,
David L Stevens14878f72007-09-16 16:52:35 -0700446 int llinfo)
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900447{
448 struct flowi fl;
449 struct dst_entry *dst;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900450 struct net *net = dev_net(dev);
Daniel Lezcano1762f7e2008-03-07 11:15:34 -0800451 struct sock *sk = net->ipv6.ndisc_sk;
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900452 struct sk_buff *skb;
453 struct icmp6hdr *hdr;
454 struct inet6_dev *idev;
455 int len;
456 int err;
David L Stevens14878f72007-09-16 16:52:35 -0700457 u8 *opt, type;
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900458
David L Stevens14878f72007-09-16 16:52:35 -0700459 type = icmp6h->icmp6_type;
460
Daniel Lezcano1762f7e2008-03-07 11:15:34 -0800461 icmpv6_flow_init(sk, &fl, type, saddr, daddr, dev->ifindex);
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900462
YOSHIFUJI Hideaki3b009442007-12-06 16:11:48 -0800463 dst = icmp6_dst_alloc(dev, neigh, daddr);
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900464 if (!dst)
465 return;
466
467 err = xfrm_lookup(&dst, &fl, NULL, 0);
468 if (err < 0)
469 return;
470
471 if (!dev->addr_len)
472 llinfo = 0;
473
474 len = sizeof(struct icmp6hdr) + (target ? sizeof(*target) : 0);
475 if (llinfo)
476 len += ndisc_opt_addr_space(dev);
477
478 skb = sock_alloc_send_skb(sk,
479 (MAX_HEADER + sizeof(struct ipv6hdr) +
480 len + LL_RESERVED_SPACE(dev)),
481 1, &err);
482 if (!skb) {
483 ND_PRINTK0(KERN_ERR
484 "ICMPv6 ND: %s() failed to allocate an skb.\n",
Harvey Harrison0dc47872008-03-05 20:47:47 -0800485 __func__);
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900486 dst_release(dst);
487 return;
488 }
489
490 skb_reserve(skb, LL_RESERVED_SPACE(dev));
491 ip6_nd_hdr(sk, skb, dev, saddr, daddr, IPPROTO_ICMPV6, len);
492
493 skb->transport_header = skb->tail;
494 skb_put(skb, len);
495
496 hdr = (struct icmp6hdr *)skb_transport_header(skb);
497 memcpy(hdr, icmp6h, sizeof(*hdr));
498
499 opt = skb_transport_header(skb) + sizeof(struct icmp6hdr);
500 if (target) {
501 ipv6_addr_copy((struct in6_addr *)opt, target);
502 opt += sizeof(*target);
503 }
504
505 if (llinfo)
506 ndisc_fill_addr_option(opt, llinfo, dev->dev_addr,
507 dev->addr_len, dev->type);
508
509 hdr->icmp6_cksum = csum_ipv6_magic(saddr, daddr, len,
510 IPPROTO_ICMPV6,
511 csum_partial((__u8 *) hdr,
512 len, 0));
513
514 skb->dst = dst;
515
516 idev = in6_dev_get(dst->dev);
517 IP6_INC_STATS(idev, IPSTATS_MIB_OUTREQUESTS);
518
Patrick McHardy6e23ae22007-11-19 18:53:30 -0800519 err = NF_HOOK(PF_INET6, NF_INET_LOCAL_OUT, skb, NULL, dst->dev,
520 dst_output);
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900521 if (!err) {
David L Stevens14878f72007-09-16 16:52:35 -0700522 ICMP6MSGOUT_INC_STATS(idev, type);
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900523 ICMP6_INC_STATS(idev, ICMP6_MIB_OUTMSGS);
524 }
525
526 if (likely(idev != NULL))
527 in6_dev_put(idev);
528}
529
Linus Torvalds1da177e2005-04-16 15:20:36 -0700530static void ndisc_send_na(struct net_device *dev, struct neighbour *neigh,
531 struct in6_addr *daddr, struct in6_addr *solicited_addr,
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900532 int router, int solicited, int override, int inc_opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700533{
534 struct in6_addr tmpaddr;
535 struct inet6_ifaddr *ifp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700536 struct in6_addr *src_addr;
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900537 struct icmp6hdr icmp6h = {
538 .icmp6_type = NDISC_NEIGHBOUR_ADVERTISEMENT,
539 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700540
541 /* for anycast or proxy, solicited_addr != src_addr */
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900542 ifp = ipv6_get_ifaddr(dev_net(dev), solicited_addr, dev, 1);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900543 if (ifp) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700544 src_addr = solicited_addr;
Neil Horman95c385b2007-04-25 17:08:10 -0700545 if (ifp->flags & IFA_F_OPTIMISTIC)
546 override = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700547 in6_ifa_put(ifp);
548 } else {
YOSHIFUJI Hideaki7cbca672008-03-25 09:37:42 +0900549 if (ipv6_dev_get_saddr(dev, daddr,
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900550 inet6_sk(dev_net(dev)->ipv6.ndisc_sk)->srcprefs,
YOSHIFUJI Hideaki7cbca672008-03-25 09:37:42 +0900551 &tmpaddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700552 return;
553 src_addr = &tmpaddr;
554 }
555
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900556 icmp6h.icmp6_router = router;
557 icmp6h.icmp6_solicited = solicited;
558 icmp6h.icmp6_override = override;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700559
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900560 __ndisc_send(dev, neigh, daddr, src_addr,
561 &icmp6h, solicited_addr,
David L Stevens14878f72007-09-16 16:52:35 -0700562 inc_opt ? ND_OPT_TARGET_LL_ADDR : 0);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900563}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700564
565void ndisc_send_ns(struct net_device *dev, struct neighbour *neigh,
566 struct in6_addr *solicit,
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900567 struct in6_addr *daddr, struct in6_addr *saddr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700568{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700569 struct in6_addr addr_buf;
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900570 struct icmp6hdr icmp6h = {
571 .icmp6_type = NDISC_NEIGHBOUR_SOLICITATION,
572 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700573
574 if (saddr == NULL) {
Neil Horman95c385b2007-04-25 17:08:10 -0700575 if (ipv6_get_lladdr(dev, &addr_buf,
576 (IFA_F_TENTATIVE|IFA_F_OPTIMISTIC)))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700577 return;
578 saddr = &addr_buf;
579 }
580
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900581 __ndisc_send(dev, neigh, daddr, saddr,
582 &icmp6h, solicit,
David L Stevens14878f72007-09-16 16:52:35 -0700583 !ipv6_addr_any(saddr) ? ND_OPT_SOURCE_LL_ADDR : 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700584}
585
586void ndisc_send_rs(struct net_device *dev, struct in6_addr *saddr,
587 struct in6_addr *daddr)
588{
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900589 struct icmp6hdr icmp6h = {
590 .icmp6_type = NDISC_ROUTER_SOLICITATION,
591 };
Neil Horman95c385b2007-04-25 17:08:10 -0700592 int send_sllao = dev->addr_len;
Neil Horman95c385b2007-04-25 17:08:10 -0700593
594#ifdef CONFIG_IPV6_OPTIMISTIC_DAD
595 /*
596 * According to section 2.2 of RFC 4429, we must not
597 * send router solicitations with a sllao from
598 * optimistic addresses, but we may send the solicitation
599 * if we don't include the sllao. So here we check
600 * if our address is optimistic, and if so, we
Joe Perchesbea85192007-12-20 14:01:35 -0800601 * suppress the inclusion of the sllao.
Neil Horman95c385b2007-04-25 17:08:10 -0700602 */
603 if (send_sllao) {
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900604 struct inet6_ifaddr *ifp = ipv6_get_ifaddr(dev_net(dev), saddr,
Daniel Lezcano1cab3da2008-01-10 22:44:09 -0800605 dev, 1);
Neil Horman95c385b2007-04-25 17:08:10 -0700606 if (ifp) {
607 if (ifp->flags & IFA_F_OPTIMISTIC) {
YOSHIFUJI Hideakica043562007-02-28 23:13:20 +0900608 send_sllao = 0;
Neil Horman95c385b2007-04-25 17:08:10 -0700609 }
YOSHIFUJI Hideakica043562007-02-28 23:13:20 +0900610 in6_ifa_put(ifp);
Neil Horman95c385b2007-04-25 17:08:10 -0700611 } else {
612 send_sllao = 0;
613 }
614 }
615#endif
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900616 __ndisc_send(dev, NULL, daddr, saddr,
617 &icmp6h, NULL,
David L Stevens14878f72007-09-16 16:52:35 -0700618 send_sllao ? ND_OPT_SOURCE_LL_ADDR : 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700619}
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900620
Linus Torvalds1da177e2005-04-16 15:20:36 -0700621
/*
 * error_report hook of the ndisc neigh_ops tables: signal a link
 * failure for the packet and free it.
 */
static void ndisc_error_report(struct neighbour *neigh, struct sk_buff *skb)
{
	/*
	 *	"The sender MUST return an ICMP
	 *	 destination unreachable"
	 */
	dst_link_failure(skb);

	kfree_skb(skb);
}
631
632/* Called with locked neigh: either read or both */
633
634static void ndisc_solicit(struct neighbour *neigh, struct sk_buff *skb)
635{
636 struct in6_addr *saddr = NULL;
637 struct in6_addr mcaddr;
638 struct net_device *dev = neigh->dev;
639 struct in6_addr *target = (struct in6_addr *)&neigh->primary_key;
640 int probes = atomic_read(&neigh->probes);
641
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900642 if (skb && ipv6_chk_addr(dev_net(dev), &ipv6_hdr(skb)->saddr, dev, 1))
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700643 saddr = &ipv6_hdr(skb)->saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700644
645 if ((probes -= neigh->parms->ucast_probes) < 0) {
646 if (!(neigh->nud_state & NUD_VALID)) {
647 ND_PRINTK1(KERN_DEBUG
648 "%s(): trying to ucast probe in NUD_INVALID: "
Joe Perches46b86a22006-01-13 14:29:07 -0800649 NIP6_FMT "\n",
Harvey Harrison0dc47872008-03-05 20:47:47 -0800650 __func__,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700651 NIP6(*target));
652 }
653 ndisc_send_ns(dev, neigh, target, target, saddr);
654 } else if ((probes -= neigh->parms->app_probes) < 0) {
655#ifdef CONFIG_ARPD
656 neigh_app_ns(neigh);
657#endif
658 } else {
659 addrconf_addr_solict_mult(target, &mcaddr);
660 ndisc_send_ns(dev, NULL, target, &mcaddr, saddr);
661 }
662}
663
YOSHIFUJI Hideaki0736ffc2008-03-28 13:37:58 +0900664static int pndisc_is_router(const void *pkey,
665 struct net_device *dev)
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700666{
667 struct pneigh_entry *n;
YOSHIFUJI Hideaki0736ffc2008-03-28 13:37:58 +0900668 int ret = -1;
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700669
670 read_lock_bh(&nd_tbl.lock);
YOSHIFUJI Hideaki0736ffc2008-03-28 13:37:58 +0900671 n = __pneigh_lookup(&nd_tbl, dev_net(dev), pkey, dev);
672 if (n)
673 ret = !!(n->flags & NTF_ROUTER);
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700674 read_unlock_bh(&nd_tbl.lock);
675
YOSHIFUJI Hideaki0736ffc2008-03-28 13:37:58 +0900676 return ret;
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700677}
678
Linus Torvalds1da177e2005-04-16 15:20:36 -0700679static void ndisc_recv_ns(struct sk_buff *skb)
680{
Arnaldo Carvalho de Melo9c702202007-04-25 18:04:18 -0700681 struct nd_msg *msg = (struct nd_msg *)skb_transport_header(skb);
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700682 struct in6_addr *saddr = &ipv6_hdr(skb)->saddr;
683 struct in6_addr *daddr = &ipv6_hdr(skb)->daddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700684 u8 *lladdr = NULL;
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -0700685 u32 ndoptlen = skb->tail - (skb->transport_header +
686 offsetof(struct nd_msg, opt));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700687 struct ndisc_options ndopts;
688 struct net_device *dev = skb->dev;
689 struct inet6_ifaddr *ifp;
690 struct inet6_dev *idev = NULL;
691 struct neighbour *neigh;
692 int dad = ipv6_addr_any(saddr);
693 int inc;
YOSHIFUJI Hideaki0736ffc2008-03-28 13:37:58 +0900694 int is_router = -1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700695
696 if (ipv6_addr_is_multicast(&msg->target)) {
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900697 ND_PRINTK2(KERN_WARNING
Linus Torvalds1da177e2005-04-16 15:20:36 -0700698 "ICMPv6 NS: multicast target address");
699 return;
700 }
701
702 /*
703 * RFC2461 7.1.1:
704 * DAD has to be destined for solicited node multicast address.
705 */
706 if (dad &&
707 !(daddr->s6_addr32[0] == htonl(0xff020000) &&
708 daddr->s6_addr32[1] == htonl(0x00000000) &&
709 daddr->s6_addr32[2] == htonl(0x00000001) &&
710 daddr->s6_addr [12] == 0xff )) {
711 ND_PRINTK2(KERN_WARNING
712 "ICMPv6 NS: bad DAD packet (wrong destination)\n");
713 return;
714 }
715
716 if (!ndisc_parse_options(msg->opt, ndoptlen, &ndopts)) {
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900717 ND_PRINTK2(KERN_WARNING
Linus Torvalds1da177e2005-04-16 15:20:36 -0700718 "ICMPv6 NS: invalid ND options\n");
719 return;
720 }
721
722 if (ndopts.nd_opts_src_lladdr) {
723 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_src_lladdr, dev);
724 if (!lladdr) {
725 ND_PRINTK2(KERN_WARNING
726 "ICMPv6 NS: invalid link-layer address length\n");
727 return;
728 }
729
730 /* RFC2461 7.1.1:
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900731 * If the IP source address is the unspecified address,
732 * there MUST NOT be source link-layer address option
Linus Torvalds1da177e2005-04-16 15:20:36 -0700733 * in the message.
734 */
735 if (dad) {
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900736 ND_PRINTK2(KERN_WARNING
Linus Torvalds1da177e2005-04-16 15:20:36 -0700737 "ICMPv6 NS: bad DAD packet (link-layer address option)\n");
738 return;
739 }
740 }
741
742 inc = ipv6_addr_is_multicast(daddr);
743
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900744 ifp = ipv6_get_ifaddr(dev_net(dev), &msg->target, dev, 1);
Daniel Lezcanoa18bc692008-03-07 11:14:49 -0800745 if (ifp) {
Neil Horman95c385b2007-04-25 17:08:10 -0700746
747 if (ifp->flags & (IFA_F_TENTATIVE|IFA_F_OPTIMISTIC)) {
748 if (dad) {
749 if (dev->type == ARPHRD_IEEE802_TR) {
Arnaldo Carvalho de Melo98e399f2007-03-19 15:33:04 -0700750 const unsigned char *sadr;
751 sadr = skb_mac_header(skb);
Neil Horman95c385b2007-04-25 17:08:10 -0700752 if (((sadr[8] ^ dev->dev_addr[0]) & 0x7f) == 0 &&
753 sadr[9] == dev->dev_addr[1] &&
754 sadr[10] == dev->dev_addr[2] &&
755 sadr[11] == dev->dev_addr[3] &&
756 sadr[12] == dev->dev_addr[4] &&
757 sadr[13] == dev->dev_addr[5]) {
758 /* looped-back to us */
759 goto out;
760 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700761 }
Neil Horman95c385b2007-04-25 17:08:10 -0700762
763 /*
764 * We are colliding with another node
765 * who is doing DAD
766 * so fail our DAD process
767 */
768 addrconf_dad_failure(ifp);
Denis V. Lunev9e3be4b2007-09-11 11:04:49 +0200769 return;
Neil Horman95c385b2007-04-25 17:08:10 -0700770 } else {
771 /*
772 * This is not a dad solicitation.
773 * If we are an optimistic node,
774 * we should respond.
775 * Otherwise, we should ignore it.
776 */
777 if (!(ifp->flags & IFA_F_OPTIMISTIC))
778 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700779 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700780 }
781
782 idev = ifp->idev;
783 } else {
784 idev = in6_dev_get(dev);
785 if (!idev) {
786 /* XXX: count this drop? */
787 return;
788 }
789
Daniel Lezcano6ab57e72008-03-26 16:52:32 -0700790 if (ipv6_chk_acast_addr(dev_net(dev), dev, &msg->target) ||
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900791 (idev->cnf.forwarding &&
YOSHIFUJI Hideakifbea49e2006-09-22 14:43:49 -0700792 (ipv6_devconf.proxy_ndp || idev->cnf.proxy_ndp) &&
YOSHIFUJI Hideaki0736ffc2008-03-28 13:37:58 +0900793 (is_router = pndisc_is_router(&msg->target, dev)) >= 0)) {
Patrick McHardya61bbcf2005-08-14 17:24:31 -0700794 if (!(NEIGH_CB(skb)->flags & LOCALLY_ENQUEUED) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700795 skb->pkt_type != PACKET_HOST &&
796 inc != 0 &&
797 idev->nd_parms->proxy_delay != 0) {
798 /*
799 * for anycast or proxy,
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900800 * sender should delay its response
801 * by a random time between 0 and
Linus Torvalds1da177e2005-04-16 15:20:36 -0700802 * MAX_ANYCAST_DELAY_TIME seconds.
803 * (RFC2461) -- yoshfuji
804 */
805 struct sk_buff *n = skb_clone(skb, GFP_ATOMIC);
806 if (n)
807 pneigh_enqueue(&nd_tbl, idev->nd_parms, n);
808 goto out;
809 }
810 } else
811 goto out;
812 }
813
YOSHIFUJI Hideaki0736ffc2008-03-28 13:37:58 +0900814 if (is_router < 0)
815 is_router = !!idev->cnf.forwarding;
Ville Nuorvala62dd9312006-09-22 14:43:19 -0700816
Linus Torvalds1da177e2005-04-16 15:20:36 -0700817 if (dad) {
818 struct in6_addr maddr;
819
820 ipv6_addr_all_nodes(&maddr);
821 ndisc_send_na(dev, NULL, &maddr, &msg->target,
Ville Nuorvala62dd9312006-09-22 14:43:19 -0700822 is_router, 0, (ifp != NULL), 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700823 goto out;
824 }
825
826 if (inc)
827 NEIGH_CACHE_STAT_INC(&nd_tbl, rcv_probes_mcast);
828 else
829 NEIGH_CACHE_STAT_INC(&nd_tbl, rcv_probes_ucast);
830
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900831 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700832 * update / create cache entry
833 * for the source address
834 */
835 neigh = __neigh_lookup(&nd_tbl, saddr, dev,
836 !inc || lladdr || !dev->addr_len);
837 if (neigh)
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900838 neigh_update(neigh, lladdr, NUD_STALE,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700839 NEIGH_UPDATE_F_WEAK_OVERRIDE|
840 NEIGH_UPDATE_F_OVERRIDE);
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700841 if (neigh || !dev->header_ops) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700842 ndisc_send_na(dev, neigh, saddr, &msg->target,
Ville Nuorvala62dd9312006-09-22 14:43:19 -0700843 is_router,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700844 1, (ifp != NULL && inc), inc);
845 if (neigh)
846 neigh_release(neigh);
847 }
848
849out:
850 if (ifp)
851 in6_ifa_put(ifp);
852 else
853 in6_dev_put(idev);
854
855 return;
856}
857
858static void ndisc_recv_na(struct sk_buff *skb)
859{
Arnaldo Carvalho de Melo9c702202007-04-25 18:04:18 -0700860 struct nd_msg *msg = (struct nd_msg *)skb_transport_header(skb);
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700861 struct in6_addr *saddr = &ipv6_hdr(skb)->saddr;
862 struct in6_addr *daddr = &ipv6_hdr(skb)->daddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700863 u8 *lladdr = NULL;
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -0700864 u32 ndoptlen = skb->tail - (skb->transport_header +
865 offsetof(struct nd_msg, opt));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700866 struct ndisc_options ndopts;
867 struct net_device *dev = skb->dev;
868 struct inet6_ifaddr *ifp;
869 struct neighbour *neigh;
870
871 if (skb->len < sizeof(struct nd_msg)) {
872 ND_PRINTK2(KERN_WARNING
873 "ICMPv6 NA: packet too short\n");
874 return;
875 }
876
877 if (ipv6_addr_is_multicast(&msg->target)) {
878 ND_PRINTK2(KERN_WARNING
879 "ICMPv6 NA: target address is multicast.\n");
880 return;
881 }
882
883 if (ipv6_addr_is_multicast(daddr) &&
884 msg->icmph.icmp6_solicited) {
885 ND_PRINTK2(KERN_WARNING
886 "ICMPv6 NA: solicited NA is multicasted.\n");
887 return;
888 }
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900889
Linus Torvalds1da177e2005-04-16 15:20:36 -0700890 if (!ndisc_parse_options(msg->opt, ndoptlen, &ndopts)) {
891 ND_PRINTK2(KERN_WARNING
892 "ICMPv6 NS: invalid ND option\n");
893 return;
894 }
895 if (ndopts.nd_opts_tgt_lladdr) {
896 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_tgt_lladdr, dev);
897 if (!lladdr) {
898 ND_PRINTK2(KERN_WARNING
899 "ICMPv6 NA: invalid link-layer address length\n");
900 return;
901 }
902 }
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900903 ifp = ipv6_get_ifaddr(dev_net(dev), &msg->target, dev, 1);
Daniel Lezcanoa18bc692008-03-07 11:14:49 -0800904 if (ifp) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700905 if (ifp->flags & IFA_F_TENTATIVE) {
906 addrconf_dad_failure(ifp);
907 return;
908 }
909 /* What should we make now? The advertisement
910 is invalid, but ndisc specs say nothing
911 about it. It could be misconfiguration, or
912 an smart proxy agent tries to help us :-)
913 */
914 ND_PRINTK1(KERN_WARNING
915 "ICMPv6 NA: someone advertises our address on %s!\n",
916 ifp->idev->dev->name);
917 in6_ifa_put(ifp);
918 return;
919 }
920 neigh = neigh_lookup(&nd_tbl, &msg->target, dev);
921
922 if (neigh) {
923 u8 old_flags = neigh->flags;
924
925 if (neigh->nud_state & NUD_FAILED)
926 goto out;
927
Ville Nuorvala5f3e6e92006-09-22 14:42:46 -0700928 /*
929 * Don't update the neighbor cache entry on a proxy NA from
930 * ourselves because either the proxied node is off link or it
931 * has already sent a NA to us.
932 */
933 if (lladdr && !memcmp(lladdr, dev->dev_addr, dev->addr_len) &&
YOSHIFUJI Hideakifbea49e2006-09-22 14:43:49 -0700934 ipv6_devconf.forwarding && ipv6_devconf.proxy_ndp &&
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900935 pneigh_lookup(&nd_tbl, dev_net(dev), &msg->target, dev, 0)) {
YOSHIFUJI Hideakifbea49e2006-09-22 14:43:49 -0700936 /* XXX: idev->cnf.prixy_ndp */
Ville Nuorvala5f3e6e92006-09-22 14:42:46 -0700937 goto out;
YOSHIFUJI Hideakifbea49e2006-09-22 14:43:49 -0700938 }
Ville Nuorvala5f3e6e92006-09-22 14:42:46 -0700939
Linus Torvalds1da177e2005-04-16 15:20:36 -0700940 neigh_update(neigh, lladdr,
941 msg->icmph.icmp6_solicited ? NUD_REACHABLE : NUD_STALE,
942 NEIGH_UPDATE_F_WEAK_OVERRIDE|
943 (msg->icmph.icmp6_override ? NEIGH_UPDATE_F_OVERRIDE : 0)|
944 NEIGH_UPDATE_F_OVERRIDE_ISROUTER|
945 (msg->icmph.icmp6_router ? NEIGH_UPDATE_F_ISROUTER : 0));
946
947 if ((old_flags & ~neigh->flags) & NTF_ROUTER) {
948 /*
949 * Change: router to host
950 */
951 struct rt6_info *rt;
952 rt = rt6_get_dflt_router(saddr, dev);
953 if (rt)
Thomas Grafe0a1ad732006-08-22 00:00:21 -0700954 ip6_del_rt(rt);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700955 }
956
957out:
958 neigh_release(neigh);
959 }
960}
961
962static void ndisc_recv_rs(struct sk_buff *skb)
963{
Arnaldo Carvalho de Melo9c702202007-04-25 18:04:18 -0700964 struct rs_msg *rs_msg = (struct rs_msg *)skb_transport_header(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700965 unsigned long ndoptlen = skb->len - sizeof(*rs_msg);
966 struct neighbour *neigh;
967 struct inet6_dev *idev;
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700968 struct in6_addr *saddr = &ipv6_hdr(skb)->saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700969 struct ndisc_options ndopts;
970 u8 *lladdr = NULL;
971
972 if (skb->len < sizeof(*rs_msg))
973 return;
974
975 idev = in6_dev_get(skb->dev);
976 if (!idev) {
977 if (net_ratelimit())
978 ND_PRINTK1("ICMP6 RS: can't find in6 device\n");
979 return;
980 }
981
982 /* Don't accept RS if we're not in router mode */
983 if (!idev->cnf.forwarding)
984 goto out;
985
986 /*
987 * Don't update NCE if src = ::;
988 * this implies that the source node has no ip address assigned yet.
989 */
990 if (ipv6_addr_any(saddr))
991 goto out;
992
993 /* Parse ND options */
994 if (!ndisc_parse_options(rs_msg->opt, ndoptlen, &ndopts)) {
995 if (net_ratelimit())
996 ND_PRINTK2("ICMP6 NS: invalid ND option, ignored\n");
997 goto out;
998 }
999
1000 if (ndopts.nd_opts_src_lladdr) {
1001 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_src_lladdr,
1002 skb->dev);
1003 if (!lladdr)
1004 goto out;
1005 }
1006
1007 neigh = __neigh_lookup(&nd_tbl, saddr, skb->dev, 1);
1008 if (neigh) {
1009 neigh_update(neigh, lladdr, NUD_STALE,
1010 NEIGH_UPDATE_F_WEAK_OVERRIDE|
1011 NEIGH_UPDATE_F_OVERRIDE|
1012 NEIGH_UPDATE_F_OVERRIDE_ISROUTER);
1013 neigh_release(neigh);
1014 }
1015out:
1016 in6_dev_put(idev);
1017}
1018
Pierre Ynard31910572007-10-10 21:22:05 -07001019static void ndisc_ra_useropt(struct sk_buff *ra, struct nd_opt_hdr *opt)
1020{
1021 struct icmp6hdr *icmp6h = (struct icmp6hdr *)skb_transport_header(ra);
1022 struct sk_buff *skb;
1023 struct nlmsghdr *nlh;
1024 struct nduseroptmsg *ndmsg;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001025 struct net *net = dev_net(ra->dev);
Pierre Ynard31910572007-10-10 21:22:05 -07001026 int err;
1027 int base_size = NLMSG_ALIGN(sizeof(struct nduseroptmsg)
1028 + (opt->nd_opt_len << 3));
1029 size_t msg_size = base_size + nla_total_size(sizeof(struct in6_addr));
1030
1031 skb = nlmsg_new(msg_size, GFP_ATOMIC);
1032 if (skb == NULL) {
1033 err = -ENOBUFS;
1034 goto errout;
1035 }
1036
1037 nlh = nlmsg_put(skb, 0, 0, RTM_NEWNDUSEROPT, base_size, 0);
1038 if (nlh == NULL) {
1039 goto nla_put_failure;
1040 }
1041
1042 ndmsg = nlmsg_data(nlh);
1043 ndmsg->nduseropt_family = AF_INET6;
Pierre Ynarddbb2ed22007-11-12 17:58:35 -08001044 ndmsg->nduseropt_ifindex = ra->dev->ifindex;
Pierre Ynard31910572007-10-10 21:22:05 -07001045 ndmsg->nduseropt_icmp_type = icmp6h->icmp6_type;
1046 ndmsg->nduseropt_icmp_code = icmp6h->icmp6_code;
1047 ndmsg->nduseropt_opts_len = opt->nd_opt_len << 3;
1048
1049 memcpy(ndmsg + 1, opt, opt->nd_opt_len << 3);
1050
1051 NLA_PUT(skb, NDUSEROPT_SRCADDR, sizeof(struct in6_addr),
1052 &ipv6_hdr(ra)->saddr);
1053 nlmsg_end(skb, nlh);
1054
Daniel Lezcanoa18bc692008-03-07 11:14:49 -08001055 err = rtnl_notify(skb, net, 0, RTNLGRP_ND_USEROPT, NULL,
Denis V. Lunev97c53ca2007-11-19 22:26:51 -08001056 GFP_ATOMIC);
Pierre Ynard31910572007-10-10 21:22:05 -07001057 if (err < 0)
1058 goto errout;
1059
1060 return;
1061
1062nla_put_failure:
1063 nlmsg_free(skb);
1064 err = -EMSGSIZE;
1065errout:
Daniel Lezcanoa18bc692008-03-07 11:14:49 -08001066 rtnl_set_sk_err(net, RTNLGRP_ND_USEROPT, err);
Pierre Ynard31910572007-10-10 21:22:05 -07001067}
1068
Linus Torvalds1da177e2005-04-16 15:20:36 -07001069static void ndisc_router_discovery(struct sk_buff *skb)
1070{
Arnaldo Carvalho de Melo9c702202007-04-25 18:04:18 -07001071 struct ra_msg *ra_msg = (struct ra_msg *)skb_transport_header(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001072 struct neighbour *neigh = NULL;
1073 struct inet6_dev *in6_dev;
YOSHIFUJI Hideaki65f5c7c2006-03-20 16:55:08 -08001074 struct rt6_info *rt = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001075 int lifetime;
1076 struct ndisc_options ndopts;
1077 int optlen;
YOSHIFUJI Hideakiebacaaa2006-03-20 17:04:53 -08001078 unsigned int pref = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001079
1080 __u8 * opt = (__u8 *)(ra_msg + 1);
1081
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -07001082 optlen = (skb->tail - skb->transport_header) - sizeof(struct ra_msg);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001083
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001084 if (!(ipv6_addr_type(&ipv6_hdr(skb)->saddr) & IPV6_ADDR_LINKLOCAL)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001085 ND_PRINTK2(KERN_WARNING
1086 "ICMPv6 RA: source address is not link-local.\n");
1087 return;
1088 }
1089 if (optlen < 0) {
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001090 ND_PRINTK2(KERN_WARNING
Linus Torvalds1da177e2005-04-16 15:20:36 -07001091 "ICMPv6 RA: packet too short\n");
1092 return;
1093 }
1094
1095 /*
1096 * set the RA_RECV flag in the interface
1097 */
1098
1099 in6_dev = in6_dev_get(skb->dev);
1100 if (in6_dev == NULL) {
1101 ND_PRINTK0(KERN_ERR
1102 "ICMPv6 RA: can't find inet6 device for %s.\n",
1103 skb->dev->name);
1104 return;
1105 }
1106 if (in6_dev->cnf.forwarding || !in6_dev->cnf.accept_ra) {
1107 in6_dev_put(in6_dev);
1108 return;
1109 }
1110
1111 if (!ndisc_parse_options(opt, optlen, &ndopts)) {
1112 in6_dev_put(in6_dev);
1113 ND_PRINTK2(KERN_WARNING
1114 "ICMP6 RA: invalid ND options\n");
1115 return;
1116 }
1117
1118 if (in6_dev->if_flags & IF_RS_SENT) {
1119 /*
1120 * flag that an RA was received after an RS was sent
1121 * out on this interface.
1122 */
1123 in6_dev->if_flags |= IF_RA_RCVD;
1124 }
1125
1126 /*
1127 * Remember the managed/otherconf flags from most recently
1128 * received RA message (RFC 2462) -- yoshfuji
1129 */
1130 in6_dev->if_flags = (in6_dev->if_flags & ~(IF_RA_MANAGED |
1131 IF_RA_OTHERCONF)) |
1132 (ra_msg->icmph.icmp6_addrconf_managed ?
1133 IF_RA_MANAGED : 0) |
1134 (ra_msg->icmph.icmp6_addrconf_other ?
1135 IF_RA_OTHERCONF : 0);
1136
YOSHIFUJI Hideaki65f5c7c2006-03-20 16:55:08 -08001137 if (!in6_dev->cnf.accept_ra_defrtr)
1138 goto skip_defrtr;
1139
Linus Torvalds1da177e2005-04-16 15:20:36 -07001140 lifetime = ntohs(ra_msg->icmph.icmp6_rt_lifetime);
1141
YOSHIFUJI Hideakiebacaaa2006-03-20 17:04:53 -08001142#ifdef CONFIG_IPV6_ROUTER_PREF
1143 pref = ra_msg->icmph.icmp6_router_pref;
1144 /* 10b is handled as if it were 00b (medium) */
YOSHIFUJI Hideaki930d6ff2006-03-20 17:05:30 -08001145 if (pref == ICMPV6_ROUTER_PREF_INVALID ||
YOSHIFUJI Hideaki6d5b78c2007-06-22 16:07:04 -07001146 !in6_dev->cnf.accept_ra_rtr_pref)
YOSHIFUJI Hideakiebacaaa2006-03-20 17:04:53 -08001147 pref = ICMPV6_ROUTER_PREF_MEDIUM;
1148#endif
1149
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001150 rt = rt6_get_dflt_router(&ipv6_hdr(skb)->saddr, skb->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001151
1152 if (rt)
1153 neigh = rt->rt6i_nexthop;
1154
1155 if (rt && lifetime == 0) {
1156 neigh_clone(neigh);
Thomas Grafe0a1ad732006-08-22 00:00:21 -07001157 ip6_del_rt(rt);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001158 rt = NULL;
1159 }
1160
1161 if (rt == NULL && lifetime) {
1162 ND_PRINTK3(KERN_DEBUG
1163 "ICMPv6 RA: adding default router.\n");
1164
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001165 rt = rt6_add_dflt_router(&ipv6_hdr(skb)->saddr, skb->dev, pref);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001166 if (rt == NULL) {
1167 ND_PRINTK0(KERN_ERR
1168 "ICMPv6 RA: %s() failed to add default route.\n",
Harvey Harrison0dc47872008-03-05 20:47:47 -08001169 __func__);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001170 in6_dev_put(in6_dev);
1171 return;
1172 }
1173
1174 neigh = rt->rt6i_nexthop;
1175 if (neigh == NULL) {
1176 ND_PRINTK0(KERN_ERR
1177 "ICMPv6 RA: %s() got default router without neighbour.\n",
Harvey Harrison0dc47872008-03-05 20:47:47 -08001178 __func__);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001179 dst_release(&rt->u.dst);
1180 in6_dev_put(in6_dev);
1181 return;
1182 }
1183 neigh->flags |= NTF_ROUTER;
YOSHIFUJI Hideakiebacaaa2006-03-20 17:04:53 -08001184 } else if (rt) {
1185 rt->rt6i_flags |= (rt->rt6i_flags & ~RTF_PREF_MASK) | RTF_PREF(pref);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001186 }
1187
1188 if (rt)
1189 rt->rt6i_expires = jiffies + (HZ * lifetime);
1190
1191 if (ra_msg->icmph.icmp6_hop_limit) {
1192 in6_dev->cnf.hop_limit = ra_msg->icmph.icmp6_hop_limit;
1193 if (rt)
1194 rt->u.dst.metrics[RTAX_HOPLIMIT-1] = ra_msg->icmph.icmp6_hop_limit;
1195 }
1196
YOSHIFUJI Hideaki65f5c7c2006-03-20 16:55:08 -08001197skip_defrtr:
1198
Linus Torvalds1da177e2005-04-16 15:20:36 -07001199 /*
1200 * Update Reachable Time and Retrans Timer
1201 */
1202
1203 if (in6_dev->nd_parms) {
1204 unsigned long rtime = ntohl(ra_msg->retrans_timer);
1205
1206 if (rtime && rtime/1000 < MAX_SCHEDULE_TIMEOUT/HZ) {
1207 rtime = (rtime*HZ)/1000;
1208 if (rtime < HZ/10)
1209 rtime = HZ/10;
1210 in6_dev->nd_parms->retrans_time = rtime;
1211 in6_dev->tstamp = jiffies;
1212 inet6_ifinfo_notify(RTM_NEWLINK, in6_dev);
1213 }
1214
1215 rtime = ntohl(ra_msg->reachable_time);
1216 if (rtime && rtime/1000 < MAX_SCHEDULE_TIMEOUT/(3*HZ)) {
1217 rtime = (rtime*HZ)/1000;
1218
1219 if (rtime < HZ/10)
1220 rtime = HZ/10;
1221
1222 if (rtime != in6_dev->nd_parms->base_reachable_time) {
1223 in6_dev->nd_parms->base_reachable_time = rtime;
1224 in6_dev->nd_parms->gc_staletime = 3 * rtime;
1225 in6_dev->nd_parms->reachable_time = neigh_rand_reach_time(rtime);
1226 in6_dev->tstamp = jiffies;
1227 inet6_ifinfo_notify(RTM_NEWLINK, in6_dev);
1228 }
1229 }
1230 }
1231
1232 /*
1233 * Process options.
1234 */
1235
1236 if (!neigh)
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001237 neigh = __neigh_lookup(&nd_tbl, &ipv6_hdr(skb)->saddr,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001238 skb->dev, 1);
1239 if (neigh) {
1240 u8 *lladdr = NULL;
1241 if (ndopts.nd_opts_src_lladdr) {
1242 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_src_lladdr,
1243 skb->dev);
1244 if (!lladdr) {
1245 ND_PRINTK2(KERN_WARNING
1246 "ICMPv6 RA: invalid link-layer address length\n");
1247 goto out;
1248 }
1249 }
1250 neigh_update(neigh, lladdr, NUD_STALE,
1251 NEIGH_UPDATE_F_WEAK_OVERRIDE|
1252 NEIGH_UPDATE_F_OVERRIDE|
1253 NEIGH_UPDATE_F_OVERRIDE_ISROUTER|
1254 NEIGH_UPDATE_F_ISROUTER);
1255 }
1256
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001257#ifdef CONFIG_IPV6_ROUTE_INFO
YOSHIFUJI Hideaki09c884d2006-03-20 17:07:03 -08001258 if (in6_dev->cnf.accept_ra_rtr_pref && ndopts.nd_opts_ri) {
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001259 struct nd_opt_hdr *p;
1260 for (p = ndopts.nd_opts_ri;
1261 p;
1262 p = ndisc_next_option(p, ndopts.nd_opts_ri_end)) {
YOSHIFUJI Hideaki09c884d2006-03-20 17:07:03 -08001263 if (((struct route_info *)p)->prefix_len > in6_dev->cnf.accept_ra_rt_info_max_plen)
1264 continue;
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001265 rt6_route_rcv(skb->dev, (u8*)p, (p->nd_opt_len) << 3,
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001266 &ipv6_hdr(skb)->saddr);
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001267 }
1268 }
1269#endif
1270
YOSHIFUJI Hideakic4fd30e2006-03-20 16:55:26 -08001271 if (in6_dev->cnf.accept_ra_pinfo && ndopts.nd_opts_pi) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001272 struct nd_opt_hdr *p;
1273 for (p = ndopts.nd_opts_pi;
1274 p;
1275 p = ndisc_next_option(p, ndopts.nd_opts_pi_end)) {
1276 addrconf_prefix_rcv(skb->dev, (u8*)p, (p->nd_opt_len) << 3);
1277 }
1278 }
1279
1280 if (ndopts.nd_opts_mtu) {
Al Viroe69a4ad2006-11-14 20:56:00 -08001281 __be32 n;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001282 u32 mtu;
1283
Al Viroe69a4ad2006-11-14 20:56:00 -08001284 memcpy(&n, ((u8*)(ndopts.nd_opts_mtu+1))+2, sizeof(mtu));
1285 mtu = ntohl(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001286
1287 if (mtu < IPV6_MIN_MTU || mtu > skb->dev->mtu) {
1288 ND_PRINTK2(KERN_WARNING
1289 "ICMPv6 RA: invalid mtu: %d\n",
1290 mtu);
1291 } else if (in6_dev->cnf.mtu6 != mtu) {
1292 in6_dev->cnf.mtu6 = mtu;
1293
1294 if (rt)
1295 rt->u.dst.metrics[RTAX_MTU-1] = mtu;
1296
1297 rt6_mtu_change(skb->dev, mtu);
1298 }
1299 }
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001300
Pierre Ynard31910572007-10-10 21:22:05 -07001301 if (ndopts.nd_useropts) {
YOSHIFUJI Hideaki61cf46ad2008-01-22 17:32:53 +09001302 struct nd_opt_hdr *p;
1303 for (p = ndopts.nd_useropts;
1304 p;
1305 p = ndisc_next_useropt(p, ndopts.nd_useropts_end)) {
1306 ndisc_ra_useropt(skb, p);
Pierre Ynard31910572007-10-10 21:22:05 -07001307 }
1308 }
1309
Linus Torvalds1da177e2005-04-16 15:20:36 -07001310 if (ndopts.nd_opts_tgt_lladdr || ndopts.nd_opts_rh) {
1311 ND_PRINTK2(KERN_WARNING
1312 "ICMPv6 RA: invalid RA options");
1313 }
1314out:
1315 if (rt)
1316 dst_release(&rt->u.dst);
1317 else if (neigh)
1318 neigh_release(neigh);
1319 in6_dev_put(in6_dev);
1320}
1321
1322static void ndisc_redirect_rcv(struct sk_buff *skb)
1323{
1324 struct inet6_dev *in6_dev;
1325 struct icmp6hdr *icmph;
1326 struct in6_addr *dest;
1327 struct in6_addr *target; /* new first hop to destination */
1328 struct neighbour *neigh;
1329 int on_link = 0;
1330 struct ndisc_options ndopts;
1331 int optlen;
1332 u8 *lladdr = NULL;
1333
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001334 if (!(ipv6_addr_type(&ipv6_hdr(skb)->saddr) & IPV6_ADDR_LINKLOCAL)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001335 ND_PRINTK2(KERN_WARNING
1336 "ICMPv6 Redirect: source address is not link-local.\n");
1337 return;
1338 }
1339
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -07001340 optlen = skb->tail - skb->transport_header;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001341 optlen -= sizeof(struct icmp6hdr) + 2 * sizeof(struct in6_addr);
1342
1343 if (optlen < 0) {
1344 ND_PRINTK2(KERN_WARNING
1345 "ICMPv6 Redirect: packet too short\n");
1346 return;
1347 }
1348
Arnaldo Carvalho de Melocc70ab22007-03-13 14:03:22 -03001349 icmph = icmp6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001350 target = (struct in6_addr *) (icmph + 1);
1351 dest = target + 1;
1352
1353 if (ipv6_addr_is_multicast(dest)) {
1354 ND_PRINTK2(KERN_WARNING
1355 "ICMPv6 Redirect: destination address is multicast.\n");
1356 return;
1357 }
1358
1359 if (ipv6_addr_equal(dest, target)) {
1360 on_link = 1;
Brian Haleybf0b48d2007-10-08 00:12:05 -07001361 } else if (ipv6_addr_type(target) !=
1362 (IPV6_ADDR_UNICAST|IPV6_ADDR_LINKLOCAL)) {
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001363 ND_PRINTK2(KERN_WARNING
Brian Haleybf0b48d2007-10-08 00:12:05 -07001364 "ICMPv6 Redirect: target address is not link-local unicast.\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001365 return;
1366 }
1367
1368 in6_dev = in6_dev_get(skb->dev);
1369 if (!in6_dev)
1370 return;
1371 if (in6_dev->cnf.forwarding || !in6_dev->cnf.accept_redirects) {
1372 in6_dev_put(in6_dev);
1373 return;
1374 }
1375
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001376 /* RFC2461 8.1:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001377 * The IP source address of the Redirect MUST be the same as the current
1378 * first-hop router for the specified ICMP Destination Address.
1379 */
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001380
Linus Torvalds1da177e2005-04-16 15:20:36 -07001381 if (!ndisc_parse_options((u8*)(dest + 1), optlen, &ndopts)) {
1382 ND_PRINTK2(KERN_WARNING
1383 "ICMPv6 Redirect: invalid ND options\n");
1384 in6_dev_put(in6_dev);
1385 return;
1386 }
1387 if (ndopts.nd_opts_tgt_lladdr) {
1388 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_tgt_lladdr,
1389 skb->dev);
1390 if (!lladdr) {
1391 ND_PRINTK2(KERN_WARNING
1392 "ICMPv6 Redirect: invalid link-layer address length\n");
1393 in6_dev_put(in6_dev);
1394 return;
1395 }
1396 }
1397
1398 neigh = __neigh_lookup(&nd_tbl, target, skb->dev, 1);
1399 if (neigh) {
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001400 rt6_redirect(dest, &ipv6_hdr(skb)->daddr,
1401 &ipv6_hdr(skb)->saddr, neigh, lladdr,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001402 on_link);
1403 neigh_release(neigh);
1404 }
1405 in6_dev_put(in6_dev);
1406}
1407
1408void ndisc_send_redirect(struct sk_buff *skb, struct neighbour *neigh,
1409 struct in6_addr *target)
1410{
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001411 struct net_device *dev = skb->dev;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001412 struct net *net = dev_net(dev);
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001413 struct sock *sk = net->ipv6.ndisc_sk;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001414 int len = sizeof(struct icmp6hdr) + 2 * sizeof(struct in6_addr);
1415 struct sk_buff *buff;
1416 struct icmp6hdr *icmph;
1417 struct in6_addr saddr_buf;
1418 struct in6_addr *addrp;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001419 struct rt6_info *rt;
1420 struct dst_entry *dst;
1421 struct inet6_dev *idev;
1422 struct flowi fl;
1423 u8 *opt;
1424 int rd_len;
1425 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001426 u8 ha_buf[MAX_ADDR_LEN], *ha = NULL;
1427
Neil Horman95c385b2007-04-25 17:08:10 -07001428 if (ipv6_get_lladdr(dev, &saddr_buf, IFA_F_TENTATIVE)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001429 ND_PRINTK2(KERN_WARNING
1430 "ICMPv6 Redirect: no link-local address on %s\n",
1431 dev->name);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001432 return;
1433 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001434
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001435 if (!ipv6_addr_equal(&ipv6_hdr(skb)->daddr, target) &&
Brian Haleybf0b48d2007-10-08 00:12:05 -07001436 ipv6_addr_type(target) != (IPV6_ADDR_UNICAST|IPV6_ADDR_LINKLOCAL)) {
Li Yewang29556522007-01-30 14:33:20 -08001437 ND_PRINTK2(KERN_WARNING
Brian Haleybf0b48d2007-10-08 00:12:05 -07001438 "ICMPv6 Redirect: target address is not link-local unicast.\n");
Li Yewang29556522007-01-30 14:33:20 -08001439 return;
1440 }
1441
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001442 icmpv6_flow_init(sk, &fl, NDISC_REDIRECT,
YOSHIFUJI Hideaki95e41e92007-12-06 15:43:30 -08001443 &saddr_buf, &ipv6_hdr(skb)->saddr, dev->ifindex);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001444
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001445 dst = ip6_route_output(net, NULL, &fl);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001446 if (dst == NULL)
1447 return;
1448
1449 err = xfrm_lookup(&dst, &fl, NULL, 0);
Patrick McHardye104411b2005-09-08 15:11:55 -07001450 if (err)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001451 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001452
1453 rt = (struct rt6_info *) dst;
1454
1455 if (rt->rt6i_flags & RTF_GATEWAY) {
1456 ND_PRINTK2(KERN_WARNING
1457 "ICMPv6 Redirect: destination is not a neighbour.\n");
1458 dst_release(dst);
1459 return;
1460 }
1461 if (!xrlim_allow(dst, 1*HZ)) {
1462 dst_release(dst);
1463 return;
1464 }
1465
1466 if (dev->addr_len) {
1467 read_lock_bh(&neigh->lock);
1468 if (neigh->nud_state & NUD_VALID) {
1469 memcpy(ha_buf, neigh->ha, dev->addr_len);
1470 read_unlock_bh(&neigh->lock);
1471 ha = ha_buf;
1472 len += ndisc_opt_addr_space(dev);
1473 } else
1474 read_unlock_bh(&neigh->lock);
1475 }
1476
1477 rd_len = min_t(unsigned int,
1478 IPV6_MIN_MTU-sizeof(struct ipv6hdr)-len, skb->len + 8);
1479 rd_len &= ~0x7;
1480 len += rd_len;
1481
David S. Millerd54a81d2006-12-02 21:00:06 -08001482 buff = sock_alloc_send_skb(sk,
1483 (MAX_HEADER + sizeof(struct ipv6hdr) +
1484 len + LL_RESERVED_SPACE(dev)),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001485 1, &err);
1486 if (buff == NULL) {
1487 ND_PRINTK0(KERN_ERR
1488 "ICMPv6 Redirect: %s() failed to allocate an skb.\n",
Harvey Harrison0dc47872008-03-05 20:47:47 -08001489 __func__);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001490 dst_release(dst);
1491 return;
1492 }
1493
Linus Torvalds1da177e2005-04-16 15:20:36 -07001494 skb_reserve(buff, LL_RESERVED_SPACE(dev));
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001495 ip6_nd_hdr(sk, buff, dev, &saddr_buf, &ipv6_hdr(skb)->saddr,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001496 IPPROTO_ICMPV6, len);
1497
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -07001498 skb_set_transport_header(buff, skb_tail_pointer(buff) - buff->data);
Arnaldo Carvalho de Melod10ba342007-03-14 21:05:37 -03001499 skb_put(buff, len);
1500 icmph = icmp6_hdr(buff);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001501
1502 memset(icmph, 0, sizeof(struct icmp6hdr));
1503 icmph->icmp6_type = NDISC_REDIRECT;
1504
1505 /*
1506 * copy target and destination addresses
1507 */
1508
1509 addrp = (struct in6_addr *)(icmph + 1);
1510 ipv6_addr_copy(addrp, target);
1511 addrp++;
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001512 ipv6_addr_copy(addrp, &ipv6_hdr(skb)->daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001513
1514 opt = (u8*) (addrp + 1);
1515
1516 /*
1517 * include target_address option
1518 */
1519
1520 if (ha)
1521 opt = ndisc_fill_addr_option(opt, ND_OPT_TARGET_LL_ADDR, ha,
1522 dev->addr_len, dev->type);
1523
1524 /*
1525 * build redirect option and copy skb over to the new packet.
1526 */
1527
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001528 memset(opt, 0, 8);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001529 *(opt++) = ND_OPT_REDIRECT_HDR;
1530 *(opt++) = (rd_len >> 3);
1531 opt += 6;
1532
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001533 memcpy(opt, ipv6_hdr(skb), rd_len - 8);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001534
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001535 icmph->icmp6_cksum = csum_ipv6_magic(&saddr_buf, &ipv6_hdr(skb)->saddr,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001536 len, IPPROTO_ICMPV6,
1537 csum_partial((u8 *) icmph, len, 0));
1538
1539 buff->dst = dst;
1540 idev = in6_dev_get(dst->dev);
YOSHIFUJI Hideakia11d2062006-11-04 20:11:37 +09001541 IP6_INC_STATS(idev, IPSTATS_MIB_OUTREQUESTS);
Patrick McHardy6e23ae22007-11-19 18:53:30 -08001542 err = NF_HOOK(PF_INET6, NF_INET_LOCAL_OUT, buff, NULL, dst->dev,
1543 dst_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001544 if (!err) {
David L Stevens14878f72007-09-16 16:52:35 -07001545 ICMP6MSGOUT_INC_STATS(idev, NDISC_REDIRECT);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001546 ICMP6_INC_STATS(idev, ICMP6_MIB_OUTMSGS);
1547 }
1548
1549 if (likely(idev != NULL))
1550 in6_dev_put(idev);
1551}
1552
/*
 *	Re-run Neighbour Solicitation processing on @skb, then free it:
 *	unlike the ndisc_rcv() path, this callback owns the buffer.
 */
static void pndisc_redo(struct sk_buff *skb)
{
	ndisc_recv_ns(skb);

	kfree_skb(skb);
}
1558
1559int ndisc_rcv(struct sk_buff *skb)
1560{
1561 struct nd_msg *msg;
1562
1563 if (!pskb_may_pull(skb, skb->len))
1564 return 0;
1565
Arnaldo Carvalho de Melo9c702202007-04-25 18:04:18 -07001566 msg = (struct nd_msg *)skb_transport_header(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001567
Arnaldo Carvalho de Melo9c702202007-04-25 18:04:18 -07001568 __skb_push(skb, skb->data - skb_transport_header(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001569
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001570 if (ipv6_hdr(skb)->hop_limit != 255) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001571 ND_PRINTK2(KERN_WARNING
1572 "ICMPv6 NDISC: invalid hop-limit: %d\n",
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001573 ipv6_hdr(skb)->hop_limit);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001574 return 0;
1575 }
1576
1577 if (msg->icmph.icmp6_code != 0) {
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001578 ND_PRINTK2(KERN_WARNING
Linus Torvalds1da177e2005-04-16 15:20:36 -07001579 "ICMPv6 NDISC: invalid ICMPv6 code: %d\n",
1580 msg->icmph.icmp6_code);
1581 return 0;
1582 }
1583
Patrick McHardya61bbcf2005-08-14 17:24:31 -07001584 memset(NEIGH_CB(skb), 0, sizeof(struct neighbour_cb));
1585
Linus Torvalds1da177e2005-04-16 15:20:36 -07001586 switch (msg->icmph.icmp6_type) {
1587 case NDISC_NEIGHBOUR_SOLICITATION:
1588 ndisc_recv_ns(skb);
1589 break;
1590
1591 case NDISC_NEIGHBOUR_ADVERTISEMENT:
1592 ndisc_recv_na(skb);
1593 break;
1594
1595 case NDISC_ROUTER_SOLICITATION:
1596 ndisc_recv_rs(skb);
1597 break;
1598
1599 case NDISC_ROUTER_ADVERTISEMENT:
1600 ndisc_router_discovery(skb);
1601 break;
1602
1603 case NDISC_REDIRECT:
1604 ndisc_redirect_rcv(skb);
1605 break;
Stephen Hemminger3ff50b72007-04-20 17:09:22 -07001606 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001607
1608 return 0;
1609}
1610
1611static int ndisc_netdev_event(struct notifier_block *this, unsigned long event, void *ptr)
1612{
1613 struct net_device *dev = ptr;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001614 struct net *net = dev_net(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001615
1616 switch (event) {
1617 case NETDEV_CHANGEADDR:
1618 neigh_changeaddr(&nd_tbl, dev);
Daniel Lezcano5b7c9312008-03-03 23:28:58 -08001619 fib6_run_gc(~0UL, net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001620 break;
1621 case NETDEV_DOWN:
1622 neigh_ifdown(&nd_tbl, dev);
Daniel Lezcano5b7c9312008-03-03 23:28:58 -08001623 fib6_run_gc(~0UL, net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001624 break;
1625 default:
1626 break;
1627 }
1628
1629 return NOTIFY_DONE;
1630}
1631
1632static struct notifier_block ndisc_netdev_notifier = {
1633 .notifier_call = ndisc_netdev_event,
1634};
1635
1636#ifdef CONFIG_SYSCTL
1637static void ndisc_warn_deprecated_sysctl(struct ctl_table *ctl,
1638 const char *func, const char *dev_name)
1639{
1640 static char warncomm[TASK_COMM_LEN];
1641 static int warned;
1642 if (strcmp(warncomm, current->comm) && warned < 5) {
1643 strcpy(warncomm, current->comm);
1644 printk(KERN_WARNING
1645 "process `%s' is using deprecated sysctl (%s) "
1646 "net.ipv6.neigh.%s.%s; "
1647 "Use net.ipv6.neigh.%s.%s_ms "
1648 "instead.\n",
1649 warncomm, func,
1650 dev_name, ctl->procname,
1651 dev_name, ctl->procname);
1652 warned++;
1653 }
1654}
1655
1656int ndisc_ifinfo_sysctl_change(struct ctl_table *ctl, int write, struct file * filp, void __user *buffer, size_t *lenp, loff_t *ppos)
1657{
1658 struct net_device *dev = ctl->extra1;
1659 struct inet6_dev *idev;
1660 int ret;
1661
Eric W. Biedermand12af672007-10-18 03:05:25 -07001662 if ((strcmp(ctl->procname, "retrans_time") == 0) ||
1663 (strcmp(ctl->procname, "base_reachable_time") == 0))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001664 ndisc_warn_deprecated_sysctl(ctl, "syscall", dev ? dev->name : "default");
1665
Eric W. Biedermand12af672007-10-18 03:05:25 -07001666 if (strcmp(ctl->procname, "retrans_time") == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001667 ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos);
Eric W. Biedermand12af672007-10-18 03:05:25 -07001668
1669 else if (strcmp(ctl->procname, "base_reachable_time") == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001670 ret = proc_dointvec_jiffies(ctl, write,
1671 filp, buffer, lenp, ppos);
Eric W. Biedermand12af672007-10-18 03:05:25 -07001672
1673 else if ((strcmp(ctl->procname, "retrans_time_ms") == 0) ||
YOSHIFUJI Hideakiad02ac12007-10-29 01:32:23 -07001674 (strcmp(ctl->procname, "base_reachable_time_ms") == 0))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001675 ret = proc_dointvec_ms_jiffies(ctl, write,
1676 filp, buffer, lenp, ppos);
Eric W. Biedermand12af672007-10-18 03:05:25 -07001677 else
Linus Torvalds1da177e2005-04-16 15:20:36 -07001678 ret = -1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001679
1680 if (write && ret == 0 && dev && (idev = in6_dev_get(dev)) != NULL) {
Eric W. Biedermand12af672007-10-18 03:05:25 -07001681 if (ctl->data == &idev->nd_parms->base_reachable_time)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001682 idev->nd_parms->reachable_time = neigh_rand_reach_time(idev->nd_parms->base_reachable_time);
1683 idev->tstamp = jiffies;
1684 inet6_ifinfo_notify(RTM_NEWLINK, idev);
1685 in6_dev_put(idev);
1686 }
1687 return ret;
1688}
1689
1690static int ndisc_ifinfo_sysctl_strategy(ctl_table *ctl, int __user *name,
1691 int nlen, void __user *oldval,
1692 size_t __user *oldlenp,
Alexey Dobriyan1f29bcd2006-12-10 02:19:10 -08001693 void __user *newval, size_t newlen)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001694{
1695 struct net_device *dev = ctl->extra1;
1696 struct inet6_dev *idev;
1697 int ret;
1698
1699 if (ctl->ctl_name == NET_NEIGH_RETRANS_TIME ||
1700 ctl->ctl_name == NET_NEIGH_REACHABLE_TIME)
1701 ndisc_warn_deprecated_sysctl(ctl, "procfs", dev ? dev->name : "default");
1702
1703 switch (ctl->ctl_name) {
1704 case NET_NEIGH_REACHABLE_TIME:
1705 ret = sysctl_jiffies(ctl, name, nlen,
Alexey Dobriyan1f29bcd2006-12-10 02:19:10 -08001706 oldval, oldlenp, newval, newlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001707 break;
1708 case NET_NEIGH_RETRANS_TIME_MS:
1709 case NET_NEIGH_REACHABLE_TIME_MS:
1710 ret = sysctl_ms_jiffies(ctl, name, nlen,
Alexey Dobriyan1f29bcd2006-12-10 02:19:10 -08001711 oldval, oldlenp, newval, newlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001712 break;
1713 default:
1714 ret = 0;
1715 }
1716
1717 if (newval && newlen && ret > 0 &&
1718 dev && (idev = in6_dev_get(dev)) != NULL) {
1719 if (ctl->ctl_name == NET_NEIGH_REACHABLE_TIME ||
1720 ctl->ctl_name == NET_NEIGH_REACHABLE_TIME_MS)
1721 idev->nd_parms->reachable_time = neigh_rand_reach_time(idev->nd_parms->base_reachable_time);
1722 idev->tstamp = jiffies;
1723 inet6_ifinfo_notify(RTM_NEWLINK, idev);
1724 in6_dev_put(idev);
1725 }
1726
1727 return ret;
1728}
1729
1730#endif
1731
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001732static int ndisc_net_init(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001733{
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001734 struct socket *sock;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001735 struct ipv6_pinfo *np;
1736 struct sock *sk;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001737 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001738
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001739 err = sock_create_kern(PF_INET6, SOCK_RAW, IPPROTO_ICMPV6, &sock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001740 if (err < 0) {
1741 ND_PRINTK0(KERN_ERR
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001742 "ICMPv6 NDISC: Failed to initialize the control socket (err %d).\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001743 err);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001744 return err;
1745 }
1746
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001747 net->ipv6.ndisc_sk = sk = sock->sk;
1748 sk_change_net(sk, net);
1749
Linus Torvalds1da177e2005-04-16 15:20:36 -07001750 np = inet6_sk(sk);
1751 sk->sk_allocation = GFP_ATOMIC;
1752 np->hop_limit = 255;
1753 /* Do not loopback ndisc messages */
1754 np->mc_loop = 0;
1755 sk->sk_prot->unhash(sk);
1756
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001757 return 0;
1758}
1759
1760static void ndisc_net_exit(struct net *net)
1761{
1762 sk_release_kernel(net->ipv6.ndisc_sk);
1763}
1764
1765static struct pernet_operations ndisc_net_ops = {
1766 .init = ndisc_net_init,
1767 .exit = ndisc_net_exit,
1768};
1769
1770int __init ndisc_init(void)
1771{
1772 int err;
1773
1774 err = register_pernet_subsys(&ndisc_net_ops);
1775 if (err)
1776 return err;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001777 /*
1778 * Initialize the neighbour table
1779 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001780 neigh_table_init(&nd_tbl);
1781
1782#ifdef CONFIG_SYSCTL
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001783 err = neigh_sysctl_register(NULL, &nd_tbl.parms, NET_IPV6,
1784 NET_IPV6_NEIGH, "ipv6",
1785 &ndisc_ifinfo_sysctl_change,
1786 &ndisc_ifinfo_sysctl_strategy);
1787 if (err)
1788 goto out_unregister_pernet;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001789#endif
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001790 err = register_netdevice_notifier(&ndisc_netdev_notifier);
1791 if (err)
1792 goto out_unregister_sysctl;
1793out:
1794 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001795
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001796out_unregister_sysctl:
1797#ifdef CONFIG_SYSCTL
1798 neigh_sysctl_unregister(&nd_tbl.parms);
1799out_unregister_pernet:
1800#endif
1801 unregister_pernet_subsys(&ndisc_net_ops);
1802 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001803}
1804
1805void ndisc_cleanup(void)
1806{
Dmitry Mishin36f73d02006-11-03 16:08:19 -08001807 unregister_netdevice_notifier(&ndisc_netdev_notifier);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001808#ifdef CONFIG_SYSCTL
1809 neigh_sysctl_unregister(&nd_tbl.parms);
1810#endif
1811 neigh_table_clear(&nd_tbl);
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001812 unregister_pernet_subsys(&ndisc_net_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001813}