[NETNS][IPV6]: inet6_addr - check ipv6 address per namespace
[pandora-kernel.git] / net / ipv6 / ndisc.c
1 /*
2  *      Neighbour Discovery for IPv6
3  *      Linux INET6 implementation
4  *
5  *      Authors:
6  *      Pedro Roque             <roque@di.fc.ul.pt>
7  *      Mike Shaver             <shaver@ingenia.com>
8  *
9  *      This program is free software; you can redistribute it and/or
10  *      modify it under the terms of the GNU General Public License
11  *      as published by the Free Software Foundation; either version
12  *      2 of the License, or (at your option) any later version.
13  */
14
15 /*
16  *      Changes:
17  *
18  *      Pierre Ynard                    :       export userland ND options
19  *                                              through netlink (RDNSS support)
20  *      Lars Fenneberg                  :       fixed MTU setting on receipt
21  *                                              of an RA.
22  *      Janos Farkas                    :       kmalloc failure checks
23  *      Alexey Kuznetsov                :       state machine reworked
24  *                                              and moved to net/core.
25  *      Pekka Savola                    :       RFC2461 validation
26  *      YOSHIFUJI Hideaki @USAGI        :       Verify ND options properly
27  */
28
29 /* Set to 3 to get tracing... */
30 #define ND_DEBUG 1
31
32 #define ND_PRINTK(fmt, args...) do { if (net_ratelimit()) { printk(fmt, ## args); } } while(0)
33 #define ND_NOPRINTK(x...) do { ; } while(0)
34 #define ND_PRINTK0 ND_PRINTK
35 #define ND_PRINTK1 ND_NOPRINTK
36 #define ND_PRINTK2 ND_NOPRINTK
37 #define ND_PRINTK3 ND_NOPRINTK
38 #if ND_DEBUG >= 1
39 #undef ND_PRINTK1
40 #define ND_PRINTK1 ND_PRINTK
41 #endif
42 #if ND_DEBUG >= 2
43 #undef ND_PRINTK2
44 #define ND_PRINTK2 ND_PRINTK
45 #endif
46 #if ND_DEBUG >= 3
47 #undef ND_PRINTK3
48 #define ND_PRINTK3 ND_PRINTK
49 #endif
50
51 #include <linux/module.h>
52 #include <linux/errno.h>
53 #include <linux/types.h>
54 #include <linux/socket.h>
55 #include <linux/sockios.h>
56 #include <linux/sched.h>
57 #include <linux/net.h>
58 #include <linux/in6.h>
59 #include <linux/route.h>
60 #include <linux/init.h>
61 #include <linux/rcupdate.h>
62 #ifdef CONFIG_SYSCTL
63 #include <linux/sysctl.h>
64 #endif
65
66 #include <linux/if_addr.h>
67 #include <linux/if_arp.h>
68 #include <linux/ipv6.h>
69 #include <linux/icmpv6.h>
70 #include <linux/jhash.h>
71
72 #include <net/sock.h>
73 #include <net/snmp.h>
74
75 #include <net/ipv6.h>
76 #include <net/protocol.h>
77 #include <net/ndisc.h>
78 #include <net/ip6_route.h>
79 #include <net/addrconf.h>
80 #include <net/icmp.h>
81
82 #include <net/netlink.h>
83 #include <linux/rtnetlink.h>
84
85 #include <net/flow.h>
86 #include <net/ip6_checksum.h>
87 #include <linux/proc_fs.h>
88
89 #include <linux/netfilter.h>
90 #include <linux/netfilter_ipv6.h>
91
92 static struct socket *ndisc_socket;
93
94 static u32 ndisc_hash(const void *pkey, const struct net_device *dev);
95 static int ndisc_constructor(struct neighbour *neigh);
96 static void ndisc_solicit(struct neighbour *neigh, struct sk_buff *skb);
97 static void ndisc_error_report(struct neighbour *neigh, struct sk_buff *skb);
98 static int pndisc_constructor(struct pneigh_entry *n);
99 static void pndisc_destructor(struct pneigh_entry *n);
100 static void pndisc_redo(struct sk_buff *skb);
101
102 static struct neigh_ops ndisc_generic_ops = {
103         .family =               AF_INET6,
104         .solicit =              ndisc_solicit,
105         .error_report =         ndisc_error_report,
106         .output =               neigh_resolve_output,
107         .connected_output =     neigh_connected_output,
108         .hh_output =            dev_queue_xmit,
109         .queue_xmit =           dev_queue_xmit,
110 };
111
112 static struct neigh_ops ndisc_hh_ops = {
113         .family =               AF_INET6,
114         .solicit =              ndisc_solicit,
115         .error_report =         ndisc_error_report,
116         .output =               neigh_resolve_output,
117         .connected_output =     neigh_resolve_output,
118         .hh_output =            dev_queue_xmit,
119         .queue_xmit =           dev_queue_xmit,
120 };
121
122
123 static struct neigh_ops ndisc_direct_ops = {
124         .family =               AF_INET6,
125         .output =               dev_queue_xmit,
126         .connected_output =     dev_queue_xmit,
127         .hh_output =            dev_queue_xmit,
128         .queue_xmit =           dev_queue_xmit,
129 };
130
131 struct neigh_table nd_tbl = {
132         .family =       AF_INET6,
133         .entry_size =   sizeof(struct neighbour) + sizeof(struct in6_addr),
134         .key_len =      sizeof(struct in6_addr),
135         .hash =         ndisc_hash,
136         .constructor =  ndisc_constructor,
137         .pconstructor = pndisc_constructor,
138         .pdestructor =  pndisc_destructor,
139         .proxy_redo =   pndisc_redo,
140         .id =           "ndisc_cache",
141         .parms = {
142                 .tbl =                  &nd_tbl,
143                 .base_reachable_time =  30 * HZ,
144                 .retrans_time =  1 * HZ,
145                 .gc_staletime = 60 * HZ,
146                 .reachable_time =               30 * HZ,
147                 .delay_probe_time =      5 * HZ,
148                 .queue_len =             3,
149                 .ucast_probes =  3,
150                 .mcast_probes =  3,
151                 .anycast_delay =         1 * HZ,
152                 .proxy_delay =          (8 * HZ) / 10,
153                 .proxy_qlen =           64,
154         },
155         .gc_interval =    30 * HZ,
156         .gc_thresh1 =    128,
157         .gc_thresh2 =    512,
158         .gc_thresh3 =   1024,
159 };
160
161 /* ND options */
162 struct ndisc_options {
163         struct nd_opt_hdr *nd_opt_array[__ND_OPT_ARRAY_MAX];
164 #ifdef CONFIG_IPV6_ROUTE_INFO
165         struct nd_opt_hdr *nd_opts_ri;
166         struct nd_opt_hdr *nd_opts_ri_end;
167 #endif
168         struct nd_opt_hdr *nd_useropts;
169         struct nd_opt_hdr *nd_useropts_end;
170 };
171
172 #define nd_opts_src_lladdr      nd_opt_array[ND_OPT_SOURCE_LL_ADDR]
173 #define nd_opts_tgt_lladdr      nd_opt_array[ND_OPT_TARGET_LL_ADDR]
174 #define nd_opts_pi              nd_opt_array[ND_OPT_PREFIX_INFO]
175 #define nd_opts_pi_end          nd_opt_array[__ND_OPT_PREFIX_INFO_END]
176 #define nd_opts_rh              nd_opt_array[ND_OPT_REDIRECT_HDR]
177 #define nd_opts_mtu             nd_opt_array[ND_OPT_MTU]
178
179 #define NDISC_OPT_SPACE(len) (((len)+2+7)&~7)
180
181 /*
182  * Return the padding between the option length and the start of the
183  * link addr.  Currently only IP-over-InfiniBand needs this, although
184  * if RFC 3831 IPv6-over-Fibre Channel is ever implemented it may
185  * also need a pad of 2.
186  */
187 static int ndisc_addr_option_pad(unsigned short type)
188 {
189         switch (type) {
190         case ARPHRD_INFINIBAND: return 2;
191         default:                return 0;
192         }
193 }
194
195 static inline int ndisc_opt_addr_space(struct net_device *dev)
196 {
197         return NDISC_OPT_SPACE(dev->addr_len + ndisc_addr_option_pad(dev->type));
198 }
199
200 static u8 *ndisc_fill_addr_option(u8 *opt, int type, void *data, int data_len,
201                                   unsigned short addr_type)
202 {
203         int space = NDISC_OPT_SPACE(data_len);
204         int pad   = ndisc_addr_option_pad(addr_type);
205
206         opt[0] = type;
207         opt[1] = space>>3;
208
209         memset(opt + 2, 0, pad);
210         opt   += pad;
211         space -= pad;
212
213         memcpy(opt+2, data, data_len);
214         data_len += 2;
215         opt += data_len;
216         if ((space -= data_len) > 0)
217                 memset(opt, 0, space);
218         return opt + space;
219 }
220
221 static struct nd_opt_hdr *ndisc_next_option(struct nd_opt_hdr *cur,
222                                             struct nd_opt_hdr *end)
223 {
224         int type;
225         if (!cur || !end || cur >= end)
226                 return NULL;
227         type = cur->nd_opt_type;
228         do {
229                 cur = ((void *)cur) + (cur->nd_opt_len << 3);
230         } while(cur < end && cur->nd_opt_type != type);
231         return (cur <= end && cur->nd_opt_type == type ? cur : NULL);
232 }
233
234 static inline int ndisc_is_useropt(struct nd_opt_hdr *opt)
235 {
236         return (opt->nd_opt_type == ND_OPT_RDNSS);
237 }
238
239 static struct nd_opt_hdr *ndisc_next_useropt(struct nd_opt_hdr *cur,
240                                              struct nd_opt_hdr *end)
241 {
242         if (!cur || !end || cur >= end)
243                 return NULL;
244         do {
245                 cur = ((void *)cur) + (cur->nd_opt_len << 3);
246         } while(cur < end && !ndisc_is_useropt(cur));
247         return (cur <= end && ndisc_is_useropt(cur) ? cur : NULL);
248 }
249
250 static struct ndisc_options *ndisc_parse_options(u8 *opt, int opt_len,
251                                                  struct ndisc_options *ndopts)
252 {
253         struct nd_opt_hdr *nd_opt = (struct nd_opt_hdr *)opt;
254
255         if (!nd_opt || opt_len < 0 || !ndopts)
256                 return NULL;
257         memset(ndopts, 0, sizeof(*ndopts));
258         while (opt_len) {
259                 int l;
260                 if (opt_len < sizeof(struct nd_opt_hdr))
261                         return NULL;
262                 l = nd_opt->nd_opt_len << 3;
263                 if (opt_len < l || l == 0)
264                         return NULL;
265                 switch (nd_opt->nd_opt_type) {
266                 case ND_OPT_SOURCE_LL_ADDR:
267                 case ND_OPT_TARGET_LL_ADDR:
268                 case ND_OPT_MTU:
269                 case ND_OPT_REDIRECT_HDR:
270                         if (ndopts->nd_opt_array[nd_opt->nd_opt_type]) {
271                                 ND_PRINTK2(KERN_WARNING
272                                            "%s(): duplicated ND6 option found: type=%d\n",
273                                            __FUNCTION__,
274                                            nd_opt->nd_opt_type);
275                         } else {
276                                 ndopts->nd_opt_array[nd_opt->nd_opt_type] = nd_opt;
277                         }
278                         break;
279                 case ND_OPT_PREFIX_INFO:
280                         ndopts->nd_opts_pi_end = nd_opt;
281                         if (!ndopts->nd_opt_array[nd_opt->nd_opt_type])
282                                 ndopts->nd_opt_array[nd_opt->nd_opt_type] = nd_opt;
283                         break;
284 #ifdef CONFIG_IPV6_ROUTE_INFO
285                 case ND_OPT_ROUTE_INFO:
286                         ndopts->nd_opts_ri_end = nd_opt;
287                         if (!ndopts->nd_opts_ri)
288                                 ndopts->nd_opts_ri = nd_opt;
289                         break;
290 #endif
291                 default:
292                         if (ndisc_is_useropt(nd_opt)) {
293                                 ndopts->nd_useropts_end = nd_opt;
294                                 if (!ndopts->nd_useropts)
295                                         ndopts->nd_useropts = nd_opt;
296                         } else {
297                                 /*
298                                  * Unknown options must be silently ignored,
299                                  * to accommodate future extension to the
300                                  * protocol.
301                                  */
302                                 ND_PRINTK2(KERN_NOTICE
303                                            "%s(): ignored unsupported option; type=%d, len=%d\n",
304                                            __FUNCTION__,
305                                            nd_opt->nd_opt_type, nd_opt->nd_opt_len);
306                         }
307                 }
308                 opt_len -= l;
309                 nd_opt = ((void *)nd_opt) + l;
310         }
311         return ndopts;
312 }
313
314 static inline u8 *ndisc_opt_addr_data(struct nd_opt_hdr *p,
315                                       struct net_device *dev)
316 {
317         u8 *lladdr = (u8 *)(p + 1);
318         int lladdrlen = p->nd_opt_len << 3;
319         int prepad = ndisc_addr_option_pad(dev->type);
320         if (lladdrlen != NDISC_OPT_SPACE(dev->addr_len + prepad))
321                 return NULL;
322         return (lladdr + prepad);
323 }
324
325 int ndisc_mc_map(struct in6_addr *addr, char *buf, struct net_device *dev, int dir)
326 {
327         switch (dev->type) {
328         case ARPHRD_ETHER:
329         case ARPHRD_IEEE802:    /* Not sure. Check it later. --ANK */
330         case ARPHRD_FDDI:
331                 ipv6_eth_mc_map(addr, buf);
332                 return 0;
333         case ARPHRD_IEEE802_TR:
334                 ipv6_tr_mc_map(addr,buf);
335                 return 0;
336         case ARPHRD_ARCNET:
337                 ipv6_arcnet_mc_map(addr, buf);
338                 return 0;
339         case ARPHRD_INFINIBAND:
340                 ipv6_ib_mc_map(addr, dev->broadcast, buf);
341                 return 0;
342         default:
343                 if (dir) {
344                         memcpy(buf, dev->broadcast, dev->addr_len);
345                         return 0;
346                 }
347         }
348         return -EINVAL;
349 }
350
351 EXPORT_SYMBOL(ndisc_mc_map);
352
353 static u32 ndisc_hash(const void *pkey, const struct net_device *dev)
354 {
355         const u32 *p32 = pkey;
356         u32 addr_hash, i;
357
358         addr_hash = 0;
359         for (i = 0; i < (sizeof(struct in6_addr) / sizeof(u32)); i++)
360                 addr_hash ^= *p32++;
361
362         return jhash_2words(addr_hash, dev->ifindex, nd_tbl.hash_rnd);
363 }
364
365 static int ndisc_constructor(struct neighbour *neigh)
366 {
367         struct in6_addr *addr = (struct in6_addr*)&neigh->primary_key;
368         struct net_device *dev = neigh->dev;
369         struct inet6_dev *in6_dev;
370         struct neigh_parms *parms;
371         int is_multicast = ipv6_addr_is_multicast(addr);
372
373         rcu_read_lock();
374         in6_dev = in6_dev_get(dev);
375         if (in6_dev == NULL) {
376                 rcu_read_unlock();
377                 return -EINVAL;
378         }
379
380         parms = in6_dev->nd_parms;
381         __neigh_parms_put(neigh->parms);
382         neigh->parms = neigh_parms_clone(parms);
383         rcu_read_unlock();
384
385         neigh->type = is_multicast ? RTN_MULTICAST : RTN_UNICAST;
386         if (!dev->header_ops) {
387                 neigh->nud_state = NUD_NOARP;
388                 neigh->ops = &ndisc_direct_ops;
389                 neigh->output = neigh->ops->queue_xmit;
390         } else {
391                 if (is_multicast) {
392                         neigh->nud_state = NUD_NOARP;
393                         ndisc_mc_map(addr, neigh->ha, dev, 1);
394                 } else if (dev->flags&(IFF_NOARP|IFF_LOOPBACK)) {
395                         neigh->nud_state = NUD_NOARP;
396                         memcpy(neigh->ha, dev->dev_addr, dev->addr_len);
397                         if (dev->flags&IFF_LOOPBACK)
398                                 neigh->type = RTN_LOCAL;
399                 } else if (dev->flags&IFF_POINTOPOINT) {
400                         neigh->nud_state = NUD_NOARP;
401                         memcpy(neigh->ha, dev->broadcast, dev->addr_len);
402                 }
403                 if (dev->header_ops->cache)
404                         neigh->ops = &ndisc_hh_ops;
405                 else
406                         neigh->ops = &ndisc_generic_ops;
407                 if (neigh->nud_state&NUD_VALID)
408                         neigh->output = neigh->ops->connected_output;
409                 else
410                         neigh->output = neigh->ops->output;
411         }
412         in6_dev_put(in6_dev);
413         return 0;
414 }
415
416 static int pndisc_constructor(struct pneigh_entry *n)
417 {
418         struct in6_addr *addr = (struct in6_addr*)&n->key;
419         struct in6_addr maddr;
420         struct net_device *dev = n->dev;
421
422         if (dev == NULL || __in6_dev_get(dev) == NULL)
423                 return -EINVAL;
424         addrconf_addr_solict_mult(addr, &maddr);
425         ipv6_dev_mc_inc(dev, &maddr);
426         return 0;
427 }
428
429 static void pndisc_destructor(struct pneigh_entry *n)
430 {
431         struct in6_addr *addr = (struct in6_addr*)&n->key;
432         struct in6_addr maddr;
433         struct net_device *dev = n->dev;
434
435         if (dev == NULL || __in6_dev_get(dev) == NULL)
436                 return;
437         addrconf_addr_solict_mult(addr, &maddr);
438         ipv6_dev_mc_dec(dev, &maddr);
439 }
440
441 /*
442  *      Send a Neighbour Advertisement
443  */
444
445 static inline void ndisc_flow_init(struct flowi *fl, u8 type,
446                             struct in6_addr *saddr, struct in6_addr *daddr,
447                             int oif)
448 {
449         memset(fl, 0, sizeof(*fl));
450         ipv6_addr_copy(&fl->fl6_src, saddr);
451         ipv6_addr_copy(&fl->fl6_dst, daddr);
452         fl->proto               = IPPROTO_ICMPV6;
453         fl->fl_icmp_type        = type;
454         fl->fl_icmp_code        = 0;
455         fl->oif                 = oif;
456         security_sk_classify_flow(ndisc_socket->sk, fl);
457 }
458
459 static void __ndisc_send(struct net_device *dev,
460                          struct neighbour *neigh,
461                          struct in6_addr *daddr, struct in6_addr *saddr,
462                          struct icmp6hdr *icmp6h, struct in6_addr *target,
463                          int llinfo)
464 {
465         struct flowi fl;
466         struct dst_entry *dst;
467         struct sock *sk = ndisc_socket->sk;
468         struct sk_buff *skb;
469         struct icmp6hdr *hdr;
470         struct inet6_dev *idev;
471         int len;
472         int err;
473         u8 *opt, type;
474
475         type = icmp6h->icmp6_type;
476
477         ndisc_flow_init(&fl, type, saddr, daddr,
478                         dev->ifindex);
479
480         dst = ndisc_dst_alloc(dev, neigh, daddr, ip6_output);
481         if (!dst)
482                 return;
483
484         err = xfrm_lookup(&dst, &fl, NULL, 0);
485         if (err < 0)
486                 return;
487
488         if (!dev->addr_len)
489                 llinfo = 0;
490
491         len = sizeof(struct icmp6hdr) + (target ? sizeof(*target) : 0);
492         if (llinfo)
493                 len += ndisc_opt_addr_space(dev);
494
495         skb = sock_alloc_send_skb(sk,
496                                   (MAX_HEADER + sizeof(struct ipv6hdr) +
497                                    len + LL_RESERVED_SPACE(dev)),
498                                   1, &err);
499         if (!skb) {
500                 ND_PRINTK0(KERN_ERR
501                            "ICMPv6 ND: %s() failed to allocate an skb.\n",
502                            __FUNCTION__);
503                 dst_release(dst);
504                 return;
505         }
506
507         skb_reserve(skb, LL_RESERVED_SPACE(dev));
508         ip6_nd_hdr(sk, skb, dev, saddr, daddr, IPPROTO_ICMPV6, len);
509
510         skb->transport_header = skb->tail;
511         skb_put(skb, len);
512
513         hdr = (struct icmp6hdr *)skb_transport_header(skb);
514         memcpy(hdr, icmp6h, sizeof(*hdr));
515
516         opt = skb_transport_header(skb) + sizeof(struct icmp6hdr);
517         if (target) {
518                 ipv6_addr_copy((struct in6_addr *)opt, target);
519                 opt += sizeof(*target);
520         }
521
522         if (llinfo)
523                 ndisc_fill_addr_option(opt, llinfo, dev->dev_addr,
524                                        dev->addr_len, dev->type);
525
526         hdr->icmp6_cksum = csum_ipv6_magic(saddr, daddr, len,
527                                            IPPROTO_ICMPV6,
528                                            csum_partial((__u8 *) hdr,
529                                                         len, 0));
530
531         skb->dst = dst;
532
533         idev = in6_dev_get(dst->dev);
534         IP6_INC_STATS(idev, IPSTATS_MIB_OUTREQUESTS);
535
536         err = NF_HOOK(PF_INET6, NF_INET_LOCAL_OUT, skb, NULL, dst->dev,
537                       dst_output);
538         if (!err) {
539                 ICMP6MSGOUT_INC_STATS(idev, type);
540                 ICMP6_INC_STATS(idev, ICMP6_MIB_OUTMSGS);
541         }
542
543         if (likely(idev != NULL))
544                 in6_dev_put(idev);
545 }
546
547 static void ndisc_send_na(struct net_device *dev, struct neighbour *neigh,
548                    struct in6_addr *daddr, struct in6_addr *solicited_addr,
549                    int router, int solicited, int override, int inc_opt)
550 {
551         struct in6_addr tmpaddr;
552         struct inet6_ifaddr *ifp;
553         struct in6_addr *src_addr;
554         struct icmp6hdr icmp6h = {
555                 .icmp6_type = NDISC_NEIGHBOUR_ADVERTISEMENT,
556         };
557
558         /* for anycast or proxy, solicited_addr != src_addr */
559         ifp = ipv6_get_ifaddr(solicited_addr, dev, 1);
560         if (ifp) {
561                 src_addr = solicited_addr;
562                 if (ifp->flags & IFA_F_OPTIMISTIC)
563                         override = 0;
564                 in6_ifa_put(ifp);
565         } else {
566                 if (ipv6_dev_get_saddr(dev, daddr, &tmpaddr))
567                         return;
568                 src_addr = &tmpaddr;
569         }
570
571         icmp6h.icmp6_router = router;
572         icmp6h.icmp6_solicited = solicited;
573         icmp6h.icmp6_override = override;
574
575         __ndisc_send(dev, neigh, daddr, src_addr,
576                      &icmp6h, solicited_addr,
577                      inc_opt ? ND_OPT_TARGET_LL_ADDR : 0);
578 }
579
580 void ndisc_send_ns(struct net_device *dev, struct neighbour *neigh,
581                    struct in6_addr *solicit,
582                    struct in6_addr *daddr, struct in6_addr *saddr)
583 {
584         struct in6_addr addr_buf;
585         struct icmp6hdr icmp6h = {
586                 .icmp6_type = NDISC_NEIGHBOUR_SOLICITATION,
587         };
588
589         if (saddr == NULL) {
590                 if (ipv6_get_lladdr(dev, &addr_buf,
591                                    (IFA_F_TENTATIVE|IFA_F_OPTIMISTIC)))
592                         return;
593                 saddr = &addr_buf;
594         }
595
596         __ndisc_send(dev, neigh, daddr, saddr,
597                      &icmp6h, solicit,
598                      !ipv6_addr_any(saddr) ? ND_OPT_SOURCE_LL_ADDR : 0);
599 }
600
601 void ndisc_send_rs(struct net_device *dev, struct in6_addr *saddr,
602                    struct in6_addr *daddr)
603 {
604         struct icmp6hdr icmp6h = {
605                 .icmp6_type = NDISC_ROUTER_SOLICITATION,
606         };
607         int send_sllao = dev->addr_len;
608
609 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD
610         /*
611          * According to section 2.2 of RFC 4429, we must not
612          * send router solicitations with a sllao from
613          * optimistic addresses, but we may send the solicitation
614          * if we don't include the sllao.  So here we check
615          * if our address is optimistic, and if so, we
616          * suppress the inclusion of the sllao.
617          */
618         if (send_sllao) {
619                 struct inet6_ifaddr *ifp = ipv6_get_ifaddr(saddr, dev, 1);
620                 if (ifp) {
621                         if (ifp->flags & IFA_F_OPTIMISTIC)  {
622                                 send_sllao = 0;
623                         }
624                         in6_ifa_put(ifp);
625                 } else {
626                         send_sllao = 0;
627                 }
628         }
629 #endif
630         __ndisc_send(dev, NULL, daddr, saddr,
631                      &icmp6h, NULL,
632                      send_sllao ? ND_OPT_SOURCE_LL_ADDR : 0);
633 }
634
635
636 static void ndisc_error_report(struct neighbour *neigh, struct sk_buff *skb)
637 {
638         /*
639          *      "The sender MUST return an ICMP
640          *       destination unreachable"
641          */
642         dst_link_failure(skb);
643         kfree_skb(skb);
644 }
645
646 /* Called with locked neigh: either read or both */
647
648 static void ndisc_solicit(struct neighbour *neigh, struct sk_buff *skb)
649 {
650         struct in6_addr *saddr = NULL;
651         struct in6_addr mcaddr;
652         struct net_device *dev = neigh->dev;
653         struct in6_addr *target = (struct in6_addr *)&neigh->primary_key;
654         int probes = atomic_read(&neigh->probes);
655
656         if (skb && ipv6_chk_addr(&init_net, &ipv6_hdr(skb)->saddr, dev, 1))
657                 saddr = &ipv6_hdr(skb)->saddr;
658
659         if ((probes -= neigh->parms->ucast_probes) < 0) {
660                 if (!(neigh->nud_state & NUD_VALID)) {
661                         ND_PRINTK1(KERN_DEBUG
662                                    "%s(): trying to ucast probe in NUD_INVALID: "
663                                    NIP6_FMT "\n",
664                                    __FUNCTION__,
665                                    NIP6(*target));
666                 }
667                 ndisc_send_ns(dev, neigh, target, target, saddr);
668         } else if ((probes -= neigh->parms->app_probes) < 0) {
669 #ifdef CONFIG_ARPD
670                 neigh_app_ns(neigh);
671 #endif
672         } else {
673                 addrconf_addr_solict_mult(target, &mcaddr);
674                 ndisc_send_ns(dev, NULL, target, &mcaddr, saddr);
675         }
676 }
677
678 static void ndisc_recv_ns(struct sk_buff *skb)
679 {
680         struct nd_msg *msg = (struct nd_msg *)skb_transport_header(skb);
681         struct in6_addr *saddr = &ipv6_hdr(skb)->saddr;
682         struct in6_addr *daddr = &ipv6_hdr(skb)->daddr;
683         u8 *lladdr = NULL;
684         u32 ndoptlen = skb->tail - (skb->transport_header +
685                                     offsetof(struct nd_msg, opt));
686         struct ndisc_options ndopts;
687         struct net_device *dev = skb->dev;
688         struct inet6_ifaddr *ifp;
689         struct inet6_dev *idev = NULL;
690         struct neighbour *neigh;
691         struct pneigh_entry *pneigh = NULL;
692         int dad = ipv6_addr_any(saddr);
693         int inc;
694         int is_router;
695
696         if (ipv6_addr_is_multicast(&msg->target)) {
697                 ND_PRINTK2(KERN_WARNING
698                            "ICMPv6 NS: multicast target address");
699                 return;
700         }
701
702         /*
703          * RFC2461 7.1.1:
704          * DAD has to be destined for solicited node multicast address.
705          */
706         if (dad &&
707             !(daddr->s6_addr32[0] == htonl(0xff020000) &&
708               daddr->s6_addr32[1] == htonl(0x00000000) &&
709               daddr->s6_addr32[2] == htonl(0x00000001) &&
710               daddr->s6_addr [12] == 0xff )) {
711                 ND_PRINTK2(KERN_WARNING
712                            "ICMPv6 NS: bad DAD packet (wrong destination)\n");
713                 return;
714         }
715
716         if (!ndisc_parse_options(msg->opt, ndoptlen, &ndopts)) {
717                 ND_PRINTK2(KERN_WARNING
718                            "ICMPv6 NS: invalid ND options\n");
719                 return;
720         }
721
722         if (ndopts.nd_opts_src_lladdr) {
723                 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_src_lladdr, dev);
724                 if (!lladdr) {
725                         ND_PRINTK2(KERN_WARNING
726                                    "ICMPv6 NS: invalid link-layer address length\n");
727                         return;
728                 }
729
730                 /* RFC2461 7.1.1:
731                  *      If the IP source address is the unspecified address,
732                  *      there MUST NOT be source link-layer address option
733                  *      in the message.
734                  */
735                 if (dad) {
736                         ND_PRINTK2(KERN_WARNING
737                                    "ICMPv6 NS: bad DAD packet (link-layer address option)\n");
738                         return;
739                 }
740         }
741
742         inc = ipv6_addr_is_multicast(daddr);
743
744         if ((ifp = ipv6_get_ifaddr(&msg->target, dev, 1)) != NULL) {
745
746                 if (ifp->flags & (IFA_F_TENTATIVE|IFA_F_OPTIMISTIC)) {
747                         if (dad) {
748                                 if (dev->type == ARPHRD_IEEE802_TR) {
749                                         const unsigned char *sadr;
750                                         sadr = skb_mac_header(skb);
751                                         if (((sadr[8] ^ dev->dev_addr[0]) & 0x7f) == 0 &&
752                                             sadr[9] == dev->dev_addr[1] &&
753                                             sadr[10] == dev->dev_addr[2] &&
754                                             sadr[11] == dev->dev_addr[3] &&
755                                             sadr[12] == dev->dev_addr[4] &&
756                                             sadr[13] == dev->dev_addr[5]) {
757                                                 /* looped-back to us */
758                                                 goto out;
759                                         }
760                                 }
761
762                                 /*
763                                  * We are colliding with another node
764                                  * who is doing DAD
765                                  * so fail our DAD process
766                                  */
767                                 addrconf_dad_failure(ifp);
768                                 return;
769                         } else {
770                                 /*
771                                  * This is not a dad solicitation.
772                                  * If we are an optimistic node,
773                                  * we should respond.
774                                  * Otherwise, we should ignore it.
775                                  */
776                                 if (!(ifp->flags & IFA_F_OPTIMISTIC))
777                                         goto out;
778                         }
779                 }
780
781                 idev = ifp->idev;
782         } else {
783                 idev = in6_dev_get(dev);
784                 if (!idev) {
785                         /* XXX: count this drop? */
786                         return;
787                 }
788
789                 if (ipv6_chk_acast_addr(dev, &msg->target) ||
790                     (idev->cnf.forwarding &&
791                      (ipv6_devconf.proxy_ndp || idev->cnf.proxy_ndp) &&
792                      (pneigh = pneigh_lookup(&nd_tbl, &init_net,
793                                              &msg->target, dev, 0)) != NULL)) {
794                         if (!(NEIGH_CB(skb)->flags & LOCALLY_ENQUEUED) &&
795                             skb->pkt_type != PACKET_HOST &&
796                             inc != 0 &&
797                             idev->nd_parms->proxy_delay != 0) {
798                                 /*
799                                  * for anycast or proxy,
800                                  * sender should delay its response
801                                  * by a random time between 0 and
802                                  * MAX_ANYCAST_DELAY_TIME seconds.
803                                  * (RFC2461) -- yoshfuji
804                                  */
805                                 struct sk_buff *n = skb_clone(skb, GFP_ATOMIC);
806                                 if (n)
807                                         pneigh_enqueue(&nd_tbl, idev->nd_parms, n);
808                                 goto out;
809                         }
810                 } else
811                         goto out;
812         }
813
814         is_router = !!(pneigh ? pneigh->flags & NTF_ROUTER : idev->cnf.forwarding);
815
816         if (dad) {
817                 struct in6_addr maddr;
818
819                 ipv6_addr_all_nodes(&maddr);
820                 ndisc_send_na(dev, NULL, &maddr, &msg->target,
821                               is_router, 0, (ifp != NULL), 1);
822                 goto out;
823         }
824
825         if (inc)
826                 NEIGH_CACHE_STAT_INC(&nd_tbl, rcv_probes_mcast);
827         else
828                 NEIGH_CACHE_STAT_INC(&nd_tbl, rcv_probes_ucast);
829
830         /*
831          *      update / create cache entry
832          *      for the source address
833          */
834         neigh = __neigh_lookup(&nd_tbl, saddr, dev,
835                                !inc || lladdr || !dev->addr_len);
836         if (neigh)
837                 neigh_update(neigh, lladdr, NUD_STALE,
838                              NEIGH_UPDATE_F_WEAK_OVERRIDE|
839                              NEIGH_UPDATE_F_OVERRIDE);
840         if (neigh || !dev->header_ops) {
841                 ndisc_send_na(dev, neigh, saddr, &msg->target,
842                               is_router,
843                               1, (ifp != NULL && inc), inc);
844                 if (neigh)
845                         neigh_release(neigh);
846         }
847
848 out:
849         if (ifp)
850                 in6_ifa_put(ifp);
851         else
852                 in6_dev_put(idev);
853
854         return;
855 }
856
857 static void ndisc_recv_na(struct sk_buff *skb)
858 {
859         struct nd_msg *msg = (struct nd_msg *)skb_transport_header(skb);
860         struct in6_addr *saddr = &ipv6_hdr(skb)->saddr;
861         struct in6_addr *daddr = &ipv6_hdr(skb)->daddr;
862         u8 *lladdr = NULL;
863         u32 ndoptlen = skb->tail - (skb->transport_header +
864                                     offsetof(struct nd_msg, opt));
865         struct ndisc_options ndopts;
866         struct net_device *dev = skb->dev;
867         struct inet6_ifaddr *ifp;
868         struct neighbour *neigh;
869
870         if (skb->len < sizeof(struct nd_msg)) {
871                 ND_PRINTK2(KERN_WARNING
872                            "ICMPv6 NA: packet too short\n");
873                 return;
874         }
875
876         if (ipv6_addr_is_multicast(&msg->target)) {
877                 ND_PRINTK2(KERN_WARNING
878                            "ICMPv6 NA: target address is multicast.\n");
879                 return;
880         }
881
882         if (ipv6_addr_is_multicast(daddr) &&
883             msg->icmph.icmp6_solicited) {
884                 ND_PRINTK2(KERN_WARNING
885                            "ICMPv6 NA: solicited NA is multicasted.\n");
886                 return;
887         }
888
889         if (!ndisc_parse_options(msg->opt, ndoptlen, &ndopts)) {
890                 ND_PRINTK2(KERN_WARNING
891                            "ICMPv6 NS: invalid ND option\n");
892                 return;
893         }
894         if (ndopts.nd_opts_tgt_lladdr) {
895                 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_tgt_lladdr, dev);
896                 if (!lladdr) {
897                         ND_PRINTK2(KERN_WARNING
898                                    "ICMPv6 NA: invalid link-layer address length\n");
899                         return;
900                 }
901         }
902         if ((ifp = ipv6_get_ifaddr(&msg->target, dev, 1))) {
903                 if (ifp->flags & IFA_F_TENTATIVE) {
904                         addrconf_dad_failure(ifp);
905                         return;
906                 }
907                 /* What should we make now? The advertisement
908                    is invalid, but ndisc specs say nothing
909                    about it. It could be misconfiguration, or
910                    an smart proxy agent tries to help us :-)
911                  */
912                 ND_PRINTK1(KERN_WARNING
913                            "ICMPv6 NA: someone advertises our address on %s!\n",
914                            ifp->idev->dev->name);
915                 in6_ifa_put(ifp);
916                 return;
917         }
918         neigh = neigh_lookup(&nd_tbl, &msg->target, dev);
919
920         if (neigh) {
921                 u8 old_flags = neigh->flags;
922
923                 if (neigh->nud_state & NUD_FAILED)
924                         goto out;
925
926                 /*
927                  * Don't update the neighbor cache entry on a proxy NA from
928                  * ourselves because either the proxied node is off link or it
929                  * has already sent a NA to us.
930                  */
931                 if (lladdr && !memcmp(lladdr, dev->dev_addr, dev->addr_len) &&
932                     ipv6_devconf.forwarding && ipv6_devconf.proxy_ndp &&
933                     pneigh_lookup(&nd_tbl, &init_net, &msg->target, dev, 0)) {
934                         /* XXX: idev->cnf.prixy_ndp */
935                         goto out;
936                 }
937
938                 neigh_update(neigh, lladdr,
939                              msg->icmph.icmp6_solicited ? NUD_REACHABLE : NUD_STALE,
940                              NEIGH_UPDATE_F_WEAK_OVERRIDE|
941                              (msg->icmph.icmp6_override ? NEIGH_UPDATE_F_OVERRIDE : 0)|
942                              NEIGH_UPDATE_F_OVERRIDE_ISROUTER|
943                              (msg->icmph.icmp6_router ? NEIGH_UPDATE_F_ISROUTER : 0));
944
945                 if ((old_flags & ~neigh->flags) & NTF_ROUTER) {
946                         /*
947                          * Change: router to host
948                          */
949                         struct rt6_info *rt;
950                         rt = rt6_get_dflt_router(saddr, dev);
951                         if (rt)
952                                 ip6_del_rt(rt);
953                 }
954
955 out:
956                 neigh_release(neigh);
957         }
958 }
959
960 static void ndisc_recv_rs(struct sk_buff *skb)
961 {
962         struct rs_msg *rs_msg = (struct rs_msg *)skb_transport_header(skb);
963         unsigned long ndoptlen = skb->len - sizeof(*rs_msg);
964         struct neighbour *neigh;
965         struct inet6_dev *idev;
966         struct in6_addr *saddr = &ipv6_hdr(skb)->saddr;
967         struct ndisc_options ndopts;
968         u8 *lladdr = NULL;
969
970         if (skb->len < sizeof(*rs_msg))
971                 return;
972
973         idev = in6_dev_get(skb->dev);
974         if (!idev) {
975                 if (net_ratelimit())
976                         ND_PRINTK1("ICMP6 RS: can't find in6 device\n");
977                 return;
978         }
979
980         /* Don't accept RS if we're not in router mode */
981         if (!idev->cnf.forwarding)
982                 goto out;
983
984         /*
985          * Don't update NCE if src = ::;
986          * this implies that the source node has no ip address assigned yet.
987          */
988         if (ipv6_addr_any(saddr))
989                 goto out;
990
991         /* Parse ND options */
992         if (!ndisc_parse_options(rs_msg->opt, ndoptlen, &ndopts)) {
993                 if (net_ratelimit())
994                         ND_PRINTK2("ICMP6 NS: invalid ND option, ignored\n");
995                 goto out;
996         }
997
998         if (ndopts.nd_opts_src_lladdr) {
999                 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_src_lladdr,
1000                                              skb->dev);
1001                 if (!lladdr)
1002                         goto out;
1003         }
1004
1005         neigh = __neigh_lookup(&nd_tbl, saddr, skb->dev, 1);
1006         if (neigh) {
1007                 neigh_update(neigh, lladdr, NUD_STALE,
1008                              NEIGH_UPDATE_F_WEAK_OVERRIDE|
1009                              NEIGH_UPDATE_F_OVERRIDE|
1010                              NEIGH_UPDATE_F_OVERRIDE_ISROUTER);
1011                 neigh_release(neigh);
1012         }
1013 out:
1014         in6_dev_put(idev);
1015 }
1016
1017 static void ndisc_ra_useropt(struct sk_buff *ra, struct nd_opt_hdr *opt)
1018 {
1019         struct icmp6hdr *icmp6h = (struct icmp6hdr *)skb_transport_header(ra);
1020         struct sk_buff *skb;
1021         struct nlmsghdr *nlh;
1022         struct nduseroptmsg *ndmsg;
1023         int err;
1024         int base_size = NLMSG_ALIGN(sizeof(struct nduseroptmsg)
1025                                     + (opt->nd_opt_len << 3));
1026         size_t msg_size = base_size + nla_total_size(sizeof(struct in6_addr));
1027
1028         skb = nlmsg_new(msg_size, GFP_ATOMIC);
1029         if (skb == NULL) {
1030                 err = -ENOBUFS;
1031                 goto errout;
1032         }
1033
1034         nlh = nlmsg_put(skb, 0, 0, RTM_NEWNDUSEROPT, base_size, 0);
1035         if (nlh == NULL) {
1036                 goto nla_put_failure;
1037         }
1038
1039         ndmsg = nlmsg_data(nlh);
1040         ndmsg->nduseropt_family = AF_INET6;
1041         ndmsg->nduseropt_ifindex = ra->dev->ifindex;
1042         ndmsg->nduseropt_icmp_type = icmp6h->icmp6_type;
1043         ndmsg->nduseropt_icmp_code = icmp6h->icmp6_code;
1044         ndmsg->nduseropt_opts_len = opt->nd_opt_len << 3;
1045
1046         memcpy(ndmsg + 1, opt, opt->nd_opt_len << 3);
1047
1048         NLA_PUT(skb, NDUSEROPT_SRCADDR, sizeof(struct in6_addr),
1049                 &ipv6_hdr(ra)->saddr);
1050         nlmsg_end(skb, nlh);
1051
1052         err = rtnl_notify(skb, &init_net, 0, RTNLGRP_ND_USEROPT, NULL,
1053                           GFP_ATOMIC);
1054         if (err < 0)
1055                 goto errout;
1056
1057         return;
1058
1059 nla_put_failure:
1060         nlmsg_free(skb);
1061         err = -EMSGSIZE;
1062 errout:
1063         rtnl_set_sk_err(&init_net, RTNLGRP_ND_USEROPT, err);
1064 }
1065
1066 static void ndisc_router_discovery(struct sk_buff *skb)
1067 {
1068         struct ra_msg *ra_msg = (struct ra_msg *)skb_transport_header(skb);
1069         struct neighbour *neigh = NULL;
1070         struct inet6_dev *in6_dev;
1071         struct rt6_info *rt = NULL;
1072         int lifetime;
1073         struct ndisc_options ndopts;
1074         int optlen;
1075         unsigned int pref = 0;
1076
1077         __u8 * opt = (__u8 *)(ra_msg + 1);
1078
1079         optlen = (skb->tail - skb->transport_header) - sizeof(struct ra_msg);
1080
1081         if (!(ipv6_addr_type(&ipv6_hdr(skb)->saddr) & IPV6_ADDR_LINKLOCAL)) {
1082                 ND_PRINTK2(KERN_WARNING
1083                            "ICMPv6 RA: source address is not link-local.\n");
1084                 return;
1085         }
1086         if (optlen < 0) {
1087                 ND_PRINTK2(KERN_WARNING
1088                            "ICMPv6 RA: packet too short\n");
1089                 return;
1090         }
1091
1092         /*
1093          *      set the RA_RECV flag in the interface
1094          */
1095
1096         in6_dev = in6_dev_get(skb->dev);
1097         if (in6_dev == NULL) {
1098                 ND_PRINTK0(KERN_ERR
1099                            "ICMPv6 RA: can't find inet6 device for %s.\n",
1100                            skb->dev->name);
1101                 return;
1102         }
1103         if (in6_dev->cnf.forwarding || !in6_dev->cnf.accept_ra) {
1104                 in6_dev_put(in6_dev);
1105                 return;
1106         }
1107
1108         if (!ndisc_parse_options(opt, optlen, &ndopts)) {
1109                 in6_dev_put(in6_dev);
1110                 ND_PRINTK2(KERN_WARNING
1111                            "ICMP6 RA: invalid ND options\n");
1112                 return;
1113         }
1114
1115         if (in6_dev->if_flags & IF_RS_SENT) {
1116                 /*
1117                  *      flag that an RA was received after an RS was sent
1118                  *      out on this interface.
1119                  */
1120                 in6_dev->if_flags |= IF_RA_RCVD;
1121         }
1122
1123         /*
1124          * Remember the managed/otherconf flags from most recently
1125          * received RA message (RFC 2462) -- yoshfuji
1126          */
1127         in6_dev->if_flags = (in6_dev->if_flags & ~(IF_RA_MANAGED |
1128                                 IF_RA_OTHERCONF)) |
1129                                 (ra_msg->icmph.icmp6_addrconf_managed ?
1130                                         IF_RA_MANAGED : 0) |
1131                                 (ra_msg->icmph.icmp6_addrconf_other ?
1132                                         IF_RA_OTHERCONF : 0);
1133
1134         if (!in6_dev->cnf.accept_ra_defrtr)
1135                 goto skip_defrtr;
1136
1137         lifetime = ntohs(ra_msg->icmph.icmp6_rt_lifetime);
1138
1139 #ifdef CONFIG_IPV6_ROUTER_PREF
1140         pref = ra_msg->icmph.icmp6_router_pref;
1141         /* 10b is handled as if it were 00b (medium) */
1142         if (pref == ICMPV6_ROUTER_PREF_INVALID ||
1143             !in6_dev->cnf.accept_ra_rtr_pref)
1144                 pref = ICMPV6_ROUTER_PREF_MEDIUM;
1145 #endif
1146
1147         rt = rt6_get_dflt_router(&ipv6_hdr(skb)->saddr, skb->dev);
1148
1149         if (rt)
1150                 neigh = rt->rt6i_nexthop;
1151
1152         if (rt && lifetime == 0) {
1153                 neigh_clone(neigh);
1154                 ip6_del_rt(rt);
1155                 rt = NULL;
1156         }
1157
1158         if (rt == NULL && lifetime) {
1159                 ND_PRINTK3(KERN_DEBUG
1160                            "ICMPv6 RA: adding default router.\n");
1161
1162                 rt = rt6_add_dflt_router(&ipv6_hdr(skb)->saddr, skb->dev, pref);
1163                 if (rt == NULL) {
1164                         ND_PRINTK0(KERN_ERR
1165                                    "ICMPv6 RA: %s() failed to add default route.\n",
1166                                    __FUNCTION__);
1167                         in6_dev_put(in6_dev);
1168                         return;
1169                 }
1170
1171                 neigh = rt->rt6i_nexthop;
1172                 if (neigh == NULL) {
1173                         ND_PRINTK0(KERN_ERR
1174                                    "ICMPv6 RA: %s() got default router without neighbour.\n",
1175                                    __FUNCTION__);
1176                         dst_release(&rt->u.dst);
1177                         in6_dev_put(in6_dev);
1178                         return;
1179                 }
1180                 neigh->flags |= NTF_ROUTER;
1181         } else if (rt) {
1182                 rt->rt6i_flags |= (rt->rt6i_flags & ~RTF_PREF_MASK) | RTF_PREF(pref);
1183         }
1184
1185         if (rt)
1186                 rt->rt6i_expires = jiffies + (HZ * lifetime);
1187
1188         if (ra_msg->icmph.icmp6_hop_limit) {
1189                 in6_dev->cnf.hop_limit = ra_msg->icmph.icmp6_hop_limit;
1190                 if (rt)
1191                         rt->u.dst.metrics[RTAX_HOPLIMIT-1] = ra_msg->icmph.icmp6_hop_limit;
1192         }
1193
1194 skip_defrtr:
1195
1196         /*
1197          *      Update Reachable Time and Retrans Timer
1198          */
1199
1200         if (in6_dev->nd_parms) {
1201                 unsigned long rtime = ntohl(ra_msg->retrans_timer);
1202
1203                 if (rtime && rtime/1000 < MAX_SCHEDULE_TIMEOUT/HZ) {
1204                         rtime = (rtime*HZ)/1000;
1205                         if (rtime < HZ/10)
1206                                 rtime = HZ/10;
1207                         in6_dev->nd_parms->retrans_time = rtime;
1208                         in6_dev->tstamp = jiffies;
1209                         inet6_ifinfo_notify(RTM_NEWLINK, in6_dev);
1210                 }
1211
1212                 rtime = ntohl(ra_msg->reachable_time);
1213                 if (rtime && rtime/1000 < MAX_SCHEDULE_TIMEOUT/(3*HZ)) {
1214                         rtime = (rtime*HZ)/1000;
1215
1216                         if (rtime < HZ/10)
1217                                 rtime = HZ/10;
1218
1219                         if (rtime != in6_dev->nd_parms->base_reachable_time) {
1220                                 in6_dev->nd_parms->base_reachable_time = rtime;
1221                                 in6_dev->nd_parms->gc_staletime = 3 * rtime;
1222                                 in6_dev->nd_parms->reachable_time = neigh_rand_reach_time(rtime);
1223                                 in6_dev->tstamp = jiffies;
1224                                 inet6_ifinfo_notify(RTM_NEWLINK, in6_dev);
1225                         }
1226                 }
1227         }
1228
1229         /*
1230          *      Process options.
1231          */
1232
1233         if (!neigh)
1234                 neigh = __neigh_lookup(&nd_tbl, &ipv6_hdr(skb)->saddr,
1235                                        skb->dev, 1);
1236         if (neigh) {
1237                 u8 *lladdr = NULL;
1238                 if (ndopts.nd_opts_src_lladdr) {
1239                         lladdr = ndisc_opt_addr_data(ndopts.nd_opts_src_lladdr,
1240                                                      skb->dev);
1241                         if (!lladdr) {
1242                                 ND_PRINTK2(KERN_WARNING
1243                                            "ICMPv6 RA: invalid link-layer address length\n");
1244                                 goto out;
1245                         }
1246                 }
1247                 neigh_update(neigh, lladdr, NUD_STALE,
1248                              NEIGH_UPDATE_F_WEAK_OVERRIDE|
1249                              NEIGH_UPDATE_F_OVERRIDE|
1250                              NEIGH_UPDATE_F_OVERRIDE_ISROUTER|
1251                              NEIGH_UPDATE_F_ISROUTER);
1252         }
1253
1254 #ifdef CONFIG_IPV6_ROUTE_INFO
1255         if (in6_dev->cnf.accept_ra_rtr_pref && ndopts.nd_opts_ri) {
1256                 struct nd_opt_hdr *p;
1257                 for (p = ndopts.nd_opts_ri;
1258                      p;
1259                      p = ndisc_next_option(p, ndopts.nd_opts_ri_end)) {
1260                         if (((struct route_info *)p)->prefix_len > in6_dev->cnf.accept_ra_rt_info_max_plen)
1261                                 continue;
1262                         rt6_route_rcv(skb->dev, (u8*)p, (p->nd_opt_len) << 3,
1263                                       &ipv6_hdr(skb)->saddr);
1264                 }
1265         }
1266 #endif
1267
1268         if (in6_dev->cnf.accept_ra_pinfo && ndopts.nd_opts_pi) {
1269                 struct nd_opt_hdr *p;
1270                 for (p = ndopts.nd_opts_pi;
1271                      p;
1272                      p = ndisc_next_option(p, ndopts.nd_opts_pi_end)) {
1273                         addrconf_prefix_rcv(skb->dev, (u8*)p, (p->nd_opt_len) << 3);
1274                 }
1275         }
1276
1277         if (ndopts.nd_opts_mtu) {
1278                 __be32 n;
1279                 u32 mtu;
1280
1281                 memcpy(&n, ((u8*)(ndopts.nd_opts_mtu+1))+2, sizeof(mtu));
1282                 mtu = ntohl(n);
1283
1284                 if (mtu < IPV6_MIN_MTU || mtu > skb->dev->mtu) {
1285                         ND_PRINTK2(KERN_WARNING
1286                                    "ICMPv6 RA: invalid mtu: %d\n",
1287                                    mtu);
1288                 } else if (in6_dev->cnf.mtu6 != mtu) {
1289                         in6_dev->cnf.mtu6 = mtu;
1290
1291                         if (rt)
1292                                 rt->u.dst.metrics[RTAX_MTU-1] = mtu;
1293
1294                         rt6_mtu_change(skb->dev, mtu);
1295                 }
1296         }
1297
1298         if (ndopts.nd_useropts) {
1299                 struct nd_opt_hdr *opt;
1300                 for (opt = ndopts.nd_useropts;
1301                      opt;
1302                      opt = ndisc_next_useropt(opt, ndopts.nd_useropts_end)) {
1303                                 ndisc_ra_useropt(skb, opt);
1304                 }
1305         }
1306
1307         if (ndopts.nd_opts_tgt_lladdr || ndopts.nd_opts_rh) {
1308                 ND_PRINTK2(KERN_WARNING
1309                            "ICMPv6 RA: invalid RA options");
1310         }
1311 out:
1312         if (rt)
1313                 dst_release(&rt->u.dst);
1314         else if (neigh)
1315                 neigh_release(neigh);
1316         in6_dev_put(in6_dev);
1317 }
1318
1319 static void ndisc_redirect_rcv(struct sk_buff *skb)
1320 {
1321         struct inet6_dev *in6_dev;
1322         struct icmp6hdr *icmph;
1323         struct in6_addr *dest;
1324         struct in6_addr *target;        /* new first hop to destination */
1325         struct neighbour *neigh;
1326         int on_link = 0;
1327         struct ndisc_options ndopts;
1328         int optlen;
1329         u8 *lladdr = NULL;
1330
1331         if (!(ipv6_addr_type(&ipv6_hdr(skb)->saddr) & IPV6_ADDR_LINKLOCAL)) {
1332                 ND_PRINTK2(KERN_WARNING
1333                            "ICMPv6 Redirect: source address is not link-local.\n");
1334                 return;
1335         }
1336
1337         optlen = skb->tail - skb->transport_header;
1338         optlen -= sizeof(struct icmp6hdr) + 2 * sizeof(struct in6_addr);
1339
1340         if (optlen < 0) {
1341                 ND_PRINTK2(KERN_WARNING
1342                            "ICMPv6 Redirect: packet too short\n");
1343                 return;
1344         }
1345
1346         icmph = icmp6_hdr(skb);
1347         target = (struct in6_addr *) (icmph + 1);
1348         dest = target + 1;
1349
1350         if (ipv6_addr_is_multicast(dest)) {
1351                 ND_PRINTK2(KERN_WARNING
1352                            "ICMPv6 Redirect: destination address is multicast.\n");
1353                 return;
1354         }
1355
1356         if (ipv6_addr_equal(dest, target)) {
1357                 on_link = 1;
1358         } else if (ipv6_addr_type(target) !=
1359                    (IPV6_ADDR_UNICAST|IPV6_ADDR_LINKLOCAL)) {
1360                 ND_PRINTK2(KERN_WARNING
1361                            "ICMPv6 Redirect: target address is not link-local unicast.\n");
1362                 return;
1363         }
1364
1365         in6_dev = in6_dev_get(skb->dev);
1366         if (!in6_dev)
1367                 return;
1368         if (in6_dev->cnf.forwarding || !in6_dev->cnf.accept_redirects) {
1369                 in6_dev_put(in6_dev);
1370                 return;
1371         }
1372
1373         /* RFC2461 8.1:
1374          *      The IP source address of the Redirect MUST be the same as the current
1375          *      first-hop router for the specified ICMP Destination Address.
1376          */
1377
1378         if (!ndisc_parse_options((u8*)(dest + 1), optlen, &ndopts)) {
1379                 ND_PRINTK2(KERN_WARNING
1380                            "ICMPv6 Redirect: invalid ND options\n");
1381                 in6_dev_put(in6_dev);
1382                 return;
1383         }
1384         if (ndopts.nd_opts_tgt_lladdr) {
1385                 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_tgt_lladdr,
1386                                              skb->dev);
1387                 if (!lladdr) {
1388                         ND_PRINTK2(KERN_WARNING
1389                                    "ICMPv6 Redirect: invalid link-layer address length\n");
1390                         in6_dev_put(in6_dev);
1391                         return;
1392                 }
1393         }
1394
1395         neigh = __neigh_lookup(&nd_tbl, target, skb->dev, 1);
1396         if (neigh) {
1397                 rt6_redirect(dest, &ipv6_hdr(skb)->daddr,
1398                              &ipv6_hdr(skb)->saddr, neigh, lladdr,
1399                              on_link);
1400                 neigh_release(neigh);
1401         }
1402         in6_dev_put(in6_dev);
1403 }
1404
1405 void ndisc_send_redirect(struct sk_buff *skb, struct neighbour *neigh,
1406                          struct in6_addr *target)
1407 {
1408         struct sock *sk = ndisc_socket->sk;
1409         int len = sizeof(struct icmp6hdr) + 2 * sizeof(struct in6_addr);
1410         struct sk_buff *buff;
1411         struct icmp6hdr *icmph;
1412         struct in6_addr saddr_buf;
1413         struct in6_addr *addrp;
1414         struct net_device *dev;
1415         struct rt6_info *rt;
1416         struct dst_entry *dst;
1417         struct inet6_dev *idev;
1418         struct flowi fl;
1419         u8 *opt;
1420         int rd_len;
1421         int err;
1422         int hlen;
1423         u8 ha_buf[MAX_ADDR_LEN], *ha = NULL;
1424
1425         dev = skb->dev;
1426
1427         if (ipv6_get_lladdr(dev, &saddr_buf, IFA_F_TENTATIVE)) {
1428                 ND_PRINTK2(KERN_WARNING
1429                            "ICMPv6 Redirect: no link-local address on %s\n",
1430                            dev->name);
1431                 return;
1432         }
1433
1434         if (!ipv6_addr_equal(&ipv6_hdr(skb)->daddr, target) &&
1435             ipv6_addr_type(target) != (IPV6_ADDR_UNICAST|IPV6_ADDR_LINKLOCAL)) {
1436                 ND_PRINTK2(KERN_WARNING
1437                         "ICMPv6 Redirect: target address is not link-local unicast.\n");
1438                 return;
1439         }
1440
1441         ndisc_flow_init(&fl, NDISC_REDIRECT, &saddr_buf, &ipv6_hdr(skb)->saddr,
1442                         dev->ifindex);
1443
1444         dst = ip6_route_output(NULL, &fl);
1445         if (dst == NULL)
1446                 return;
1447
1448         err = xfrm_lookup(&dst, &fl, NULL, 0);
1449         if (err)
1450                 return;
1451
1452         rt = (struct rt6_info *) dst;
1453
1454         if (rt->rt6i_flags & RTF_GATEWAY) {
1455                 ND_PRINTK2(KERN_WARNING
1456                            "ICMPv6 Redirect: destination is not a neighbour.\n");
1457                 dst_release(dst);
1458                 return;
1459         }
1460         if (!xrlim_allow(dst, 1*HZ)) {
1461                 dst_release(dst);
1462                 return;
1463         }
1464
1465         if (dev->addr_len) {
1466                 read_lock_bh(&neigh->lock);
1467                 if (neigh->nud_state & NUD_VALID) {
1468                         memcpy(ha_buf, neigh->ha, dev->addr_len);
1469                         read_unlock_bh(&neigh->lock);
1470                         ha = ha_buf;
1471                         len += ndisc_opt_addr_space(dev);
1472                 } else
1473                         read_unlock_bh(&neigh->lock);
1474         }
1475
1476         rd_len = min_t(unsigned int,
1477                      IPV6_MIN_MTU-sizeof(struct ipv6hdr)-len, skb->len + 8);
1478         rd_len &= ~0x7;
1479         len += rd_len;
1480
1481         buff = sock_alloc_send_skb(sk,
1482                                    (MAX_HEADER + sizeof(struct ipv6hdr) +
1483                                     len + LL_RESERVED_SPACE(dev)),
1484                                    1, &err);
1485         if (buff == NULL) {
1486                 ND_PRINTK0(KERN_ERR
1487                            "ICMPv6 Redirect: %s() failed to allocate an skb.\n",
1488                            __FUNCTION__);
1489                 dst_release(dst);
1490                 return;
1491         }
1492
1493         hlen = 0;
1494
1495         skb_reserve(buff, LL_RESERVED_SPACE(dev));
1496         ip6_nd_hdr(sk, buff, dev, &saddr_buf, &ipv6_hdr(skb)->saddr,
1497                    IPPROTO_ICMPV6, len);
1498
1499         skb_set_transport_header(buff, skb_tail_pointer(buff) - buff->data);
1500         skb_put(buff, len);
1501         icmph = icmp6_hdr(buff);
1502
1503         memset(icmph, 0, sizeof(struct icmp6hdr));
1504         icmph->icmp6_type = NDISC_REDIRECT;
1505
1506         /*
1507          *      copy target and destination addresses
1508          */
1509
1510         addrp = (struct in6_addr *)(icmph + 1);
1511         ipv6_addr_copy(addrp, target);
1512         addrp++;
1513         ipv6_addr_copy(addrp, &ipv6_hdr(skb)->daddr);
1514
1515         opt = (u8*) (addrp + 1);
1516
1517         /*
1518          *      include target_address option
1519          */
1520
1521         if (ha)
1522                 opt = ndisc_fill_addr_option(opt, ND_OPT_TARGET_LL_ADDR, ha,
1523                                              dev->addr_len, dev->type);
1524
1525         /*
1526          *      build redirect option and copy skb over to the new packet.
1527          */
1528
1529         memset(opt, 0, 8);
1530         *(opt++) = ND_OPT_REDIRECT_HDR;
1531         *(opt++) = (rd_len >> 3);
1532         opt += 6;
1533
1534         memcpy(opt, ipv6_hdr(skb), rd_len - 8);
1535
1536         icmph->icmp6_cksum = csum_ipv6_magic(&saddr_buf, &ipv6_hdr(skb)->saddr,
1537                                              len, IPPROTO_ICMPV6,
1538                                              csum_partial((u8 *) icmph, len, 0));
1539
1540         buff->dst = dst;
1541         idev = in6_dev_get(dst->dev);
1542         IP6_INC_STATS(idev, IPSTATS_MIB_OUTREQUESTS);
1543         err = NF_HOOK(PF_INET6, NF_INET_LOCAL_OUT, buff, NULL, dst->dev,
1544                       dst_output);
1545         if (!err) {
1546                 ICMP6MSGOUT_INC_STATS(idev, NDISC_REDIRECT);
1547                 ICMP6_INC_STATS(idev, ICMP6_MIB_OUTMSGS);
1548         }
1549
1550         if (likely(idev != NULL))
1551                 in6_dev_put(idev);
1552 }
1553
1554 static void pndisc_redo(struct sk_buff *skb)
1555 {
1556         ndisc_recv_ns(skb);
1557         kfree_skb(skb);
1558 }
1559
1560 int ndisc_rcv(struct sk_buff *skb)
1561 {
1562         struct nd_msg *msg;
1563
1564         if (!pskb_may_pull(skb, skb->len))
1565                 return 0;
1566
1567         msg = (struct nd_msg *)skb_transport_header(skb);
1568
1569         __skb_push(skb, skb->data - skb_transport_header(skb));
1570
1571         if (ipv6_hdr(skb)->hop_limit != 255) {
1572                 ND_PRINTK2(KERN_WARNING
1573                            "ICMPv6 NDISC: invalid hop-limit: %d\n",
1574                            ipv6_hdr(skb)->hop_limit);
1575                 return 0;
1576         }
1577
1578         if (msg->icmph.icmp6_code != 0) {
1579                 ND_PRINTK2(KERN_WARNING
1580                            "ICMPv6 NDISC: invalid ICMPv6 code: %d\n",
1581                            msg->icmph.icmp6_code);
1582                 return 0;
1583         }
1584
1585         memset(NEIGH_CB(skb), 0, sizeof(struct neighbour_cb));
1586
1587         switch (msg->icmph.icmp6_type) {
1588         case NDISC_NEIGHBOUR_SOLICITATION:
1589                 ndisc_recv_ns(skb);
1590                 break;
1591
1592         case NDISC_NEIGHBOUR_ADVERTISEMENT:
1593                 ndisc_recv_na(skb);
1594                 break;
1595
1596         case NDISC_ROUTER_SOLICITATION:
1597                 ndisc_recv_rs(skb);
1598                 break;
1599
1600         case NDISC_ROUTER_ADVERTISEMENT:
1601                 ndisc_router_discovery(skb);
1602                 break;
1603
1604         case NDISC_REDIRECT:
1605                 ndisc_redirect_rcv(skb);
1606                 break;
1607         }
1608
1609         return 0;
1610 }
1611
1612 static int ndisc_netdev_event(struct notifier_block *this, unsigned long event, void *ptr)
1613 {
1614         struct net_device *dev = ptr;
1615
1616         if (dev->nd_net != &init_net)
1617                 return NOTIFY_DONE;
1618
1619         switch (event) {
1620         case NETDEV_CHANGEADDR:
1621                 neigh_changeaddr(&nd_tbl, dev);
1622                 fib6_run_gc(~0UL);
1623                 break;
1624         case NETDEV_DOWN:
1625                 neigh_ifdown(&nd_tbl, dev);
1626                 fib6_run_gc(~0UL);
1627                 break;
1628         default:
1629                 break;
1630         }
1631
1632         return NOTIFY_DONE;
1633 }
1634
1635 static struct notifier_block ndisc_netdev_notifier = {
1636         .notifier_call = ndisc_netdev_event,
1637 };
1638
1639 #ifdef CONFIG_SYSCTL
1640 static void ndisc_warn_deprecated_sysctl(struct ctl_table *ctl,
1641                                          const char *func, const char *dev_name)
1642 {
1643         static char warncomm[TASK_COMM_LEN];
1644         static int warned;
1645         if (strcmp(warncomm, current->comm) && warned < 5) {
1646                 strcpy(warncomm, current->comm);
1647                 printk(KERN_WARNING
1648                         "process `%s' is using deprecated sysctl (%s) "
1649                         "net.ipv6.neigh.%s.%s; "
1650                         "Use net.ipv6.neigh.%s.%s_ms "
1651                         "instead.\n",
1652                         warncomm, func,
1653                         dev_name, ctl->procname,
1654                         dev_name, ctl->procname);
1655                 warned++;
1656         }
1657 }
1658
1659 int ndisc_ifinfo_sysctl_change(struct ctl_table *ctl, int write, struct file * filp, void __user *buffer, size_t *lenp, loff_t *ppos)
1660 {
1661         struct net_device *dev = ctl->extra1;
1662         struct inet6_dev *idev;
1663         int ret;
1664
1665         if ((strcmp(ctl->procname, "retrans_time") == 0) ||
1666             (strcmp(ctl->procname, "base_reachable_time") == 0))
1667                 ndisc_warn_deprecated_sysctl(ctl, "syscall", dev ? dev->name : "default");
1668
1669         if (strcmp(ctl->procname, "retrans_time") == 0)
1670                 ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos);
1671
1672         else if (strcmp(ctl->procname, "base_reachable_time") == 0)
1673                 ret = proc_dointvec_jiffies(ctl, write,
1674                                             filp, buffer, lenp, ppos);
1675
1676         else if ((strcmp(ctl->procname, "retrans_time_ms") == 0) ||
1677                  (strcmp(ctl->procname, "base_reachable_time_ms") == 0))
1678                 ret = proc_dointvec_ms_jiffies(ctl, write,
1679                                                filp, buffer, lenp, ppos);
1680         else
1681                 ret = -1;
1682
1683         if (write && ret == 0 && dev && (idev = in6_dev_get(dev)) != NULL) {
1684                 if (ctl->data == &idev->nd_parms->base_reachable_time)
1685                         idev->nd_parms->reachable_time = neigh_rand_reach_time(idev->nd_parms->base_reachable_time);
1686                 idev->tstamp = jiffies;
1687                 inet6_ifinfo_notify(RTM_NEWLINK, idev);
1688                 in6_dev_put(idev);
1689         }
1690         return ret;
1691 }
1692
1693 static int ndisc_ifinfo_sysctl_strategy(ctl_table *ctl, int __user *name,
1694                                         int nlen, void __user *oldval,
1695                                         size_t __user *oldlenp,
1696                                         void __user *newval, size_t newlen)
1697 {
1698         struct net_device *dev = ctl->extra1;
1699         struct inet6_dev *idev;
1700         int ret;
1701
1702         if (ctl->ctl_name == NET_NEIGH_RETRANS_TIME ||
1703             ctl->ctl_name == NET_NEIGH_REACHABLE_TIME)
1704                 ndisc_warn_deprecated_sysctl(ctl, "procfs", dev ? dev->name : "default");
1705
1706         switch (ctl->ctl_name) {
1707         case NET_NEIGH_REACHABLE_TIME:
1708                 ret = sysctl_jiffies(ctl, name, nlen,
1709                                      oldval, oldlenp, newval, newlen);
1710                 break;
1711         case NET_NEIGH_RETRANS_TIME_MS:
1712         case NET_NEIGH_REACHABLE_TIME_MS:
1713                  ret = sysctl_ms_jiffies(ctl, name, nlen,
1714                                          oldval, oldlenp, newval, newlen);
1715                  break;
1716         default:
1717                 ret = 0;
1718         }
1719
1720         if (newval && newlen && ret > 0 &&
1721             dev && (idev = in6_dev_get(dev)) != NULL) {
1722                 if (ctl->ctl_name == NET_NEIGH_REACHABLE_TIME ||
1723                     ctl->ctl_name == NET_NEIGH_REACHABLE_TIME_MS)
1724                         idev->nd_parms->reachable_time = neigh_rand_reach_time(idev->nd_parms->base_reachable_time);
1725                 idev->tstamp = jiffies;
1726                 inet6_ifinfo_notify(RTM_NEWLINK, idev);
1727                 in6_dev_put(idev);
1728         }
1729
1730         return ret;
1731 }
1732
1733 #endif
1734
1735 int __init ndisc_init(struct net_proto_family *ops)
1736 {
1737         struct ipv6_pinfo *np;
1738         struct sock *sk;
1739         int err;
1740
1741         err = sock_create_kern(PF_INET6, SOCK_RAW, IPPROTO_ICMPV6, &ndisc_socket);
1742         if (err < 0) {
1743                 ND_PRINTK0(KERN_ERR
1744                            "ICMPv6 NDISC: Failed to initialize the control socket (err %d).\n",
1745                            err);
1746                 ndisc_socket = NULL; /* For safety. */
1747                 return err;
1748         }
1749
1750         sk = ndisc_socket->sk;
1751         np = inet6_sk(sk);
1752         sk->sk_allocation = GFP_ATOMIC;
1753         np->hop_limit = 255;
1754         /* Do not loopback ndisc messages */
1755         np->mc_loop = 0;
1756         sk->sk_prot->unhash(sk);
1757
1758         /*
1759          * Initialize the neighbour table
1760          */
1761
1762         neigh_table_init(&nd_tbl);
1763
1764 #ifdef CONFIG_SYSCTL
1765         neigh_sysctl_register(NULL, &nd_tbl.parms, NET_IPV6, NET_IPV6_NEIGH,
1766                               "ipv6",
1767                               &ndisc_ifinfo_sysctl_change,
1768                               &ndisc_ifinfo_sysctl_strategy);
1769 #endif
1770
1771         register_netdevice_notifier(&ndisc_netdev_notifier);
1772         return 0;
1773 }
1774
1775 void ndisc_cleanup(void)
1776 {
1777         unregister_netdevice_notifier(&ndisc_netdev_notifier);
1778 #ifdef CONFIG_SYSCTL
1779         neigh_sysctl_unregister(&nd_tbl.parms);
1780 #endif
1781         neigh_table_clear(&nd_tbl);
1782         sock_release(ndisc_socket);
1783         ndisc_socket = NULL; /* For safety. */
1784 }