Add the rt linux 4.1.3-rt3 as base
[kvmfornfv.git] / kernel / net / ipv6 / ndisc.c
1 /*
2  *      Neighbour Discovery for IPv6
3  *      Linux INET6 implementation
4  *
5  *      Authors:
6  *      Pedro Roque             <roque@di.fc.ul.pt>
7  *      Mike Shaver             <shaver@ingenia.com>
8  *
9  *      This program is free software; you can redistribute it and/or
10  *      modify it under the terms of the GNU General Public License
11  *      as published by the Free Software Foundation; either version
12  *      2 of the License, or (at your option) any later version.
13  */
14
15 /*
16  *      Changes:
17  *
18  *      Alexey I. Froloff               :       RFC6106 (DNSSL) support
19  *      Pierre Ynard                    :       export userland ND options
20  *                                              through netlink (RDNSS support)
21  *      Lars Fenneberg                  :       fixed MTU setting on receipt
22  *                                              of an RA.
23  *      Janos Farkas                    :       kmalloc failure checks
24  *      Alexey Kuznetsov                :       state machine reworked
25  *                                              and moved to net/core.
26  *      Pekka Savola                    :       RFC2461 validation
27  *      YOSHIFUJI Hideaki @USAGI        :       Verify ND options properly
28  */
29
30 #define pr_fmt(fmt) "ICMPv6: " fmt
31
32 #include <linux/module.h>
33 #include <linux/errno.h>
34 #include <linux/types.h>
35 #include <linux/socket.h>
36 #include <linux/sockios.h>
37 #include <linux/sched.h>
38 #include <linux/net.h>
39 #include <linux/in6.h>
40 #include <linux/route.h>
41 #include <linux/init.h>
42 #include <linux/rcupdate.h>
43 #include <linux/slab.h>
44 #ifdef CONFIG_SYSCTL
45 #include <linux/sysctl.h>
46 #endif
47
48 #include <linux/if_addr.h>
49 #include <linux/if_arp.h>
50 #include <linux/ipv6.h>
51 #include <linux/icmpv6.h>
52 #include <linux/jhash.h>
53
54 #include <net/sock.h>
55 #include <net/snmp.h>
56
57 #include <net/ipv6.h>
58 #include <net/protocol.h>
59 #include <net/ndisc.h>
60 #include <net/ip6_route.h>
61 #include <net/addrconf.h>
62 #include <net/icmp.h>
63
64 #include <net/netlink.h>
65 #include <linux/rtnetlink.h>
66
67 #include <net/flow.h>
68 #include <net/ip6_checksum.h>
69 #include <net/inet_common.h>
70 #include <linux/proc_fs.h>
71
72 #include <linux/netfilter.h>
73 #include <linux/netfilter_ipv6.h>
74
75 /* Set to 3 to get tracing... */
76 #define ND_DEBUG 1
77
78 #define ND_PRINTK(val, level, fmt, ...)                         \
79 do {                                                            \
80         if (val <= ND_DEBUG)                                    \
81                 net_##level##_ratelimited(fmt, ##__VA_ARGS__);  \
82 } while (0)
83
84 static u32 ndisc_hash(const void *pkey,
85                       const struct net_device *dev,
86                       __u32 *hash_rnd);
87 static bool ndisc_key_eq(const struct neighbour *neigh, const void *pkey);
88 static int ndisc_constructor(struct neighbour *neigh);
89 static void ndisc_solicit(struct neighbour *neigh, struct sk_buff *skb);
90 static void ndisc_error_report(struct neighbour *neigh, struct sk_buff *skb);
91 static int pndisc_constructor(struct pneigh_entry *n);
92 static void pndisc_destructor(struct pneigh_entry *n);
93 static void pndisc_redo(struct sk_buff *skb);
94
95 static const struct neigh_ops ndisc_generic_ops = {
96         .family =               AF_INET6,
97         .solicit =              ndisc_solicit,
98         .error_report =         ndisc_error_report,
99         .output =               neigh_resolve_output,
100         .connected_output =     neigh_connected_output,
101 };
102
103 static const struct neigh_ops ndisc_hh_ops = {
104         .family =               AF_INET6,
105         .solicit =              ndisc_solicit,
106         .error_report =         ndisc_error_report,
107         .output =               neigh_resolve_output,
108         .connected_output =     neigh_resolve_output,
109 };
110
111
112 static const struct neigh_ops ndisc_direct_ops = {
113         .family =               AF_INET6,
114         .output =               neigh_direct_output,
115         .connected_output =     neigh_direct_output,
116 };
117
118 struct neigh_table nd_tbl = {
119         .family =       AF_INET6,
120         .key_len =      sizeof(struct in6_addr),
121         .protocol =     cpu_to_be16(ETH_P_IPV6),
122         .hash =         ndisc_hash,
123         .key_eq =       ndisc_key_eq,
124         .constructor =  ndisc_constructor,
125         .pconstructor = pndisc_constructor,
126         .pdestructor =  pndisc_destructor,
127         .proxy_redo =   pndisc_redo,
128         .id =           "ndisc_cache",
129         .parms = {
130                 .tbl                    = &nd_tbl,
131                 .reachable_time         = ND_REACHABLE_TIME,
132                 .data = {
133                         [NEIGH_VAR_MCAST_PROBES] = 3,
134                         [NEIGH_VAR_UCAST_PROBES] = 3,
135                         [NEIGH_VAR_RETRANS_TIME] = ND_RETRANS_TIMER,
136                         [NEIGH_VAR_BASE_REACHABLE_TIME] = ND_REACHABLE_TIME,
137                         [NEIGH_VAR_DELAY_PROBE_TIME] = 5 * HZ,
138                         [NEIGH_VAR_GC_STALETIME] = 60 * HZ,
139                         [NEIGH_VAR_QUEUE_LEN_BYTES] = 64 * 1024,
140                         [NEIGH_VAR_PROXY_QLEN] = 64,
141                         [NEIGH_VAR_ANYCAST_DELAY] = 1 * HZ,
142                         [NEIGH_VAR_PROXY_DELAY] = (8 * HZ) / 10,
143                 },
144         },
145         .gc_interval =    30 * HZ,
146         .gc_thresh1 =    128,
147         .gc_thresh2 =    512,
148         .gc_thresh3 =   1024,
149 };
150
151 static void ndisc_fill_addr_option(struct sk_buff *skb, int type, void *data)
152 {
153         int pad   = ndisc_addr_option_pad(skb->dev->type);
154         int data_len = skb->dev->addr_len;
155         int space = ndisc_opt_addr_space(skb->dev);
156         u8 *opt = skb_put(skb, space);
157
158         opt[0] = type;
159         opt[1] = space>>3;
160
161         memset(opt + 2, 0, pad);
162         opt   += pad;
163         space -= pad;
164
165         memcpy(opt+2, data, data_len);
166         data_len += 2;
167         opt += data_len;
168         space -= data_len;
169         if (space > 0)
170                 memset(opt, 0, space);
171 }
172
173 static struct nd_opt_hdr *ndisc_next_option(struct nd_opt_hdr *cur,
174                                             struct nd_opt_hdr *end)
175 {
176         int type;
177         if (!cur || !end || cur >= end)
178                 return NULL;
179         type = cur->nd_opt_type;
180         do {
181                 cur = ((void *)cur) + (cur->nd_opt_len << 3);
182         } while (cur < end && cur->nd_opt_type != type);
183         return cur <= end && cur->nd_opt_type == type ? cur : NULL;
184 }
185
186 static inline int ndisc_is_useropt(struct nd_opt_hdr *opt)
187 {
188         return opt->nd_opt_type == ND_OPT_RDNSS ||
189                 opt->nd_opt_type == ND_OPT_DNSSL;
190 }
191
192 static struct nd_opt_hdr *ndisc_next_useropt(struct nd_opt_hdr *cur,
193                                              struct nd_opt_hdr *end)
194 {
195         if (!cur || !end || cur >= end)
196                 return NULL;
197         do {
198                 cur = ((void *)cur) + (cur->nd_opt_len << 3);
199         } while (cur < end && !ndisc_is_useropt(cur));
200         return cur <= end && ndisc_is_useropt(cur) ? cur : NULL;
201 }
202
203 struct ndisc_options *ndisc_parse_options(u8 *opt, int opt_len,
204                                           struct ndisc_options *ndopts)
205 {
206         struct nd_opt_hdr *nd_opt = (struct nd_opt_hdr *)opt;
207
208         if (!nd_opt || opt_len < 0 || !ndopts)
209                 return NULL;
210         memset(ndopts, 0, sizeof(*ndopts));
211         while (opt_len) {
212                 int l;
213                 if (opt_len < sizeof(struct nd_opt_hdr))
214                         return NULL;
215                 l = nd_opt->nd_opt_len << 3;
216                 if (opt_len < l || l == 0)
217                         return NULL;
218                 switch (nd_opt->nd_opt_type) {
219                 case ND_OPT_SOURCE_LL_ADDR:
220                 case ND_OPT_TARGET_LL_ADDR:
221                 case ND_OPT_MTU:
222                 case ND_OPT_REDIRECT_HDR:
223                         if (ndopts->nd_opt_array[nd_opt->nd_opt_type]) {
224                                 ND_PRINTK(2, warn,
225                                           "%s: duplicated ND6 option found: type=%d\n",
226                                           __func__, nd_opt->nd_opt_type);
227                         } else {
228                                 ndopts->nd_opt_array[nd_opt->nd_opt_type] = nd_opt;
229                         }
230                         break;
231                 case ND_OPT_PREFIX_INFO:
232                         ndopts->nd_opts_pi_end = nd_opt;
233                         if (!ndopts->nd_opt_array[nd_opt->nd_opt_type])
234                                 ndopts->nd_opt_array[nd_opt->nd_opt_type] = nd_opt;
235                         break;
236 #ifdef CONFIG_IPV6_ROUTE_INFO
237                 case ND_OPT_ROUTE_INFO:
238                         ndopts->nd_opts_ri_end = nd_opt;
239                         if (!ndopts->nd_opts_ri)
240                                 ndopts->nd_opts_ri = nd_opt;
241                         break;
242 #endif
243                 default:
244                         if (ndisc_is_useropt(nd_opt)) {
245                                 ndopts->nd_useropts_end = nd_opt;
246                                 if (!ndopts->nd_useropts)
247                                         ndopts->nd_useropts = nd_opt;
248                         } else {
249                                 /*
250                                  * Unknown options must be silently ignored,
251                                  * to accommodate future extension to the
252                                  * protocol.
253                                  */
254                                 ND_PRINTK(2, notice,
255                                           "%s: ignored unsupported option; type=%d, len=%d\n",
256                                           __func__,
257                                           nd_opt->nd_opt_type,
258                                           nd_opt->nd_opt_len);
259                         }
260                 }
261                 opt_len -= l;
262                 nd_opt = ((void *)nd_opt) + l;
263         }
264         return ndopts;
265 }
266
267 int ndisc_mc_map(const struct in6_addr *addr, char *buf, struct net_device *dev, int dir)
268 {
269         switch (dev->type) {
270         case ARPHRD_ETHER:
271         case ARPHRD_IEEE802:    /* Not sure. Check it later. --ANK */
272         case ARPHRD_FDDI:
273                 ipv6_eth_mc_map(addr, buf);
274                 return 0;
275         case ARPHRD_ARCNET:
276                 ipv6_arcnet_mc_map(addr, buf);
277                 return 0;
278         case ARPHRD_INFINIBAND:
279                 ipv6_ib_mc_map(addr, dev->broadcast, buf);
280                 return 0;
281         case ARPHRD_IPGRE:
282                 return ipv6_ipgre_mc_map(addr, dev->broadcast, buf);
283         default:
284                 if (dir) {
285                         memcpy(buf, dev->broadcast, dev->addr_len);
286                         return 0;
287                 }
288         }
289         return -EINVAL;
290 }
291 EXPORT_SYMBOL(ndisc_mc_map);
292
293 static u32 ndisc_hash(const void *pkey,
294                       const struct net_device *dev,
295                       __u32 *hash_rnd)
296 {
297         return ndisc_hashfn(pkey, dev, hash_rnd);
298 }
299
300 static bool ndisc_key_eq(const struct neighbour *n, const void *pkey)
301 {
302         return neigh_key_eq128(n, pkey);
303 }
304
305 static int ndisc_constructor(struct neighbour *neigh)
306 {
307         struct in6_addr *addr = (struct in6_addr *)&neigh->primary_key;
308         struct net_device *dev = neigh->dev;
309         struct inet6_dev *in6_dev;
310         struct neigh_parms *parms;
311         bool is_multicast = ipv6_addr_is_multicast(addr);
312
313         in6_dev = in6_dev_get(dev);
314         if (!in6_dev) {
315                 return -EINVAL;
316         }
317
318         parms = in6_dev->nd_parms;
319         __neigh_parms_put(neigh->parms);
320         neigh->parms = neigh_parms_clone(parms);
321
322         neigh->type = is_multicast ? RTN_MULTICAST : RTN_UNICAST;
323         if (!dev->header_ops) {
324                 neigh->nud_state = NUD_NOARP;
325                 neigh->ops = &ndisc_direct_ops;
326                 neigh->output = neigh_direct_output;
327         } else {
328                 if (is_multicast) {
329                         neigh->nud_state = NUD_NOARP;
330                         ndisc_mc_map(addr, neigh->ha, dev, 1);
331                 } else if (dev->flags&(IFF_NOARP|IFF_LOOPBACK)) {
332                         neigh->nud_state = NUD_NOARP;
333                         memcpy(neigh->ha, dev->dev_addr, dev->addr_len);
334                         if (dev->flags&IFF_LOOPBACK)
335                                 neigh->type = RTN_LOCAL;
336                 } else if (dev->flags&IFF_POINTOPOINT) {
337                         neigh->nud_state = NUD_NOARP;
338                         memcpy(neigh->ha, dev->broadcast, dev->addr_len);
339                 }
340                 if (dev->header_ops->cache)
341                         neigh->ops = &ndisc_hh_ops;
342                 else
343                         neigh->ops = &ndisc_generic_ops;
344                 if (neigh->nud_state&NUD_VALID)
345                         neigh->output = neigh->ops->connected_output;
346                 else
347                         neigh->output = neigh->ops->output;
348         }
349         in6_dev_put(in6_dev);
350         return 0;
351 }
352
353 static int pndisc_constructor(struct pneigh_entry *n)
354 {
355         struct in6_addr *addr = (struct in6_addr *)&n->key;
356         struct in6_addr maddr;
357         struct net_device *dev = n->dev;
358
359         if (!dev || !__in6_dev_get(dev))
360                 return -EINVAL;
361         addrconf_addr_solict_mult(addr, &maddr);
362         ipv6_dev_mc_inc(dev, &maddr);
363         return 0;
364 }
365
366 static void pndisc_destructor(struct pneigh_entry *n)
367 {
368         struct in6_addr *addr = (struct in6_addr *)&n->key;
369         struct in6_addr maddr;
370         struct net_device *dev = n->dev;
371
372         if (!dev || !__in6_dev_get(dev))
373                 return;
374         addrconf_addr_solict_mult(addr, &maddr);
375         ipv6_dev_mc_dec(dev, &maddr);
376 }
377
378 static struct sk_buff *ndisc_alloc_skb(struct net_device *dev,
379                                        int len)
380 {
381         int hlen = LL_RESERVED_SPACE(dev);
382         int tlen = dev->needed_tailroom;
383         struct sock *sk = dev_net(dev)->ipv6.ndisc_sk;
384         struct sk_buff *skb;
385
386         skb = alloc_skb(hlen + sizeof(struct ipv6hdr) + len + tlen, GFP_ATOMIC);
387         if (!skb) {
388                 ND_PRINTK(0, err, "ndisc: %s failed to allocate an skb\n",
389                           __func__);
390                 return NULL;
391         }
392
393         skb->protocol = htons(ETH_P_IPV6);
394         skb->dev = dev;
395
396         skb_reserve(skb, hlen + sizeof(struct ipv6hdr));
397         skb_reset_transport_header(skb);
398
399         /* Manually assign socket ownership as we avoid calling
400          * sock_alloc_send_pskb() to bypass wmem buffer limits
401          */
402         skb_set_owner_w(skb, sk);
403
404         return skb;
405 }
406
407 static void ip6_nd_hdr(struct sk_buff *skb,
408                        const struct in6_addr *saddr,
409                        const struct in6_addr *daddr,
410                        int hop_limit, int len)
411 {
412         struct ipv6hdr *hdr;
413
414         skb_push(skb, sizeof(*hdr));
415         skb_reset_network_header(skb);
416         hdr = ipv6_hdr(skb);
417
418         ip6_flow_hdr(hdr, 0, 0);
419
420         hdr->payload_len = htons(len);
421         hdr->nexthdr = IPPROTO_ICMPV6;
422         hdr->hop_limit = hop_limit;
423
424         hdr->saddr = *saddr;
425         hdr->daddr = *daddr;
426 }
427
428 static void ndisc_send_skb(struct sk_buff *skb,
429                            const struct in6_addr *daddr,
430                            const struct in6_addr *saddr)
431 {
432         struct dst_entry *dst = skb_dst(skb);
433         struct net *net = dev_net(skb->dev);
434         struct sock *sk = net->ipv6.ndisc_sk;
435         struct inet6_dev *idev;
436         int err;
437         struct icmp6hdr *icmp6h = icmp6_hdr(skb);
438         u8 type;
439
440         type = icmp6h->icmp6_type;
441
442         if (!dst) {
443                 struct flowi6 fl6;
444
445                 icmpv6_flow_init(sk, &fl6, type, saddr, daddr, skb->dev->ifindex);
446                 dst = icmp6_dst_alloc(skb->dev, &fl6);
447                 if (IS_ERR(dst)) {
448                         kfree_skb(skb);
449                         return;
450                 }
451
452                 skb_dst_set(skb, dst);
453         }
454
455         icmp6h->icmp6_cksum = csum_ipv6_magic(saddr, daddr, skb->len,
456                                               IPPROTO_ICMPV6,
457                                               csum_partial(icmp6h,
458                                                            skb->len, 0));
459
460         ip6_nd_hdr(skb, saddr, daddr, inet6_sk(sk)->hop_limit, skb->len);
461
462         rcu_read_lock();
463         idev = __in6_dev_get(dst->dev);
464         IP6_UPD_PO_STATS(net, idev, IPSTATS_MIB_OUT, skb->len);
465
466         err = NF_HOOK(NFPROTO_IPV6, NF_INET_LOCAL_OUT, sk, skb,
467                       NULL, dst->dev,
468                       dst_output_sk);
469         if (!err) {
470                 ICMP6MSGOUT_INC_STATS(net, idev, type);
471                 ICMP6_INC_STATS(net, idev, ICMP6_MIB_OUTMSGS);
472         }
473
474         rcu_read_unlock();
475 }
476
477 void ndisc_send_na(struct net_device *dev, struct neighbour *neigh,
478                    const struct in6_addr *daddr,
479                    const struct in6_addr *solicited_addr,
480                    bool router, bool solicited, bool override, bool inc_opt)
481 {
482         struct sk_buff *skb;
483         struct in6_addr tmpaddr;
484         struct inet6_ifaddr *ifp;
485         const struct in6_addr *src_addr;
486         struct nd_msg *msg;
487         int optlen = 0;
488
489         /* for anycast or proxy, solicited_addr != src_addr */
490         ifp = ipv6_get_ifaddr(dev_net(dev), solicited_addr, dev, 1);
491         if (ifp) {
492                 src_addr = solicited_addr;
493                 if (ifp->flags & IFA_F_OPTIMISTIC)
494                         override = false;
495                 inc_opt |= ifp->idev->cnf.force_tllao;
496                 in6_ifa_put(ifp);
497         } else {
498                 if (ipv6_dev_get_saddr(dev_net(dev), dev, daddr,
499                                        inet6_sk(dev_net(dev)->ipv6.ndisc_sk)->srcprefs,
500                                        &tmpaddr))
501                         return;
502                 src_addr = &tmpaddr;
503         }
504
505         if (!dev->addr_len)
506                 inc_opt = 0;
507         if (inc_opt)
508                 optlen += ndisc_opt_addr_space(dev);
509
510         skb = ndisc_alloc_skb(dev, sizeof(*msg) + optlen);
511         if (!skb)
512                 return;
513
514         msg = (struct nd_msg *)skb_put(skb, sizeof(*msg));
515         *msg = (struct nd_msg) {
516                 .icmph = {
517                         .icmp6_type = NDISC_NEIGHBOUR_ADVERTISEMENT,
518                         .icmp6_router = router,
519                         .icmp6_solicited = solicited,
520                         .icmp6_override = override,
521                 },
522                 .target = *solicited_addr,
523         };
524
525         if (inc_opt)
526                 ndisc_fill_addr_option(skb, ND_OPT_TARGET_LL_ADDR,
527                                        dev->dev_addr);
528
529
530         ndisc_send_skb(skb, daddr, src_addr);
531 }
532
533 static void ndisc_send_unsol_na(struct net_device *dev)
534 {
535         struct inet6_dev *idev;
536         struct inet6_ifaddr *ifa;
537
538         idev = in6_dev_get(dev);
539         if (!idev)
540                 return;
541
542         read_lock_bh(&idev->lock);
543         list_for_each_entry(ifa, &idev->addr_list, if_list) {
544                 ndisc_send_na(dev, NULL, &in6addr_linklocal_allnodes, &ifa->addr,
545                               /*router=*/ !!idev->cnf.forwarding,
546                               /*solicited=*/ false, /*override=*/ true,
547                               /*inc_opt=*/ true);
548         }
549         read_unlock_bh(&idev->lock);
550
551         in6_dev_put(idev);
552 }
553
554 void ndisc_send_ns(struct net_device *dev, struct neighbour *neigh,
555                    const struct in6_addr *solicit,
556                    const struct in6_addr *daddr, const struct in6_addr *saddr)
557 {
558         struct sk_buff *skb;
559         struct in6_addr addr_buf;
560         int inc_opt = dev->addr_len;
561         int optlen = 0;
562         struct nd_msg *msg;
563
564         if (!saddr) {
565                 if (ipv6_get_lladdr(dev, &addr_buf,
566                                    (IFA_F_TENTATIVE|IFA_F_OPTIMISTIC)))
567                         return;
568                 saddr = &addr_buf;
569         }
570
571         if (ipv6_addr_any(saddr))
572                 inc_opt = false;
573         if (inc_opt)
574                 optlen += ndisc_opt_addr_space(dev);
575
576         skb = ndisc_alloc_skb(dev, sizeof(*msg) + optlen);
577         if (!skb)
578                 return;
579
580         msg = (struct nd_msg *)skb_put(skb, sizeof(*msg));
581         *msg = (struct nd_msg) {
582                 .icmph = {
583                         .icmp6_type = NDISC_NEIGHBOUR_SOLICITATION,
584                 },
585                 .target = *solicit,
586         };
587
588         if (inc_opt)
589                 ndisc_fill_addr_option(skb, ND_OPT_SOURCE_LL_ADDR,
590                                        dev->dev_addr);
591
592         ndisc_send_skb(skb, daddr, saddr);
593 }
594
595 void ndisc_send_rs(struct net_device *dev, const struct in6_addr *saddr,
596                    const struct in6_addr *daddr)
597 {
598         struct sk_buff *skb;
599         struct rs_msg *msg;
600         int send_sllao = dev->addr_len;
601         int optlen = 0;
602
603 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD
604         /*
605          * According to section 2.2 of RFC 4429, we must not
606          * send router solicitations with a sllao from
607          * optimistic addresses, but we may send the solicitation
608          * if we don't include the sllao.  So here we check
609          * if our address is optimistic, and if so, we
610          * suppress the inclusion of the sllao.
611          */
612         if (send_sllao) {
613                 struct inet6_ifaddr *ifp = ipv6_get_ifaddr(dev_net(dev), saddr,
614                                                            dev, 1);
615                 if (ifp) {
616                         if (ifp->flags & IFA_F_OPTIMISTIC)  {
617                                 send_sllao = 0;
618                         }
619                         in6_ifa_put(ifp);
620                 } else {
621                         send_sllao = 0;
622                 }
623         }
624 #endif
625         if (send_sllao)
626                 optlen += ndisc_opt_addr_space(dev);
627
628         skb = ndisc_alloc_skb(dev, sizeof(*msg) + optlen);
629         if (!skb)
630                 return;
631
632         msg = (struct rs_msg *)skb_put(skb, sizeof(*msg));
633         *msg = (struct rs_msg) {
634                 .icmph = {
635                         .icmp6_type = NDISC_ROUTER_SOLICITATION,
636                 },
637         };
638
639         if (send_sllao)
640                 ndisc_fill_addr_option(skb, ND_OPT_SOURCE_LL_ADDR,
641                                        dev->dev_addr);
642
643         ndisc_send_skb(skb, daddr, saddr);
644 }
645
646
647 static void ndisc_error_report(struct neighbour *neigh, struct sk_buff *skb)
648 {
649         /*
650          *      "The sender MUST return an ICMP
651          *       destination unreachable"
652          */
653         dst_link_failure(skb);
654         kfree_skb(skb);
655 }
656
657 /* Called with locked neigh: either read or both */
658
659 static void ndisc_solicit(struct neighbour *neigh, struct sk_buff *skb)
660 {
661         struct in6_addr *saddr = NULL;
662         struct in6_addr mcaddr;
663         struct net_device *dev = neigh->dev;
664         struct in6_addr *target = (struct in6_addr *)&neigh->primary_key;
665         int probes = atomic_read(&neigh->probes);
666
667         if (skb && ipv6_chk_addr_and_flags(dev_net(dev), &ipv6_hdr(skb)->saddr,
668                                            dev, 1,
669                                            IFA_F_TENTATIVE|IFA_F_OPTIMISTIC))
670                 saddr = &ipv6_hdr(skb)->saddr;
671         probes -= NEIGH_VAR(neigh->parms, UCAST_PROBES);
672         if (probes < 0) {
673                 if (!(neigh->nud_state & NUD_VALID)) {
674                         ND_PRINTK(1, dbg,
675                                   "%s: trying to ucast probe in NUD_INVALID: %pI6\n",
676                                   __func__, target);
677                 }
678                 ndisc_send_ns(dev, neigh, target, target, saddr);
679         } else if ((probes -= NEIGH_VAR(neigh->parms, APP_PROBES)) < 0) {
680                 neigh_app_ns(neigh);
681         } else {
682                 addrconf_addr_solict_mult(target, &mcaddr);
683                 ndisc_send_ns(dev, NULL, target, &mcaddr, saddr);
684         }
685 }
686
687 static int pndisc_is_router(const void *pkey,
688                             struct net_device *dev)
689 {
690         struct pneigh_entry *n;
691         int ret = -1;
692
693         read_lock_bh(&nd_tbl.lock);
694         n = __pneigh_lookup(&nd_tbl, dev_net(dev), pkey, dev);
695         if (n)
696                 ret = !!(n->flags & NTF_ROUTER);
697         read_unlock_bh(&nd_tbl.lock);
698
699         return ret;
700 }
701
702 static void ndisc_recv_ns(struct sk_buff *skb)
703 {
704         struct nd_msg *msg = (struct nd_msg *)skb_transport_header(skb);
705         const struct in6_addr *saddr = &ipv6_hdr(skb)->saddr;
706         const struct in6_addr *daddr = &ipv6_hdr(skb)->daddr;
707         u8 *lladdr = NULL;
708         u32 ndoptlen = skb_tail_pointer(skb) - (skb_transport_header(skb) +
709                                     offsetof(struct nd_msg, opt));
710         struct ndisc_options ndopts;
711         struct net_device *dev = skb->dev;
712         struct inet6_ifaddr *ifp;
713         struct inet6_dev *idev = NULL;
714         struct neighbour *neigh;
715         int dad = ipv6_addr_any(saddr);
716         bool inc;
717         int is_router = -1;
718
719         if (skb->len < sizeof(struct nd_msg)) {
720                 ND_PRINTK(2, warn, "NS: packet too short\n");
721                 return;
722         }
723
724         if (ipv6_addr_is_multicast(&msg->target)) {
725                 ND_PRINTK(2, warn, "NS: multicast target address\n");
726                 return;
727         }
728
729         /*
730          * RFC2461 7.1.1:
731          * DAD has to be destined for solicited node multicast address.
732          */
733         if (dad && !ipv6_addr_is_solict_mult(daddr)) {
734                 ND_PRINTK(2, warn, "NS: bad DAD packet (wrong destination)\n");
735                 return;
736         }
737
738         if (!ndisc_parse_options(msg->opt, ndoptlen, &ndopts)) {
739                 ND_PRINTK(2, warn, "NS: invalid ND options\n");
740                 return;
741         }
742
743         if (ndopts.nd_opts_src_lladdr) {
744                 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_src_lladdr, dev);
745                 if (!lladdr) {
746                         ND_PRINTK(2, warn,
747                                   "NS: invalid link-layer address length\n");
748                         return;
749                 }
750
751                 /* RFC2461 7.1.1:
752                  *      If the IP source address is the unspecified address,
753                  *      there MUST NOT be source link-layer address option
754                  *      in the message.
755                  */
756                 if (dad) {
757                         ND_PRINTK(2, warn,
758                                   "NS: bad DAD packet (link-layer address option)\n");
759                         return;
760                 }
761         }
762
763         inc = ipv6_addr_is_multicast(daddr);
764
765         ifp = ipv6_get_ifaddr(dev_net(dev), &msg->target, dev, 1);
766         if (ifp) {
767
768                 if (ifp->flags & (IFA_F_TENTATIVE|IFA_F_OPTIMISTIC)) {
769                         if (dad) {
770                                 /*
771                                  * We are colliding with another node
772                                  * who is doing DAD
773                                  * so fail our DAD process
774                                  */
775                                 addrconf_dad_failure(ifp);
776                                 return;
777                         } else {
778                                 /*
779                                  * This is not a dad solicitation.
780                                  * If we are an optimistic node,
781                                  * we should respond.
782                                  * Otherwise, we should ignore it.
783                                  */
784                                 if (!(ifp->flags & IFA_F_OPTIMISTIC))
785                                         goto out;
786                         }
787                 }
788
789                 idev = ifp->idev;
790         } else {
791                 struct net *net = dev_net(dev);
792
793                 idev = in6_dev_get(dev);
794                 if (!idev) {
795                         /* XXX: count this drop? */
796                         return;
797                 }
798
799                 if (ipv6_chk_acast_addr(net, dev, &msg->target) ||
800                     (idev->cnf.forwarding &&
801                      (net->ipv6.devconf_all->proxy_ndp || idev->cnf.proxy_ndp) &&
802                      (is_router = pndisc_is_router(&msg->target, dev)) >= 0)) {
803                         if (!(NEIGH_CB(skb)->flags & LOCALLY_ENQUEUED) &&
804                             skb->pkt_type != PACKET_HOST &&
805                             inc &&
806                             NEIGH_VAR(idev->nd_parms, PROXY_DELAY) != 0) {
807                                 /*
808                                  * for anycast or proxy,
809                                  * sender should delay its response
810                                  * by a random time between 0 and
811                                  * MAX_ANYCAST_DELAY_TIME seconds.
812                                  * (RFC2461) -- yoshfuji
813                                  */
814                                 struct sk_buff *n = skb_clone(skb, GFP_ATOMIC);
815                                 if (n)
816                                         pneigh_enqueue(&nd_tbl, idev->nd_parms, n);
817                                 goto out;
818                         }
819                 } else
820                         goto out;
821         }
822
823         if (is_router < 0)
824                 is_router = idev->cnf.forwarding;
825
826         if (dad) {
827                 ndisc_send_na(dev, NULL, &in6addr_linklocal_allnodes, &msg->target,
828                               !!is_router, false, (ifp != NULL), true);
829                 goto out;
830         }
831
832         if (inc)
833                 NEIGH_CACHE_STAT_INC(&nd_tbl, rcv_probes_mcast);
834         else
835                 NEIGH_CACHE_STAT_INC(&nd_tbl, rcv_probes_ucast);
836
837         /*
838          *      update / create cache entry
839          *      for the source address
840          */
841         neigh = __neigh_lookup(&nd_tbl, saddr, dev,
842                                !inc || lladdr || !dev->addr_len);
843         if (neigh)
844                 neigh_update(neigh, lladdr, NUD_STALE,
845                              NEIGH_UPDATE_F_WEAK_OVERRIDE|
846                              NEIGH_UPDATE_F_OVERRIDE);
847         if (neigh || !dev->header_ops) {
848                 ndisc_send_na(dev, neigh, saddr, &msg->target,
849                               !!is_router,
850                               true, (ifp != NULL && inc), inc);
851                 if (neigh)
852                         neigh_release(neigh);
853         }
854
855 out:
856         if (ifp)
857                 in6_ifa_put(ifp);
858         else
859                 in6_dev_put(idev);
860 }
861
862 static void ndisc_recv_na(struct sk_buff *skb)
863 {
864         struct nd_msg *msg = (struct nd_msg *)skb_transport_header(skb);
865         struct in6_addr *saddr = &ipv6_hdr(skb)->saddr;
866         const struct in6_addr *daddr = &ipv6_hdr(skb)->daddr;
867         u8 *lladdr = NULL;
868         u32 ndoptlen = skb_tail_pointer(skb) - (skb_transport_header(skb) +
869                                     offsetof(struct nd_msg, opt));
870         struct ndisc_options ndopts;
871         struct net_device *dev = skb->dev;
872         struct inet6_ifaddr *ifp;
873         struct neighbour *neigh;
874
875         if (skb->len < sizeof(struct nd_msg)) {
876                 ND_PRINTK(2, warn, "NA: packet too short\n");
877                 return;
878         }
879
880         if (ipv6_addr_is_multicast(&msg->target)) {
881                 ND_PRINTK(2, warn, "NA: target address is multicast\n");
882                 return;
883         }
884
885         if (ipv6_addr_is_multicast(daddr) &&
886             msg->icmph.icmp6_solicited) {
887                 ND_PRINTK(2, warn, "NA: solicited NA is multicasted\n");
888                 return;
889         }
890
891         if (!ndisc_parse_options(msg->opt, ndoptlen, &ndopts)) {
892                 ND_PRINTK(2, warn, "NS: invalid ND option\n");
893                 return;
894         }
895         if (ndopts.nd_opts_tgt_lladdr) {
896                 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_tgt_lladdr, dev);
897                 if (!lladdr) {
898                         ND_PRINTK(2, warn,
899                                   "NA: invalid link-layer address length\n");
900                         return;
901                 }
902         }
903         ifp = ipv6_get_ifaddr(dev_net(dev), &msg->target, dev, 1);
904         if (ifp) {
905                 if (skb->pkt_type != PACKET_LOOPBACK
906                     && (ifp->flags & IFA_F_TENTATIVE)) {
907                                 addrconf_dad_failure(ifp);
908                                 return;
909                 }
910                 /* What should we make now? The advertisement
911                    is invalid, but ndisc specs say nothing
912                    about it. It could be misconfiguration, or
913                    an smart proxy agent tries to help us :-)
914
915                    We should not print the error if NA has been
916                    received from loopback - it is just our own
917                    unsolicited advertisement.
918                  */
919                 if (skb->pkt_type != PACKET_LOOPBACK)
920                         ND_PRINTK(1, warn,
921                                   "NA: someone advertises our address %pI6 on %s!\n",
922                                   &ifp->addr, ifp->idev->dev->name);
923                 in6_ifa_put(ifp);
924                 return;
925         }
926         neigh = neigh_lookup(&nd_tbl, &msg->target, dev);
927
928         if (neigh) {
929                 u8 old_flags = neigh->flags;
930                 struct net *net = dev_net(dev);
931
932                 if (neigh->nud_state & NUD_FAILED)
933                         goto out;
934
935                 /*
936                  * Don't update the neighbor cache entry on a proxy NA from
937                  * ourselves because either the proxied node is off link or it
938                  * has already sent a NA to us.
939                  */
940                 if (lladdr && !memcmp(lladdr, dev->dev_addr, dev->addr_len) &&
941                     net->ipv6.devconf_all->forwarding && net->ipv6.devconf_all->proxy_ndp &&
942                     pneigh_lookup(&nd_tbl, net, &msg->target, dev, 0)) {
943                         /* XXX: idev->cnf.proxy_ndp */
944                         goto out;
945                 }
946
947                 neigh_update(neigh, lladdr,
948                              msg->icmph.icmp6_solicited ? NUD_REACHABLE : NUD_STALE,
949                              NEIGH_UPDATE_F_WEAK_OVERRIDE|
950                              (msg->icmph.icmp6_override ? NEIGH_UPDATE_F_OVERRIDE : 0)|
951                              NEIGH_UPDATE_F_OVERRIDE_ISROUTER|
952                              (msg->icmph.icmp6_router ? NEIGH_UPDATE_F_ISROUTER : 0));
953
954                 if ((old_flags & ~neigh->flags) & NTF_ROUTER) {
955                         /*
956                          * Change: router to host
957                          */
958                         rt6_clean_tohost(dev_net(dev),  saddr);
959                 }
960
961 out:
962                 neigh_release(neigh);
963         }
964 }
965
966 static void ndisc_recv_rs(struct sk_buff *skb)
967 {
968         struct rs_msg *rs_msg = (struct rs_msg *)skb_transport_header(skb);
969         unsigned long ndoptlen = skb->len - sizeof(*rs_msg);
970         struct neighbour *neigh;
971         struct inet6_dev *idev;
972         const struct in6_addr *saddr = &ipv6_hdr(skb)->saddr;
973         struct ndisc_options ndopts;
974         u8 *lladdr = NULL;
975
976         if (skb->len < sizeof(*rs_msg))
977                 return;
978
979         idev = __in6_dev_get(skb->dev);
980         if (!idev) {
981                 ND_PRINTK(1, err, "RS: can't find in6 device\n");
982                 return;
983         }
984
985         /* Don't accept RS if we're not in router mode */
986         if (!idev->cnf.forwarding)
987                 goto out;
988
989         /*
990          * Don't update NCE if src = ::;
991          * this implies that the source node has no ip address assigned yet.
992          */
993         if (ipv6_addr_any(saddr))
994                 goto out;
995
996         /* Parse ND options */
997         if (!ndisc_parse_options(rs_msg->opt, ndoptlen, &ndopts)) {
998                 ND_PRINTK(2, notice, "NS: invalid ND option, ignored\n");
999                 goto out;
1000         }
1001
1002         if (ndopts.nd_opts_src_lladdr) {
1003                 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_src_lladdr,
1004                                              skb->dev);
1005                 if (!lladdr)
1006                         goto out;
1007         }
1008
1009         neigh = __neigh_lookup(&nd_tbl, saddr, skb->dev, 1);
1010         if (neigh) {
1011                 neigh_update(neigh, lladdr, NUD_STALE,
1012                              NEIGH_UPDATE_F_WEAK_OVERRIDE|
1013                              NEIGH_UPDATE_F_OVERRIDE|
1014                              NEIGH_UPDATE_F_OVERRIDE_ISROUTER);
1015                 neigh_release(neigh);
1016         }
1017 out:
1018         return;
1019 }
1020
1021 static void ndisc_ra_useropt(struct sk_buff *ra, struct nd_opt_hdr *opt)
1022 {
1023         struct icmp6hdr *icmp6h = (struct icmp6hdr *)skb_transport_header(ra);
1024         struct sk_buff *skb;
1025         struct nlmsghdr *nlh;
1026         struct nduseroptmsg *ndmsg;
1027         struct net *net = dev_net(ra->dev);
1028         int err;
1029         int base_size = NLMSG_ALIGN(sizeof(struct nduseroptmsg)
1030                                     + (opt->nd_opt_len << 3));
1031         size_t msg_size = base_size + nla_total_size(sizeof(struct in6_addr));
1032
1033         skb = nlmsg_new(msg_size, GFP_ATOMIC);
1034         if (!skb) {
1035                 err = -ENOBUFS;
1036                 goto errout;
1037         }
1038
1039         nlh = nlmsg_put(skb, 0, 0, RTM_NEWNDUSEROPT, base_size, 0);
1040         if (!nlh) {
1041                 goto nla_put_failure;
1042         }
1043
1044         ndmsg = nlmsg_data(nlh);
1045         ndmsg->nduseropt_family = AF_INET6;
1046         ndmsg->nduseropt_ifindex = ra->dev->ifindex;
1047         ndmsg->nduseropt_icmp_type = icmp6h->icmp6_type;
1048         ndmsg->nduseropt_icmp_code = icmp6h->icmp6_code;
1049         ndmsg->nduseropt_opts_len = opt->nd_opt_len << 3;
1050
1051         memcpy(ndmsg + 1, opt, opt->nd_opt_len << 3);
1052
1053         if (nla_put_in6_addr(skb, NDUSEROPT_SRCADDR, &ipv6_hdr(ra)->saddr))
1054                 goto nla_put_failure;
1055         nlmsg_end(skb, nlh);
1056
1057         rtnl_notify(skb, net, 0, RTNLGRP_ND_USEROPT, NULL, GFP_ATOMIC);
1058         return;
1059
1060 nla_put_failure:
1061         nlmsg_free(skb);
1062         err = -EMSGSIZE;
1063 errout:
1064         rtnl_set_sk_err(net, RTNLGRP_ND_USEROPT, err);
1065 }
1066
1067 static void ndisc_router_discovery(struct sk_buff *skb)
1068 {
1069         struct ra_msg *ra_msg = (struct ra_msg *)skb_transport_header(skb);
1070         struct neighbour *neigh = NULL;
1071         struct inet6_dev *in6_dev;
1072         struct rt6_info *rt = NULL;
1073         int lifetime;
1074         struct ndisc_options ndopts;
1075         int optlen;
1076         unsigned int pref = 0;
1077
1078         __u8 *opt = (__u8 *)(ra_msg + 1);
1079
1080         optlen = (skb_tail_pointer(skb) - skb_transport_header(skb)) -
1081                 sizeof(struct ra_msg);
1082
1083         ND_PRINTK(2, info,
1084                   "RA: %s, dev: %s\n",
1085                   __func__, skb->dev->name);
1086         if (!(ipv6_addr_type(&ipv6_hdr(skb)->saddr) & IPV6_ADDR_LINKLOCAL)) {
1087                 ND_PRINTK(2, warn, "RA: source address is not link-local\n");
1088                 return;
1089         }
1090         if (optlen < 0) {
1091                 ND_PRINTK(2, warn, "RA: packet too short\n");
1092                 return;
1093         }
1094
1095 #ifdef CONFIG_IPV6_NDISC_NODETYPE
1096         if (skb->ndisc_nodetype == NDISC_NODETYPE_HOST) {
1097                 ND_PRINTK(2, warn, "RA: from host or unauthorized router\n");
1098                 return;
1099         }
1100 #endif
1101
1102         /*
1103          *      set the RA_RECV flag in the interface
1104          */
1105
1106         in6_dev = __in6_dev_get(skb->dev);
1107         if (!in6_dev) {
1108                 ND_PRINTK(0, err, "RA: can't find inet6 device for %s\n",
1109                           skb->dev->name);
1110                 return;
1111         }
1112
1113         if (!ndisc_parse_options(opt, optlen, &ndopts)) {
1114                 ND_PRINTK(2, warn, "RA: invalid ND options\n");
1115                 return;
1116         }
1117
1118         if (!ipv6_accept_ra(in6_dev)) {
1119                 ND_PRINTK(2, info,
1120                           "RA: %s, did not accept ra for dev: %s\n",
1121                           __func__, skb->dev->name);
1122                 goto skip_linkparms;
1123         }
1124
1125 #ifdef CONFIG_IPV6_NDISC_NODETYPE
1126         /* skip link-specific parameters from interior routers */
1127         if (skb->ndisc_nodetype == NDISC_NODETYPE_NODEFAULT) {
1128                 ND_PRINTK(2, info,
1129                           "RA: %s, nodetype is NODEFAULT, dev: %s\n",
1130                           __func__, skb->dev->name);
1131                 goto skip_linkparms;
1132         }
1133 #endif
1134
1135         if (in6_dev->if_flags & IF_RS_SENT) {
1136                 /*
1137                  *      flag that an RA was received after an RS was sent
1138                  *      out on this interface.
1139                  */
1140                 in6_dev->if_flags |= IF_RA_RCVD;
1141         }
1142
1143         /*
1144          * Remember the managed/otherconf flags from most recently
1145          * received RA message (RFC 2462) -- yoshfuji
1146          */
1147         in6_dev->if_flags = (in6_dev->if_flags & ~(IF_RA_MANAGED |
1148                                 IF_RA_OTHERCONF)) |
1149                                 (ra_msg->icmph.icmp6_addrconf_managed ?
1150                                         IF_RA_MANAGED : 0) |
1151                                 (ra_msg->icmph.icmp6_addrconf_other ?
1152                                         IF_RA_OTHERCONF : 0);
1153
1154         if (!in6_dev->cnf.accept_ra_defrtr) {
1155                 ND_PRINTK(2, info,
1156                           "RA: %s, defrtr is false for dev: %s\n",
1157                           __func__, skb->dev->name);
1158                 goto skip_defrtr;
1159         }
1160
1161         /* Do not accept RA with source-addr found on local machine unless
1162          * accept_ra_from_local is set to true.
1163          */
1164         if (!in6_dev->cnf.accept_ra_from_local &&
1165             ipv6_chk_addr(dev_net(in6_dev->dev), &ipv6_hdr(skb)->saddr,
1166                           NULL, 0)) {
1167                 ND_PRINTK(2, info,
1168                           "RA from local address detected on dev: %s: default router ignored\n",
1169                           skb->dev->name);
1170                 goto skip_defrtr;
1171         }
1172
1173         lifetime = ntohs(ra_msg->icmph.icmp6_rt_lifetime);
1174
1175 #ifdef CONFIG_IPV6_ROUTER_PREF
1176         pref = ra_msg->icmph.icmp6_router_pref;
1177         /* 10b is handled as if it were 00b (medium) */
1178         if (pref == ICMPV6_ROUTER_PREF_INVALID ||
1179             !in6_dev->cnf.accept_ra_rtr_pref)
1180                 pref = ICMPV6_ROUTER_PREF_MEDIUM;
1181 #endif
1182
1183         rt = rt6_get_dflt_router(&ipv6_hdr(skb)->saddr, skb->dev);
1184
1185         if (rt) {
1186                 neigh = dst_neigh_lookup(&rt->dst, &ipv6_hdr(skb)->saddr);
1187                 if (!neigh) {
1188                         ND_PRINTK(0, err,
1189                                   "RA: %s got default router without neighbour\n",
1190                                   __func__);
1191                         ip6_rt_put(rt);
1192                         return;
1193                 }
1194         }
1195         if (rt && lifetime == 0) {
1196                 ip6_del_rt(rt);
1197                 rt = NULL;
1198         }
1199
1200         ND_PRINTK(3, info, "RA: rt: %p  lifetime: %d, for dev: %s\n",
1201                   rt, lifetime, skb->dev->name);
1202         if (!rt && lifetime) {
1203                 ND_PRINTK(3, info, "RA: adding default router\n");
1204
1205                 rt = rt6_add_dflt_router(&ipv6_hdr(skb)->saddr, skb->dev, pref);
1206                 if (!rt) {
1207                         ND_PRINTK(0, err,
1208                                   "RA: %s failed to add default route\n",
1209                                   __func__);
1210                         return;
1211                 }
1212
1213                 neigh = dst_neigh_lookup(&rt->dst, &ipv6_hdr(skb)->saddr);
1214                 if (!neigh) {
1215                         ND_PRINTK(0, err,
1216                                   "RA: %s got default router without neighbour\n",
1217                                   __func__);
1218                         ip6_rt_put(rt);
1219                         return;
1220                 }
1221                 neigh->flags |= NTF_ROUTER;
1222         } else if (rt) {
1223                 rt->rt6i_flags = (rt->rt6i_flags & ~RTF_PREF_MASK) | RTF_PREF(pref);
1224         }
1225
1226         if (rt)
1227                 rt6_set_expires(rt, jiffies + (HZ * lifetime));
1228         if (ra_msg->icmph.icmp6_hop_limit) {
1229                 /* Only set hop_limit on the interface if it is higher than
1230                  * the current hop_limit.
1231                  */
1232                 if (in6_dev->cnf.hop_limit < ra_msg->icmph.icmp6_hop_limit) {
1233                         in6_dev->cnf.hop_limit = ra_msg->icmph.icmp6_hop_limit;
1234                 } else {
1235                         ND_PRINTK(2, warn, "RA: Got route advertisement with lower hop_limit than current\n");
1236                 }
1237                 if (rt)
1238                         dst_metric_set(&rt->dst, RTAX_HOPLIMIT,
1239                                        ra_msg->icmph.icmp6_hop_limit);
1240         }
1241
1242 skip_defrtr:
1243
1244         /*
1245          *      Update Reachable Time and Retrans Timer
1246          */
1247
1248         if (in6_dev->nd_parms) {
1249                 unsigned long rtime = ntohl(ra_msg->retrans_timer);
1250
1251                 if (rtime && rtime/1000 < MAX_SCHEDULE_TIMEOUT/HZ) {
1252                         rtime = (rtime*HZ)/1000;
1253                         if (rtime < HZ/10)
1254                                 rtime = HZ/10;
1255                         NEIGH_VAR_SET(in6_dev->nd_parms, RETRANS_TIME, rtime);
1256                         in6_dev->tstamp = jiffies;
1257                         inet6_ifinfo_notify(RTM_NEWLINK, in6_dev);
1258                 }
1259
1260                 rtime = ntohl(ra_msg->reachable_time);
1261                 if (rtime && rtime/1000 < MAX_SCHEDULE_TIMEOUT/(3*HZ)) {
1262                         rtime = (rtime*HZ)/1000;
1263
1264                         if (rtime < HZ/10)
1265                                 rtime = HZ/10;
1266
1267                         if (rtime != NEIGH_VAR(in6_dev->nd_parms, BASE_REACHABLE_TIME)) {
1268                                 NEIGH_VAR_SET(in6_dev->nd_parms,
1269                                               BASE_REACHABLE_TIME, rtime);
1270                                 NEIGH_VAR_SET(in6_dev->nd_parms,
1271                                               GC_STALETIME, 3 * rtime);
1272                                 in6_dev->nd_parms->reachable_time = neigh_rand_reach_time(rtime);
1273                                 in6_dev->tstamp = jiffies;
1274                                 inet6_ifinfo_notify(RTM_NEWLINK, in6_dev);
1275                         }
1276                 }
1277         }
1278
1279 skip_linkparms:
1280
1281         /*
1282          *      Process options.
1283          */
1284
1285         if (!neigh)
1286                 neigh = __neigh_lookup(&nd_tbl, &ipv6_hdr(skb)->saddr,
1287                                        skb->dev, 1);
1288         if (neigh) {
1289                 u8 *lladdr = NULL;
1290                 if (ndopts.nd_opts_src_lladdr) {
1291                         lladdr = ndisc_opt_addr_data(ndopts.nd_opts_src_lladdr,
1292                                                      skb->dev);
1293                         if (!lladdr) {
1294                                 ND_PRINTK(2, warn,
1295                                           "RA: invalid link-layer address length\n");
1296                                 goto out;
1297                         }
1298                 }
1299                 neigh_update(neigh, lladdr, NUD_STALE,
1300                              NEIGH_UPDATE_F_WEAK_OVERRIDE|
1301                              NEIGH_UPDATE_F_OVERRIDE|
1302                              NEIGH_UPDATE_F_OVERRIDE_ISROUTER|
1303                              NEIGH_UPDATE_F_ISROUTER);
1304         }
1305
1306         if (!ipv6_accept_ra(in6_dev)) {
1307                 ND_PRINTK(2, info,
1308                           "RA: %s, accept_ra is false for dev: %s\n",
1309                           __func__, skb->dev->name);
1310                 goto out;
1311         }
1312
1313 #ifdef CONFIG_IPV6_ROUTE_INFO
1314         if (!in6_dev->cnf.accept_ra_from_local &&
1315             ipv6_chk_addr(dev_net(in6_dev->dev), &ipv6_hdr(skb)->saddr,
1316                           NULL, 0)) {
1317                 ND_PRINTK(2, info,
1318                           "RA from local address detected on dev: %s: router info ignored.\n",
1319                           skb->dev->name);
1320                 goto skip_routeinfo;
1321         }
1322
1323         if (in6_dev->cnf.accept_ra_rtr_pref && ndopts.nd_opts_ri) {
1324                 struct nd_opt_hdr *p;
1325                 for (p = ndopts.nd_opts_ri;
1326                      p;
1327                      p = ndisc_next_option(p, ndopts.nd_opts_ri_end)) {
1328                         struct route_info *ri = (struct route_info *)p;
1329 #ifdef CONFIG_IPV6_NDISC_NODETYPE
1330                         if (skb->ndisc_nodetype == NDISC_NODETYPE_NODEFAULT &&
1331                             ri->prefix_len == 0)
1332                                 continue;
1333 #endif
1334                         if (ri->prefix_len == 0 &&
1335                             !in6_dev->cnf.accept_ra_defrtr)
1336                                 continue;
1337                         if (ri->prefix_len > in6_dev->cnf.accept_ra_rt_info_max_plen)
1338                                 continue;
1339                         rt6_route_rcv(skb->dev, (u8 *)p, (p->nd_opt_len) << 3,
1340                                       &ipv6_hdr(skb)->saddr);
1341                 }
1342         }
1343
1344 skip_routeinfo:
1345 #endif
1346
1347 #ifdef CONFIG_IPV6_NDISC_NODETYPE
1348         /* skip link-specific ndopts from interior routers */
1349         if (skb->ndisc_nodetype == NDISC_NODETYPE_NODEFAULT) {
1350                 ND_PRINTK(2, info,
1351                           "RA: %s, nodetype is NODEFAULT (interior routes), dev: %s\n",
1352                           __func__, skb->dev->name);
1353                 goto out;
1354         }
1355 #endif
1356
1357         if (in6_dev->cnf.accept_ra_pinfo && ndopts.nd_opts_pi) {
1358                 struct nd_opt_hdr *p;
1359                 for (p = ndopts.nd_opts_pi;
1360                      p;
1361                      p = ndisc_next_option(p, ndopts.nd_opts_pi_end)) {
1362                         addrconf_prefix_rcv(skb->dev, (u8 *)p,
1363                                             (p->nd_opt_len) << 3,
1364                                             ndopts.nd_opts_src_lladdr != NULL);
1365                 }
1366         }
1367
1368         if (ndopts.nd_opts_mtu && in6_dev->cnf.accept_ra_mtu) {
1369                 __be32 n;
1370                 u32 mtu;
1371
1372                 memcpy(&n, ((u8 *)(ndopts.nd_opts_mtu+1))+2, sizeof(mtu));
1373                 mtu = ntohl(n);
1374
1375                 if (mtu < IPV6_MIN_MTU || mtu > skb->dev->mtu) {
1376                         ND_PRINTK(2, warn, "RA: invalid mtu: %d\n", mtu);
1377                 } else if (in6_dev->cnf.mtu6 != mtu) {
1378                         in6_dev->cnf.mtu6 = mtu;
1379
1380                         if (rt)
1381                                 dst_metric_set(&rt->dst, RTAX_MTU, mtu);
1382
1383                         rt6_mtu_change(skb->dev, mtu);
1384                 }
1385         }
1386
1387         if (ndopts.nd_useropts) {
1388                 struct nd_opt_hdr *p;
1389                 for (p = ndopts.nd_useropts;
1390                      p;
1391                      p = ndisc_next_useropt(p, ndopts.nd_useropts_end)) {
1392                         ndisc_ra_useropt(skb, p);
1393                 }
1394         }
1395
1396         if (ndopts.nd_opts_tgt_lladdr || ndopts.nd_opts_rh) {
1397                 ND_PRINTK(2, warn, "RA: invalid RA options\n");
1398         }
1399 out:
1400         ip6_rt_put(rt);
1401         if (neigh)
1402                 neigh_release(neigh);
1403 }
1404
1405 static void ndisc_redirect_rcv(struct sk_buff *skb)
1406 {
1407         u8 *hdr;
1408         struct ndisc_options ndopts;
1409         struct rd_msg *msg = (struct rd_msg *)skb_transport_header(skb);
1410         u32 ndoptlen = skb_tail_pointer(skb) - (skb_transport_header(skb) +
1411                                     offsetof(struct rd_msg, opt));
1412
1413 #ifdef CONFIG_IPV6_NDISC_NODETYPE
1414         switch (skb->ndisc_nodetype) {
1415         case NDISC_NODETYPE_HOST:
1416         case NDISC_NODETYPE_NODEFAULT:
1417                 ND_PRINTK(2, warn,
1418                           "Redirect: from host or unauthorized router\n");
1419                 return;
1420         }
1421 #endif
1422
1423         if (!(ipv6_addr_type(&ipv6_hdr(skb)->saddr) & IPV6_ADDR_LINKLOCAL)) {
1424                 ND_PRINTK(2, warn,
1425                           "Redirect: source address is not link-local\n");
1426                 return;
1427         }
1428
1429         if (!ndisc_parse_options(msg->opt, ndoptlen, &ndopts))
1430                 return;
1431
1432         if (!ndopts.nd_opts_rh) {
1433                 ip6_redirect_no_header(skb, dev_net(skb->dev),
1434                                         skb->dev->ifindex, 0);
1435                 return;
1436         }
1437
1438         hdr = (u8 *)ndopts.nd_opts_rh;
1439         hdr += 8;
1440         if (!pskb_pull(skb, hdr - skb_transport_header(skb)))
1441                 return;
1442
1443         icmpv6_notify(skb, NDISC_REDIRECT, 0, 0);
1444 }
1445
1446 static void ndisc_fill_redirect_hdr_option(struct sk_buff *skb,
1447                                            struct sk_buff *orig_skb,
1448                                            int rd_len)
1449 {
1450         u8 *opt = skb_put(skb, rd_len);
1451
1452         memset(opt, 0, 8);
1453         *(opt++) = ND_OPT_REDIRECT_HDR;
1454         *(opt++) = (rd_len >> 3);
1455         opt += 6;
1456
1457         memcpy(opt, ipv6_hdr(orig_skb), rd_len - 8);
1458 }
1459
1460 void ndisc_send_redirect(struct sk_buff *skb, const struct in6_addr *target)
1461 {
1462         struct net_device *dev = skb->dev;
1463         struct net *net = dev_net(dev);
1464         struct sock *sk = net->ipv6.ndisc_sk;
1465         int optlen = 0;
1466         struct inet_peer *peer;
1467         struct sk_buff *buff;
1468         struct rd_msg *msg;
1469         struct in6_addr saddr_buf;
1470         struct rt6_info *rt;
1471         struct dst_entry *dst;
1472         struct flowi6 fl6;
1473         int rd_len;
1474         u8 ha_buf[MAX_ADDR_LEN], *ha = NULL;
1475         bool ret;
1476
1477         if (ipv6_get_lladdr(dev, &saddr_buf, IFA_F_TENTATIVE)) {
1478                 ND_PRINTK(2, warn, "Redirect: no link-local address on %s\n",
1479                           dev->name);
1480                 return;
1481         }
1482
1483         if (!ipv6_addr_equal(&ipv6_hdr(skb)->daddr, target) &&
1484             ipv6_addr_type(target) != (IPV6_ADDR_UNICAST|IPV6_ADDR_LINKLOCAL)) {
1485                 ND_PRINTK(2, warn,
1486                           "Redirect: target address is not link-local unicast\n");
1487                 return;
1488         }
1489
1490         icmpv6_flow_init(sk, &fl6, NDISC_REDIRECT,
1491                          &saddr_buf, &ipv6_hdr(skb)->saddr, dev->ifindex);
1492
1493         dst = ip6_route_output(net, NULL, &fl6);
1494         if (dst->error) {
1495                 dst_release(dst);
1496                 return;
1497         }
1498         dst = xfrm_lookup(net, dst, flowi6_to_flowi(&fl6), NULL, 0);
1499         if (IS_ERR(dst))
1500                 return;
1501
1502         rt = (struct rt6_info *) dst;
1503
1504         if (rt->rt6i_flags & RTF_GATEWAY) {
1505                 ND_PRINTK(2, warn,
1506                           "Redirect: destination is not a neighbour\n");
1507                 goto release;
1508         }
1509         peer = inet_getpeer_v6(net->ipv6.peers, &rt->rt6i_dst.addr, 1);
1510         ret = inet_peer_xrlim_allow(peer, 1*HZ);
1511         if (peer)
1512                 inet_putpeer(peer);
1513         if (!ret)
1514                 goto release;
1515
1516         if (dev->addr_len) {
1517                 struct neighbour *neigh = dst_neigh_lookup(skb_dst(skb), target);
1518                 if (!neigh) {
1519                         ND_PRINTK(2, warn,
1520                                   "Redirect: no neigh for target address\n");
1521                         goto release;
1522                 }
1523
1524                 read_lock_bh(&neigh->lock);
1525                 if (neigh->nud_state & NUD_VALID) {
1526                         memcpy(ha_buf, neigh->ha, dev->addr_len);
1527                         read_unlock_bh(&neigh->lock);
1528                         ha = ha_buf;
1529                         optlen += ndisc_opt_addr_space(dev);
1530                 } else
1531                         read_unlock_bh(&neigh->lock);
1532
1533                 neigh_release(neigh);
1534         }
1535
1536         rd_len = min_t(unsigned int,
1537                        IPV6_MIN_MTU - sizeof(struct ipv6hdr) - sizeof(*msg) - optlen,
1538                        skb->len + 8);
1539         rd_len &= ~0x7;
1540         optlen += rd_len;
1541
1542         buff = ndisc_alloc_skb(dev, sizeof(*msg) + optlen);
1543         if (!buff)
1544                 goto release;
1545
1546         msg = (struct rd_msg *)skb_put(buff, sizeof(*msg));
1547         *msg = (struct rd_msg) {
1548                 .icmph = {
1549                         .icmp6_type = NDISC_REDIRECT,
1550                 },
1551                 .target = *target,
1552                 .dest = ipv6_hdr(skb)->daddr,
1553         };
1554
1555         /*
1556          *      include target_address option
1557          */
1558
1559         if (ha)
1560                 ndisc_fill_addr_option(buff, ND_OPT_TARGET_LL_ADDR, ha);
1561
1562         /*
1563          *      build redirect option and copy skb over to the new packet.
1564          */
1565
1566         if (rd_len)
1567                 ndisc_fill_redirect_hdr_option(buff, skb, rd_len);
1568
1569         skb_dst_set(buff, dst);
1570         ndisc_send_skb(buff, &ipv6_hdr(skb)->saddr, &saddr_buf);
1571         return;
1572
1573 release:
1574         dst_release(dst);
1575 }
1576
1577 static void pndisc_redo(struct sk_buff *skb)
1578 {
1579         ndisc_recv_ns(skb);
1580         kfree_skb(skb);
1581 }
1582
1583 static bool ndisc_suppress_frag_ndisc(struct sk_buff *skb)
1584 {
1585         struct inet6_dev *idev = __in6_dev_get(skb->dev);
1586
1587         if (!idev)
1588                 return true;
1589         if (IP6CB(skb)->flags & IP6SKB_FRAGMENTED &&
1590             idev->cnf.suppress_frag_ndisc) {
1591                 net_warn_ratelimited("Received fragmented ndisc packet. Carefully consider disabling suppress_frag_ndisc.\n");
1592                 return true;
1593         }
1594         return false;
1595 }
1596
1597 int ndisc_rcv(struct sk_buff *skb)
1598 {
1599         struct nd_msg *msg;
1600
1601         if (ndisc_suppress_frag_ndisc(skb))
1602                 return 0;
1603
1604         if (skb_linearize(skb))
1605                 return 0;
1606
1607         msg = (struct nd_msg *)skb_transport_header(skb);
1608
1609         __skb_push(skb, skb->data - skb_transport_header(skb));
1610
1611         if (ipv6_hdr(skb)->hop_limit != 255) {
1612                 ND_PRINTK(2, warn, "NDISC: invalid hop-limit: %d\n",
1613                           ipv6_hdr(skb)->hop_limit);
1614                 return 0;
1615         }
1616
1617         if (msg->icmph.icmp6_code != 0) {
1618                 ND_PRINTK(2, warn, "NDISC: invalid ICMPv6 code: %d\n",
1619                           msg->icmph.icmp6_code);
1620                 return 0;
1621         }
1622
1623         memset(NEIGH_CB(skb), 0, sizeof(struct neighbour_cb));
1624
1625         switch (msg->icmph.icmp6_type) {
1626         case NDISC_NEIGHBOUR_SOLICITATION:
1627                 ndisc_recv_ns(skb);
1628                 break;
1629
1630         case NDISC_NEIGHBOUR_ADVERTISEMENT:
1631                 ndisc_recv_na(skb);
1632                 break;
1633
1634         case NDISC_ROUTER_SOLICITATION:
1635                 ndisc_recv_rs(skb);
1636                 break;
1637
1638         case NDISC_ROUTER_ADVERTISEMENT:
1639                 ndisc_router_discovery(skb);
1640                 break;
1641
1642         case NDISC_REDIRECT:
1643                 ndisc_redirect_rcv(skb);
1644                 break;
1645         }
1646
1647         return 0;
1648 }
1649
1650 static int ndisc_netdev_event(struct notifier_block *this, unsigned long event, void *ptr)
1651 {
1652         struct net_device *dev = netdev_notifier_info_to_dev(ptr);
1653         struct net *net = dev_net(dev);
1654         struct inet6_dev *idev;
1655
1656         switch (event) {
1657         case NETDEV_CHANGEADDR:
1658                 neigh_changeaddr(&nd_tbl, dev);
1659                 fib6_run_gc(0, net, false);
1660                 idev = in6_dev_get(dev);
1661                 if (!idev)
1662                         break;
1663                 if (idev->cnf.ndisc_notify)
1664                         ndisc_send_unsol_na(dev);
1665                 in6_dev_put(idev);
1666                 break;
1667         case NETDEV_DOWN:
1668                 neigh_ifdown(&nd_tbl, dev);
1669                 fib6_run_gc(0, net, false);
1670                 break;
1671         case NETDEV_NOTIFY_PEERS:
1672                 ndisc_send_unsol_na(dev);
1673                 break;
1674         default:
1675                 break;
1676         }
1677
1678         return NOTIFY_DONE;
1679 }
1680
1681 static struct notifier_block ndisc_netdev_notifier = {
1682         .notifier_call = ndisc_netdev_event,
1683 };
1684
1685 #ifdef CONFIG_SYSCTL
1686 static void ndisc_warn_deprecated_sysctl(struct ctl_table *ctl,
1687                                          const char *func, const char *dev_name)
1688 {
1689         static char warncomm[TASK_COMM_LEN];
1690         static int warned;
1691         if (strcmp(warncomm, current->comm) && warned < 5) {
1692                 strcpy(warncomm, current->comm);
1693                 pr_warn("process `%s' is using deprecated sysctl (%s) net.ipv6.neigh.%s.%s - use net.ipv6.neigh.%s.%s_ms instead\n",
1694                         warncomm, func,
1695                         dev_name, ctl->procname,
1696                         dev_name, ctl->procname);
1697                 warned++;
1698         }
1699 }
1700
1701 int ndisc_ifinfo_sysctl_change(struct ctl_table *ctl, int write, void __user *buffer, size_t *lenp, loff_t *ppos)
1702 {
1703         struct net_device *dev = ctl->extra1;
1704         struct inet6_dev *idev;
1705         int ret;
1706
1707         if ((strcmp(ctl->procname, "retrans_time") == 0) ||
1708             (strcmp(ctl->procname, "base_reachable_time") == 0))
1709                 ndisc_warn_deprecated_sysctl(ctl, "syscall", dev ? dev->name : "default");
1710
1711         if (strcmp(ctl->procname, "retrans_time") == 0)
1712                 ret = neigh_proc_dointvec(ctl, write, buffer, lenp, ppos);
1713
1714         else if (strcmp(ctl->procname, "base_reachable_time") == 0)
1715                 ret = neigh_proc_dointvec_jiffies(ctl, write,
1716                                                   buffer, lenp, ppos);
1717
1718         else if ((strcmp(ctl->procname, "retrans_time_ms") == 0) ||
1719                  (strcmp(ctl->procname, "base_reachable_time_ms") == 0))
1720                 ret = neigh_proc_dointvec_ms_jiffies(ctl, write,
1721                                                      buffer, lenp, ppos);
1722         else
1723                 ret = -1;
1724
1725         if (write && ret == 0 && dev && (idev = in6_dev_get(dev)) != NULL) {
1726                 if (ctl->data == &NEIGH_VAR(idev->nd_parms, BASE_REACHABLE_TIME))
1727                         idev->nd_parms->reachable_time =
1728                                         neigh_rand_reach_time(NEIGH_VAR(idev->nd_parms, BASE_REACHABLE_TIME));
1729                 idev->tstamp = jiffies;
1730                 inet6_ifinfo_notify(RTM_NEWLINK, idev);
1731                 in6_dev_put(idev);
1732         }
1733         return ret;
1734 }
1735
1736
1737 #endif
1738
1739 static int __net_init ndisc_net_init(struct net *net)
1740 {
1741         struct ipv6_pinfo *np;
1742         struct sock *sk;
1743         int err;
1744
1745         err = inet_ctl_sock_create(&sk, PF_INET6,
1746                                    SOCK_RAW, IPPROTO_ICMPV6, net);
1747         if (err < 0) {
1748                 ND_PRINTK(0, err,
1749                           "NDISC: Failed to initialize the control socket (err %d)\n",
1750                           err);
1751                 return err;
1752         }
1753
1754         net->ipv6.ndisc_sk = sk;
1755
1756         np = inet6_sk(sk);
1757         np->hop_limit = 255;
1758         /* Do not loopback ndisc messages */
1759         np->mc_loop = 0;
1760
1761         return 0;
1762 }
1763
1764 static void __net_exit ndisc_net_exit(struct net *net)
1765 {
1766         inet_ctl_sock_destroy(net->ipv6.ndisc_sk);
1767 }
1768
1769 static struct pernet_operations ndisc_net_ops = {
1770         .init = ndisc_net_init,
1771         .exit = ndisc_net_exit,
1772 };
1773
1774 int __init ndisc_init(void)
1775 {
1776         int err;
1777
1778         err = register_pernet_subsys(&ndisc_net_ops);
1779         if (err)
1780                 return err;
1781         /*
1782          * Initialize the neighbour table
1783          */
1784         neigh_table_init(NEIGH_ND_TABLE, &nd_tbl);
1785
1786 #ifdef CONFIG_SYSCTL
1787         err = neigh_sysctl_register(NULL, &nd_tbl.parms,
1788                                     ndisc_ifinfo_sysctl_change);
1789         if (err)
1790                 goto out_unregister_pernet;
1791 out:
1792 #endif
1793         return err;
1794
1795 #ifdef CONFIG_SYSCTL
1796 out_unregister_pernet:
1797         unregister_pernet_subsys(&ndisc_net_ops);
1798         goto out;
1799 #endif
1800 }
1801
1802 int __init ndisc_late_init(void)
1803 {
1804         return register_netdevice_notifier(&ndisc_netdev_notifier);
1805 }
1806
1807 void ndisc_late_cleanup(void)
1808 {
1809         unregister_netdevice_notifier(&ndisc_netdev_notifier);
1810 }
1811
1812 void ndisc_cleanup(void)
1813 {
1814 #ifdef CONFIG_SYSCTL
1815         neigh_sysctl_unregister(&nd_tbl.parms);
1816 #endif
1817         neigh_table_clear(NEIGH_ND_TABLE, &nd_tbl);
1818         unregister_pernet_subsys(&ndisc_net_ops);
1819 }